FounderRare: A Novel Statistical Package to Identify Rare Variants in Complex Diseases

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 30,479 characters · extracted from preprint-html · click to expand
FounderRare: A Novel Statistical Package to Identify Rare Variants in Complex Diseases | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search FounderRare: A Novel Statistical Package to Identify Rare Variants in Complex Diseases Samir Oubninte , Simon Girard , Claudia Moreau , Alexandre Bureau doi: https://doi.org/10.1101/2025.09.11.25335516 Samir Oubninte 1 Département de Médecine Sociale et Préventive, Université Laval , Québec City, Québec, Canada Find this author on Google Scholar Find this author on PubMed Search for this author on this site Simon Girard 2 Centre de recherche CERVO , Québec City, Québec, Canada 3 Département des sciences fondamentales, Université du Québec à Chicoutimi , Canada Find this author on Google Scholar Find this author on PubMed Search for this author on this site Claudia Moreau 3 Département des sciences fondamentales, Université du Québec à Chicoutimi , Canada Find this author on Google Scholar Find this author on PubMed Search for this author on this site Alexandre Bureau 1 Département de Médecine Sociale et Préventive, Université Laval , Québec City, Québec, Canada 2 Centre de recherche CERVO , Québec City, Québec, Canada Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: alexandre.bureau{at}fmed.ulaval.ca Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract FounderRare is a statistical package designed for the identification of rare variants in complex diseases. It leverages population genealogies, including those shaped by founder effects and identity-by-descent (IBD) segments, distinguishing it from other tools. This paper serves as a theoretical guide to the FounderRare package, illustrating its operations and capabilities. The package implements an IBD-based approach that computes the number of copies, among affected individuals, of the shared haplotype within genomic regions. The genome is partitioned into regions, within which clusters of affected individuals sharing specific IBD segments are identified. Statistical tests, denoted as S msg and S all , are included to evaluate the enrichment of IBD sharing among affected individuals. These tests rely on simulations of the null distribution and are designed to identify causal regions in the absence of control samples. FounderRare is optimized for cohorts comprising several thousand individuals—sample sizes typically required to achieve sufficient statistical power in rare variant analyses. By utilizing genotype array data, this tool enables cost-effective analysis at scale for researchers investigating complex diseases. It aids in pinpointing genomic regions likely to harbor rare variants, thereby contributing to a deeper understanding of the underlying genetic structure. FounderRare, R package, rare variants, complex diseases, population genealogy, identical-by-descent (IBD) segments 1 Introduction Complex diseases are shaped by an interplay of genetic and environmental elements. Despite the progress in genome-wide association studies (GWAS), a significant portion of the genetic variance of these diseases remains elusive, leading to the so-called “missing heritability” problem [ 1 , 2 ]. One potential explanation for this missing heritability could be the role of rare variants [ 3 ], which are hypothesized to have larger effects but lower frequencies compared to common variants. However, the detection of these rare variants poses a significant challenge due to their low statistical power, high heterogeneity, and limited availability of large sample sizes of whole genome sequences. To address these challenges, we introduce a statistical method that leverages both genealogical and genomic data from a population, including those with a founder effect, to pinpoint rare variants associated with complex diseases [ 4 ]. A population with a founder effect is a group that descends from a limited number of ancestors who possess a subset of the genetic diversity of the original population. Owing to the decreased genetic diversity and increased relatedness, populations with a founder effect are a rich source of rare variants. These rare variants are often shared among relatives and are located on Identical by Descent (IBD) segments, which are genomic regions inherited from a common ancestor without recombination. By tracking these IBD segments within a population, we can deduce recent variants that are passed down the genealogical tree and examine their association with disease phenotypes [ 7 ]. This approach provides a promising avenue to uncover part of the hidden heritability of complex diseases and advance our understanding of their genetic architecture. We have developed FounderRare , an R package that encapsulates our statistical methodology and a statistical measure of the most shared haplotype in a synthetic genomic region among affected individuals, known as S msg . This measure is used in the approach we developed to identify rare variants in populations with a founder effect [ 4 ]. FounderRare accepts IBD clusters as input and subsequently partitions the genome into synthetic genomic regions (SGs), guided by the IBD structure. It then identifies distinct clusters of affected individuals who share a specific SG. Following this, the value of statistical measures like S msg is computed. The effectiveness of FounderRare was evaluated using simulated and real data sets in a separate study [ 4 ]. The simulation of whole genome transmission in a Quebec founder ge-nealogy (sourced from the BALSAC population database, website: https://balsac.uqac.ca/ ) was performed using msprime [ 9 ]. Our approach was then compared with alternative strategies such as the Generalized Linear Mixed Model Association Test (GMMAT) [ 5 ] and the S all measure (an adapted version of S all proposed by Whittemore [ 6 ]). FounderRare can compute this adapted measure of S all . The results indicated that S msg implemented in FounderRare can be more powerful and robust than certain competing IBD segment test statistics, especially in identifying regions that contain a single causal variant. The FounderRare package is complemented by a comprehensive guide that explains its functionalities and presents typical examples of its output. The guide delves into the package installation process, detailing the necessary prerequisites and dependencies. It also provides a catalog of the functions embedded in the package, offering insights into their usage, thereby allowing for package adaptability for future research. Furthermore, the guide demonstrates the application of FounderRare on real datasets. One such dataset, named IBDClusters, is included as an example. This dataset is an output generated by Dash [ 7 ], a tool designed to infer clusters of individuals who are likely to share a single haplotype. 2 Methods and Implementation The FounderRare package is a tool designed to detect rare variants associated with complex diseases within a population with a founder effect, using IBD segments as a proxy. This package offers a set of functions that streamline the analysis process, including the creation of synthetic genomic regions, the examination of IBD structures, and the calculation of the statistic S msg for each SG. To effectively utilize the FounderRare package, it is recommended to acquire IBD clusters from a population with a founder effect. These necessary clusters are used in the output format of the Dash software. We adopted an affected-only strategy, which allowed us to focus on those individuals in the population who exhibited disease traits. Upon identifying IBD clusters using Dash or any other suitable tool, we follow the recommended workflow: Defining Initial Genomic Ranges for SG and Sliding-SG: The SG is defined by its Start and width . The start is the smallest cluster start position on the chromosome. The width is minL × 1000, where minL (default: 400) is the initial length in kilobases, giving an initial width of 400 Kbp. The Sliding-SG is constructed similarly, using a fraction of this width and a different position (see Figure 1 and the tutorial). For each SG, an associated Sliding-SG is created, overlap-ping the SG by half its length. Optional parameters allow users to adjust both SG and Sliding-SG for specific analyses. Analysis of IBD Structure and Generation of the Subsequent SG: This procedure involves identifying and comparing IBD structures between two SGs, specifically an SG and its corresponding Sliding-SG. The process begins with the function IBD structure() , which determines the IBD structure, defined as the set of clusters satisfying a specified overlap criterion within a given genomic range. This iscontrolled by an optional overlap cutoff specifying the minimum proportion of overlap between clusters and the SG range required for inclusion (default: 0.5). The resulting structures are then compared. If the SG and Sliding-SG share the same IBD structure, the SG is extended to the end of the Sliding-SG, and the output includes the extended SG genomic range (returned as a GRanges object, following Bioconductor conventions) and its IBD structure (see Table 1 ). If the structures differ, indicating distinct patterns, a new SG and its associated Sliding-SG are created. The new SG starts at the end of the current SG, with an initial length of 400 Kbp (default value of minL ). Ensuring Disjointedness of IBD Structures: The FounderRare package applies the Tunnel Boring Machine (TBM) principle—an iterative approach that progressively generates or enlarges SGs based on their IBD structures until the end of the chromosome is reached. This ensures that the SG under examination encompasses the farthest of all cluster ends. Once this step is complete, the extraction of disjoint clusters begins. This involves reviewing each SG to determine whether its IBD structure contains overlapping (i.e., non-disjoint) clusters (see Table 2 ). If overlaps are detected, two strategies are available to achieve disjointness. The recommended approach is to retain the clusters with the largest number of individuals among the overlapping clusters [ 4 ]. Alternatively, overlapping clusters can be merged. Computation of Shared SG Statistic: The value of IBS sharing statistics, such as S msg , involves computing the value of for every SG using Equation 1 . To account for varying sample sizes, the S msg statistic can be normalized by the number of affected individuals. where m i represents the number of disjoint clusters in SG i , and represent the number of haplotypes in each cluster ( i = 1, …, I = number of constructed SGs). Download figure Open in new tab Figure 1. Overview of SG Construction: This schematic illustrates the process of identifying and constructing SGs across two successive iterations (Iteration I and Iteration I+1). Horizontal lines, displayed in blue and brown, represent haplotypes shared among clusters of individuals, labeled with unique identifiers (e.g., cl3, cl15, cl22). The lengths of these lines vary, reflecting the diversity of shared haplotypes. Dashed black lines connect clusters that share identical SG start and end points. Percentages along the haplotype segments indicate the proportion of overlap with either the cluster SG or the sliding-SG (represented by the green box labeled “Sliding-SG”). At the bottom of the diagram, SG length is measured, demonstrating that segment lengths can vary across iterations. A vertical brown dashed line highlights an example where the SG length increases by 10 Kbp from Iteration I to Iteration I+1, attributed to the IBD structure of the SG being similar to that of the sliding-SG. Specifically, clusters with SG overlap ≥ 50% also exhibit sliding-SG overlap ≥ 50%. In subsequent iterations, the algorithm is expected to generate a new SG. This figure is reproduced from Oubninte et al . [ 4 ] View this table: View inline View popup Download powerpoint Table 1: SG Data Structure: Data structure for the first two SGs. Each SG is represented as a list containing two components: (i) the genomic range (as a GRanges or IRanges object) and (ii) the clusters included in its IBD structure. One cluster—cl0—appears in overlap between SG 1 and 2. View this table: View inline View popup Download powerpoint Table 2: Disjoint Clusters within SGs: Example of the output generated by the TBMD() function for the first two SGs. Each SG is represented by its genomic range and the corresponding sets of disjoint clusters—namely the input clusters cl0 and cl1, reformatted according to the SG structure. Each cluster consists of individuals sharing a haplotype; the suffix (e.g., .2) indicates the haplotype index for that individual. Additionally, the FounderRare package offers the functionality to preserve SGs with their original IBD structure, as well as the IBD structure with disjoint clusters. This dataset may serve as a foundation for developing new statistical measures that extend or improve upon the concept of the S msg statistic. Essentially, the FounderRare package is a toolkit that has been tested for the investigation of rare variants in complex diseases within a population with a founder effect. We have made available a separate guide on GitHub that details the necessary steps to download, install, and set up the FounderRare package. This guide includes comprehensive code examples to aid first-time users. 3 Practical Application: Harnessing the Power of the FounderRare Package In this section, we illustrate the application of the FounderRare package to identify rare variants in complex diseases by analyzing IBD structures. We provide a step-by-step guide on how to use the functions detailed in the package’s documentation for basic usage. For more comprehensive information, including additional functions and parameters that can be customized to the user’s needs, please refer to the accompanying vignette of the package. It provides detailed information about the function’s purpose and usage, thereby enhancing the user’s grasp of its application. Downloading and Installing FounderRare Package: To successfully download and install the FounderRare package, adhere to the guidelines provided in the vignette document. The required libraries, including GenomicRanges , FounderRare , dplyr , and tidyr , must be loaded as they furnish the necessary tools for effective data manipulation and analysis. Inferring Synthetic Genomic Regions: The inference of SGs can be achieved using the TBM() function, which constructs SGs based on the TBM principle. The function dynamically creates or expands SGs based on their Identity by Descent structures. It accepts several parameters, including IBD clusters (IBDClusters), and various overlap and length parameters. This process involves the utilization of numerous other functions provided by the package. Below is an example of R code to infer SGs using the recommended (default) values: # An example of Identity by Descent clusters information is loaded from the package. # For details on how to read IBD clusters from Dash output files, # please refer to the package’s vignette. data(“IBDClusters”) # Columns containing only NA values are removed from the IBDClusters data frame. IBDClusters = IBDClusters[, colSums(is.na(IBDClusters)) != nrow(IBDClusters)] # The TBM function is called to infer SGs. It uses the IBDClusters and chromosome information, # with default values for other parameters. SGList = TBM(IBDClusters, chr = 22) SGList # This will display the information of the created SG on the console. # The inferred SGs, along with their IBD structure, can be saved in an RData file. # The filename should be specified by the user. # We recommend that you customize the file name and specify the path. saveRDS(SGList, file = paste0(path, “SGList_chr”, chr, “.RData”)) 3. Disjointness in IBD Structures of SGs and S msg Computing: The TBMD() function is designed to transform the non-disjoint clusters present in the output list of SGs (SGList) from the TBM() function into a refined output comprising disjoint clusters. It sequentially examines each SG to determine whether the IBD structure within the SG encompasses non-disjoint clusters. By default, it employs the Disj Clst SG Bigger() function, which converts the IBD structure into disjoint clusters by retaining the clusters with the most individuals among overlapping clusters. # The TBMD() function is used to infer the SG with disjoint clusters. SGListWithDisjCls <-TBMD(SGList, IBDClusters) SGListWithDisjCls # This will display the details of the generated SG in the console. # The output can be saved into an RData file. saveRDS(SGListWithDisjCls, file = paste0(path, “SGListWithDisjCls_chr”, chr, “.RData”)) # The Smsg statistic is computed using the ‘SGListWithDisjCls’ output. outSmsg chr SG cd Start End Smsg #> 1 22 SG1 cd1 18857226 19697181 2 #> 2 22 SG2 cd1 19697182 20147176 3 # The computed Smsg statistic can be written to a csv file. write.table(outSmsg, paste0(SGListWithDisjCls, “.csv”), sep = “,”, quote = FALSE, row.names = FALSE, col.names = TRUE) In the final step, the distribution of S msg under the null hypothesis (H0) is needed. In the absence of controls, Oubninte et al.[ 4 ] used the affected subjects’ genealogy to simulate neutral genetic sequence data under a coalescent model using Msprime. This simulated whole-genome sequencing data is then used to infer clusters. Following this, steps 2 and 3 are applied to each replicate to generate the null distribution for the statistic. S msg is subsequently calculated for the real data. The causal regions that potentially harbor a rare variant are identified as those where the value of S msg exceeds a predetermined quantile of the distribution of S msg under H0. 4 Discussion The FounderRare package equips researchers with advanced tools to investigate the genetic architecture of complex diseases. This package is specifically designed to identify rare genetic variants that contribute to the etiology of these diseases. Noteworthy features include its scalability, possibility to use genotype array data, focus on affected individuals, ability to infer synthetic genomic regions and capacity for rapid chromosome scanning using moderate resources: generating the SGs is a process taking several minutes per chromosome, while ensuring disjointness of IBD structure and computing S msg takes merely a fraction of a second. An additional advantage of this package lies in its ability to recode the outputs of the synthetic genomic regions into a data frame. This feature enables the application of a diverse array of statistical methods specifically designed for common variants, positioning the FounderRare package as a beneficial resource for researchers in the field. Data Availability All data produced in the present study are available upon reasonable request to the authors Code Availability Code to run FounderRare is available on GitHub: https://github.com/oubninte/run_FounderRare . Information about the FounderRare package and its installation is available on https://github.com/oubninte/FounderRare . Funding This work was funded by Natural Sciences and Engineering Research Council of Canada (NSERC) and Canadian Institutes of Health Research (CIHR) Most of the data analyses were performed on computing resources from Compute Canada (now the Digital Research Alliance of Canada). Acknowledgments Example data used for illustration are taken from the Eastern Quebec Schizophrenia and Bipolar Disorder Study. Signed consent was obtained from all participants or from the parents for participants under 18 years of age for collection of all data analyzed here, under the supervision of the University-affiliated neuroscience and mental health ethics committee. We thank M. Maziade (Laval University) for access to data from this study. We are grateful to all participants who enabled this study by contributing their DNA and to the participants who provided family information enabling the reconstruction of their genealogy. Footnotes This version of the manuscript has been revised to correct an issue in the reference list. One of the cited references was missing and had been incorrectly displayed. The reference has now been properly updated. No other changes have been made to the manuscript. References [1]. ↵ Pritchard JK , Cox NJ . 2002 . The allelic architecture of human disease genes: common disease-common variant…or not? Hum. Mol. Genet .. 11 : 2417 – 2423 . OpenUrl CrossRef PubMed Web of Science [2]. ↵ Eichler EE , Flint J , Gibson G , Kong A , Leal SM , Moore JH , Nadeau JH . 2010 . Missing heritability and strategies for finding the underlying causes of complex disease . Nat. Rev. Genet .. 11 : 446 – 450 . OpenUrl CrossRef PubMed Web of Science [3]. ↵ Schork NJ , Murray SS , Frazer KA , Topol EJ . 2009 . Common vs. rare allele hypotheses for complex diseases . Curr. Opin. Genet. Dev .. 19 : 212 – 219 . OpenUrl CrossRef PubMed Web of Science [4]. ↵ Oubninte , S. , Girard , S. , Moreau , C. , Maziade , M. , and Bureau , A. ( 2025 ). Statistical Approach Leveraging Genealogies of Populations with a Founder Effect and Identical by Descent Segments to Identify Rare Variants in Complex Diseases . medRxiv, 2025 . https://www.medrxiv.org/content/early/2025/09/18/2025.09.16.25335588 . DOI: 10.1101/2025.09.16.25335588 OpenUrl Abstract / FREE Full Text [5]. ↵ Chen H , Wang C , Conomos MP , Stilp AM , Li Z , Sofer T , Szpiro AA , Chen W , Brehm JM , Celedón JC et al. 2016 . Control for population structure and relatedness for binary traits in genetic association studies via logistic mixed models . Am. J.Hum. Genet .. 98 : 653 – 666 . OpenUrl PubMed [6]. ↵ Whittemore A. 1996 . Genome scanning for linkage: an overview . Am J Hum Genet . 59 : 704 – 16 . PMID: 8751872 ; PMCID: PMC1914900 . OpenUrl PubMed Web of Science [7]. ↵ Gusev A , Kenny EE , Lowe JK , Salit J , Saxena R , Kathiresan S , Altshuler DM , Friedman JM , Breslow JL , Pe’er I. DASH: a method for identical-by-descent haplotype mapping uncovers association with recent variation . Am J Hum Genet . 2011 Jun 10; 88 ( 6 ): 706 – 717 . doi: 10.1016/j.ajhg.2011.04.023 . Epub 2011 May 27. PMID: 21620352 ; PMCID: PMC3113343 . OpenUrl CrossRef PubMed [8]. Wu MC , Lee S , Cai T , Li Y , Boehnke M , Lin X. Rare-variant association testing for sequencing data with the sequence kernel association test . Am J Hum Genet . 2011 Jul 15; 89 ( 1 ): 82 – 93 . doi: 10.1016/j.ajhg.2011.05.029 . Epub 2011 Jul 7. PMID: 21737059 ; PMCID: PMC3135811 . OpenUrl CrossRef PubMed [9]. ↵ Franz Baumdicker , Gertjan Bisschop , Daniel Goldstein , Graham Gower , Aaron P Ragsdale , Georgia Tsambos , Sha Zhu , Bjarki Eldon , E Castedo Ellerman , Jared G Galloway , Ariella L Gladstein , Gregor Gorjanc , Bing Guo , Ben Jeffery , Warren W Kretzschumar , Konrad Lohse , Michael Matschiner , Dominic Nelson , Nathaniel S Pope , Consuelo D Quinto-Cortés , Murillo F Rodrigues , Kumar Saunack , Thibaut Sellinger , Kevin Thornton , Hugo van Kemenade , Anthony W Wohns , Yan Wong , Simon Gravel , Andrew D Kern , Jere Koskela , Peter L Ralph , Jerome Kelleher , Efficient ancestry and mutation simulation with msprime 1.0 , Genetics , Volume 220 , Issue 3 , March 2022 , iyab229 , doi: 10.1093/genetics/iyab229 OpenUrl CrossRef View the discussion thread. Back to top Previous Next Posted September 23, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following FounderRare: A Novel Statistical Package to Identify Rare Variants in Complex Diseases Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share FounderRare: A Novel Statistical Package to Identify Rare Variants in Complex Diseases Samir Oubninte , Simon Girard , Claudia Moreau , Alexandre Bureau medRxiv 2025.09.11.25335516; doi: https://doi.org/10.1101/2025.09.11.25335516 Share This Article: Copy Citation Tools FounderRare: A Novel Statistical Package to Identify Rare Variants in Complex Diseases Samir Oubninte , Simon Girard , Claudia Moreau , Alexandre Bureau medRxiv 2025.09.11.25335516; doi: https://doi.org/10.1101/2025.09.11.25335516 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Epidemiology Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (299) Cardiovascular Medicine (4425) Dentistry and Oral Medicine (443) Dermatology (382) Emergency Medicine (607) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1507) Epidemiology (15221) Forensic Medicine (30) Gastroenterology (1123) Genetic and Genomic Medicine (6588) Geriatric Medicine (667) Health Economics (997) Health Informatics (4524) Health Policy (1368) Health Systems and Quality Improvement (1612) Hematology (540) HIV/AIDS (1264) Infectious Diseases (except HIV/AIDS) (15910) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (145) Nephrology (667) Neurology (6588) Nursing (346) Nutrition (998) Obstetrics and Gynecology (1143) Occupational and Environmental Health (956) Oncology (3331) Ophthalmology (970) Orthopedics (369) Otolaryngology (420) Pain Medicine (435) Palliative Medicine (129) Pathology (663) Pediatrics (1690) Pharmacology and Therapeutics (691) Primary Care Research (710) Psychiatry and Clinical Psychology (5440) Public and Global Health (9219) Radiology and Imaging (2195) Rehabilitation Medicine and Physical Therapy (1369) Respiratory Medicine (1196) Rheumatology (593) Sexual and Reproductive Health (710) Sports Medicine (529) Surgery (710) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'9ffc2e704b6dc13d',t:'MTc3OTQ1NjY4OA=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00