Conservative evolution of genetic and genomic features in Caenorhabditis becei, an experimentally tractable gonochoristic worm

doi:10.1101/2025.05.09.653148

Conservative evolution of genetic and genomic features in Caenorhabditis becei, an experimentally tractable gonochoristic worm

2025 · doi:10.1101/2025.05.09.653148

preprint OA: closed

📄 Open PDF Full text JSON View at publisher

Full text 110,402 characters · extracted from preprint-html · click to expand

Conservative evolution of genetic and genomic features in Caenorhabditis becei, an experimentally tractable gonochoristic worm | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Conservative evolution of genetic and genomic features in Caenorhabditis becei , an experimentally tractable gonochoristic worm Jose Salome Correa , View ORCID Profile Luke M. Noble , View ORCID Profile Solomon A. Sloat , View ORCID Profile Tuc H. M. Nguyen , View ORCID Profile Matthew V. Rockman doi: https://doi.org/10.1101/2025.05.09.653148 Jose Salome Correa 1 Department of Biology and Center for Genomics & Systems Biology New York University , New York, New York Find this author on Google Scholar Find this author on PubMed Search for this author on this site Luke M. Noble 1 Department of Biology and Center for Genomics & Systems Biology New York University , New York, New York 2 EnviroDNA , Melbourne, Australia Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Luke M. Noble Solomon A. Sloat 1 Department of Biology and Center for Genomics & Systems Biology New York University , New York, New York 3 Department of Biology, University of North Carolina , Chapel Hill, North Carolina Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Solomon A. Sloat Tuc H. M. Nguyen 1 Department of Biology and Center for Genomics & Systems Biology New York University , New York, New York Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Tuc H. M. Nguyen Matthew V. Rockman 1 Department of Biology and Center for Genomics & Systems Biology New York University , New York, New York Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Matthew V. Rockman For correspondence: mrockman{at}nyu.edu Abstract Full Text Info/History Metrics Supplementary material Preview PDF Abstract Caenorhabditis nematodes represent a promising model clade for evolutionary genetics and genomics, but research has focused on the three androdioecious species, those with self-fertile hermaphrodites, all in the Elegans Group of species. The majority of Caenorhabditis species are gonochorists, with males and females, characterized by inconveniently high heterozygosity and inbreeding depression. We have identified C. becei , a Japonica Group species from Panamá, as an experimentally tractable gonochorist. We describe a new chromosomal genome assembly of a healthy inbred C. becei reference strain, integrating data from PacBio HiFi reads, Illumina short reads, genetic linkage, and HiC chromatin contacts, and experimental gene annotation with short- and long-read data. Several genetic properties that are well characterized in the Elegans Group are present in this Japonica Group species: the organization of the genetic map, cosegregation of autosomal indels and sex chromosomes, and segregation distortion due to Medea elements, demonstrated here for the first time in a gonochoristic Caenorhabditis species. Some aspects of the genome are highly conserved, including synteny across the six chromosomes and the distributions of repetitive sequences and genes along each chromosome. Other features are quite distinctive, including evolved shifts in GC composition & heterogeneity along the genome. Both codon & amino acid usage are shifted in concert with the species’ genomic GC content. C. becei has an unusually large X chromosome, which we find is associated with multiple local gene family expansions. These findings and resources lay the foundation for further experimental and computational studies of Caenorhabditis genetics and genomics. INTRODUCTION Caenorhabditis elegans is among our most powerful experimental model organisms, and decades of intensive study have revealed innumerable details about its cellular, molecular, and developmental biology. C. elegans sits within a speciose clade of morphologically similar nematodes that share many features, down to the number and arrangement of cells ( Memar et al. , 2019 ; Zhao et al. , 2008 ). Some pairs of reproductively isolated species completely lack distinguishing morphological features ( Sudhaus & Kiontke, 2007 ). Most Caenorhabditis species share ecological attributes as well, reproducing within patches of decomposing plant matter and feeding on bacteria. Despite the morphological and ecological conservatism of Caenorhabditis nematodes, they are extremely divergent at the sequence level; distantly related Caenorhabditis are more diverged at the level of protein sequences than the most distantly related vertebrates or insects ( Kiontke et al. , 2004 ). The combination of conservation and divergence makes Caenorhabditis a particularly attractive model for comparative genomics and genetics, as factors that can confound evolutionary analysis in other groups – life history, trophic level, body size, and so forth – hardly vary within this clade ( Kiontke et al. , 2011 ; Stevens et al. , 2019 ). Moreover, comparative experimental analysis of many species under identical conditions is straightforward, as more than 70 species are available in culture and compatible with standard laboratory growth conditions ( Daul et al. , 2019 ). Despite these advantages, comparative experimental and population genetics has focused largely on a handful of species closely related to C. elegans , within the Elegans Group in the phylogeny. Further, the bulk of research has focused on the three species, all within the Elegans Group, that exhibit androdioecy, a mating system of self-fertile hermaphrodites and cross-fertile males. To understand which genetic and genomic features of the Caenorhabditis model species are shared more broadly across the clade, we generated a contiguous genome assembly for C. becei , an experimentally advantageous species in the Japonica group, sister to the well-studied Elegans group ( Stevens et al ., 2019 ). We then tested for conservation, convergence, or divergence in a range of genetic and genomic characteristics. C. becei has many useful properties as an experimental representative of both the Japonica Group and gonochoristic (male/female) Caenorhabditis species more broadly. It shares with C. elegans (and most Caenorhabditis ) a compact genome, free of repetitive centromeres or Y-chromosomes, and it is amenable to cryopreservation. It grows well in laboratory culture and so has already proved useful for experimental studies of viral susceptibility, sex ratio, and reproductive biology ( Huang et al ., 2023 ; Lamelza et al ., 2019 ; Shaw & Kennedy, 2022 ). Its genes and genome can be manipulated by microinjection of plasmids or nucleoprotein particles, and it has a rapid generation time, cycling from egg to egg in less than 48 hours at its native temperature of 25°C. C. becei is named for its type locality, Barro Colorado Island (BCI), Panamá ( Stevens et al ., 2019 ). It is a common species in the rainforest of BCI, the most intensively studied tropical forest on earth, and consequently it holds great promise for ecological studies ( Sloat et al ., 2022 ). C. becei ’s greatest virtue, however, and the one that motivated its selection as our model species, is that its populations harbor a relatively modest load of deleterious recessive variants, facilitating construction of healthy and fecund inbred lines (preprint forthcoming). For short-lived small-bodied organisms like nematodes, inbred lines are a critical tool for genetic analysis, allowing experimental replication of genotypes – including outbred genotypes generated by crossing inbred lines ( Andersen & Rockman, 2022 ). C. becei provides a route to genomic analysis of inbreeding depression, a phenomenon absent from the self-fertile species like C. elegans and nearly intractable in hyperdiverse Elegans Group species like C. brenneri and C. remanei ( Adams et al ., 2022 ; Baer et al. , 2010 ; Barrière & Félix, 2005 ; Dolgin et al ., 2007 ), and to quantitative genetic analysis of outcrossing-related traits, including reproductive behaviors that are vestigial in C. elegans . Previously, we reported a short-read draft assembly of C. becei inbred line QG2083 in 1,567 scaffolds ( Stevens et al ., 2019 ), and we subsequently used linkage data to consolidate the reference into a 256-scaffold assembly ( Lamelza et al ., 2019 ). These fragmented assemblies have already proved valuable in comparative studies of gene and regulatory network evolution ( Carelli et al. , 2022 ; Eurmsirilerd & Maduro, 2020 ; Kursel et al ., 2021 ; Maduro, 2020 ; Nelson & Ambros, 2021 ; Fusca et al . 2024 ). Here, we generate a new assembly, with chromosomal scaffolds, for an independent inbred line, QG2082. We integrated data from PacBio HiFi reads, Illumina short reads, genetic linkage, and HiC chromatin contacts. We describe the assembly of the new C. becei reference genome and our experimental and computational annotation of genes and repetitive elements. Taking advantage of C. becei ’s compatibility with laboratory conditions, we also show that several genetic properties that are well characterized in the Elegans Group are conserved with this Japonica Group species: the organization of the genetic map, segregation distortion due to Medea elements, and the pattern of cosegregation of autosomal variants and sex chromosomes. RESULTS C. becei is part of a Neotropical clade of species with narrow ranges To situate C. becei within Caenorhabditis , we used data from 2,059 single-copy orthologs present in at least 80% of 60 Caenorhabditis species to generate the most comprehensive phylogeny of the genus to date ( Figure 1 ). The major outline of the phylogeny, inferred from individual gene trees under the multispecies coalescent model, is largely congruent with previously inferences ( Dayi et al ., 2021 ; Kiontke et al ., 2011 ; Sloat et al ., 2022 ; Stevens et al ., 2019 , 2020 ), with strong support for the Elegans and Japonica Groups and their union in the Elegans Supergroup. Support for the other named groups is also strong, though the branches connecting them to one another are more equivocal. Download figure Open in new tab Figure 1. Phylogeny of Caenorhabditis inferred from protein sequences of 2,059 single-copy orthologs. Gene trees were estimated by maximum likelihood and the species tree estimated under the multispecies coalescent. The unrooted phylogeny is plotted with the root on the branch connecting the Auriculariae Group to the rest of the species ( Dayi et al. , 2021 ; Sloat et al ., 2022 ; Slos et al ., 2017 ; Stevens et al ., 2019 ). Branch lengths are maximum likelihood estimates from the concatenated protein sequences. Named species Groups and Supergroups are indicated. Branch support (quadripartition frequency) is 100% for all branches except where indicated. C. becei falls within a well-supported section of the Japonica Group. The phylogeny shows that C. becei evolved within a clade of species that are endemic to narrow geographic ranges in the neotropics. Each species is known from only a single region ( becei and panamensis from Barro Colorado Island, nouraguensis and macrosperma from French Guiana, yunquensis from Puerto Rico, and waitukubuli from Dominica), though they are often very abundant locally ( Félix et al ., 2014 ; Kiontke et al ., 2011 ; Stevens et al ., 2019 ; Sloat et al. , 2022 ). For example, C. nouraguensis is the single most common species observed in French Guiana ( Félix et al ., 2013 ; Ferrari et al ., 2017 ). The depth of sampling in French Guiana and BCI is sufficient to conclude that the species found at each locale are likely absent from the other ( Sloat et al. , 2022 ). The neotropics are not well sampled otherwise, and many additional species in this clade remain to be discovered. The genome of C. becei We assembled a chromosomally scaffolded reference genome for C. becei strain QG2082 (Table S1). This inbred line was derived by 25 generations of sib-mating from wild-caught isofemale line QG704, isolated in 2012 from a Gustavia superba flower rotting on the forest floor on Barro Colorado Island, and then cryopreserved ( Sloat et al. , 2022 ). Assembly integrated PacBio HiFi long reads, Illumina short reads, linkage data from a genetic cross, and HiC chromatin contact data. The nuclear genome assembly spans 93.9 Mb. DNA sequence statistics, such as GC content, repeat content, and gene density, show symmetrical patterns along the chromosomes and align with recombination rate domains, consistent with good chromosomal completeness and an absence of large-scale assembly errors. Most chromosomes terminate at both ends in oriented telomeric repeat sequences ( Figure S1 ). Chromosomes were assigned identities based on conserved synteny with C. elegans . The mitochondrial genome of C. becei is a 13,708 bp circular molecule encoding 12 protein-coding genes, 2 ribosomal RNAs, and 22 transfer RNAs. The genome shares many features with C. elegans , with identical gene order and minimal intergenic space. Two characteristics of the C. becei genome stand out. First, one chromosome, identified by coverage and synteny as the X chromosome, is much larger than the other chromosomes, almost twice the length of the shortest chromosome and 40% longer than the C. elegans X ( Figure 2 ). Second, the GC content of the genome is unusually high and exceptionally heterogeneous. Download figure Open in new tab Figure 2. C. becei has a small genome but a giant X chromosome. Chromosome sizes are plotted for species of Caenorhabditis with published chromosomally scaffolded genomes. Architecture of the genetic map We characterized the relationship between the genetic map and physical genome, using data from an advanced intercross between inbred lines QG2082 and QG2083 ( Lamelza et al. , 2019 ). These inbred lines were derived from independent isofemale lines collected from localities separated by 3 kilometers. The resulting C. becei recombination landscape, the first for a Caenorhabditis species outside the Elegans group, closely matches the patterns known from C. elegans . Each chromosome has a low-recombination central domain flanked by high recombination arms, and in most cases, small tip regions with little or no recombination ( Figure 3A , Table S2). The no-recombination tips are very small in C. becei , and potentially absent in some cases (or unassembled, although the presence of long telomeric repeats on most chromosomes argues against this). Download figure Open in new tab Figure 3. A. C. becei Marey maps showing effective genetic position (crossovers per chromosome in the G 4 BC 2 mapping cross) as a function of physical position. Gray bars indicate the arm-center boundaries as estimated by segmented linear regression. B. Normalized Marey maps for the six Rhabditid species with complete physical and genetic maps. The phylogeny at right is not to scale; Pristionchus pacificus is very distantly related to Caenorhabditis . The overall pattern of recombination rate variation along the autosomes is largely conserved across the Caenorhabditis species with characterized recombination maps ( Figure 3B ). C. elegans, C. briggsae, and C. tropicalis show concordant domains of zero, high, and low recombination in tips, arms, and centers respectively ( Barnes et al ., 1995 ; Noble et al ., 2021 ; Rockman & Kruglyak, 2009 ; Ross et al ., 2011 ; Stevens et al ., 2022 ); C. remanei is exceptional; it shows the typical arm-center organization but has high recombination in the tips ( Teterina et al. , 2023 ). Distantly related Pristionchus pacificus also shows Caenorhabditis -like domain architecture, despite substantial differences in meiotic machinery ( Rillo-Bohn et al ., 2021 ; Yoshida et al. , 2023 ). C. becei resembles C. elegans and C. briggsae in having a distinct if subtle domain structure on the X chromosome, while other species have idiosyncratic or inverted X chromosome domain structure (though the P. pacificus X chromosome map may be distorted by inversions: Rillo-Bohn et al ., 2021 ). We used segmented linear regression to estimate boundaries between the center and arm domains and to estimate recombination rates for each species (Table S3, Figure S2 ), under the assumption of complete crossover interference (i.e., 50cM chromosomes, as in C. elegans ). C. becei autosome arms have relatively high recombination rates (mean 8.1 cM/Mb, range 6.5-10.9), similar to those of C. tropicalis (mean 8.2 cM/Mb) and C. briggsae (mean 7.8), slightly higher than those of C. elegans (mean 6.5) and much greater than found in C. remanei (mean 3.3 ( Noble et al ., 2021 ; Parée et al. , 2025 ; Rockman & Kruglyak, 2009 ; Ross et al ., 2011 ; Snoek et al. , 2019 ; Teterina et al ., 2023 ). These rates reflect the relative physical lengths of the chromosomes: shorter chromosomes typically have more recombination per physical length. In a naïve regression of arm recombination rate on chromosome length, incorporating all autosome arms from the five Caenorhabditis species, chromosome length explains 35% of the recombination rate variance (p<10 -5 ). The relationship between rate and length is also influenced by the proportion of chromosome with crossover suppression in the center, which varies among species and chromosomes. C. becei autosomes have generally typical center sizes, representing approximately half the chromosome length, with the exception of the unusually long center of chromosome V (63%). However, the degree of crossover suppression in C. becei is unusually strong, with estimated recombination rates of only 0.1 to 0.6 cM/Mb, lower than that observed in other species (Table S3). Given findings from artificially lengthened C. elegans chromosomes ( Libuda et al ., 2013 ), the large size of the C. becei X chromosome may exceed the length over which interference acts, allowing for occasional double crossovers. The observed number of crossovers per X chromosome (0.86) is indeed greater than the number expected under complete interference with our cross design (0.75), though not significantly so ( p = 0.09). On the other hand, the autosomes have fewer crossovers per chromosome (0.99-1.13) than expected (1.25), and the deficit is significant for chromosomes II, III, and IV (2-sided p -values < 0.05). The autosomal deficit may be due to segregation distortion (see below) or to direct selection against recombinant chromosomes. In the absence of these forces, the ratio of X to autosome crossovers that we observe is improbable ( p = 0.0015) if crossover interference on the X is complete. The data are thus equivocal about the possibility of double crossovers on the X, and our advanced intercross experimental design precludes simply counting crossovers to check. Regardless, the C. becei X experiences a relatively low absolute recombination rate, due to its unusual physical length and its hemizygosity in males. Autosomal sex linkage Caenorhabditis nematodes exhibit a remarkable pattern of correlated segregation of sex chromosomes and autosomal insertion-deletion polymorphisms (T. S. Le et al ., 2017 ; Wang et al. , 2010 ). Males in these species have an X0 sex chromosome composition, and autosomal insertions tend to segregate away from the X chromosome and into X-nullosomic sperm. This pattern, known as skew, has been observed in several Elegans-group species and one more distantly related species, C. portoensis , but has not yet been examined in the Japonica group. We generated an autosomally integrated transgene, qgIs7 , which drives strong expression of fluorescent reporters. We tested whether qgIs7 segregated at equal frequencies into male and female progeny of an F 1 male crossed to a wild-type female. The genetic background of all strains is QG2082, and strains are expected to differ only in the presence or absence of the multicopy transgene array on an autosome. Under the skew model, the transgene should disproportionately segregate into sperm that lack an X chromosome, and therefore it will occur in an excess of male offspring and a deficit of female offspring. We observed this pattern (1,719 offspring, Fisher’s Exact Test p = 0.0004). The Transmission Bias Ratio ( Le et al ., 2017 ), the ratio of preferred to unpreferred segregation, is 1.19, similar to values observed in other gonochoristic Caenorhabditis and much lower than in the selfing species. Another way to state these results is that the autosomal insertion is genetically linked to the nullosome at a distance of 45.7±2.4 cM. Segregation distortion due to Medea elements The genetic mapping experiment revealed strong allele frequency skews on two chromosomes, I and III, with the QG2083 allele having increased in frequency in both cases ( Figure 4A ). The simplest model for this pattern is selection favoring alleles that increase developmental rate or brood size. However, QG2082 exhibits both faster development and larger brood sizes than QG2083, implying that selection favoring QG2083 alleles may have a more complicated basis. In all three selfing Caenorhabditis species, transmission-ratio distortion observed in experimental mapping crosses is attributable to parent-by-offspring genetic interactions, where a heterozygous parent (mother for Medea elements, father for Peel elements) damages offspring that are homozygous for the non- Medea/Peel allele ( Ben-David et al ., 2017 , 2021 ; Noble et al ., 2021 ; Rockman, 2025 ; Seidel et al ., 2008 ; Zdraljevic et al ., 2024 ). Download figure Open in new tab Figure 4. Medea alleles cause segregation distortion. A. Allele frequencies among G 4 BC 2 recombinant genomes. Strong distortion of inheritance favoring QG2083 is present on chromosomes I and III. B. Experimental crosses implicate maternal-effect loci that act in heterozygous mothers and cause lethality or arrest in homozygous offspring. The phenotype frequencies of progeny from each of 16 classes of cross are shown in stacked bar charts, with sample size below. Parental genotypes on chromosomes I, III, X, and mitochondrial genomes are colored according to their origins in QG2082 or QG2083, and also indicated by the subscripts 2 or 3, respectively. We performed experimental crosses to test for Medea or Peel activity, and we discovered that QG2083 carries alleles with Medea activity ( Figure 4B ). Only offspring of heterozygous mothers were affected, and the affected offspring were in proportion to the expected fraction homozygous for QG2082 alleles ( Figure S3 ). Offspring of F 1 females x QG2082 males were most severely affected, with less than half of progeny showing wild-type development, while the reciprocal crosses, QG2082 females x F 1 males, showed no impact. By comparing the counts of affected offspring from different classes of crosses, we estimate that the loci on chromosomes I and III are each acting as Medea loci with average penetrances exceeding 50%. The data also show a potential interaction with mitochondrial genotype or a parent-of-origin effect, as also observed for Medea elements in C. tropicalis ( Ben-David et al. , 2017 , 2021 ; Noble et al ., 2021 ), seen in the different patterns in the second and third rows of Figure 4B . Repetitive Element Landscape The genome of C. becei has a low repetitive element content (15%), among the lowest in Caenorhabditis , comparable to C. niphades (11.3%), C. bovis (13%), and C. elegans (18%) ( Sun et al ., 2022 ; Woodruff & Teterina, 2020 ). The most abundant repeats were Tc1-Mariners (6.6%), consistent with their dominance across other Caenorhabditis species ( Woodruff & Teterina, 2020 ). Other abundant repeat types included CACTA elements (1.3%), simple repeats (1.1%), and unclassified repeats (4.2%) ( Figure S4 ). Repetitive elements were more abundant in the arms than in the centers ( Figure S5 ). This non-random distribution of repeats is consistent across most Caenorhabditis species, except for C. inopinata and C. bovis , where a more homogeneous repeat landscape is observed due to the recent expansion of Tc1-Mariner elements ( Woodruff & Teterina, 2020 ). To estimate repetitive element age, we used Kimura distances as a proxy for divergence. Repeat divergence distributions showed no peaks indicative of recent transposon expansion, and we found no evidence of recent repetitive element activity for any repeat type. Gene structure We used two experimental strategies to generate mRNA data for gene annotation. First, we grew mixed-stage mixed-sex populations under five divergent conditions then pooled the worms, extracted RNA, and Illumina-sequenced a stranded mRNA library. Second, we grew mixed-stage mixed-sex populations under two conditions, isolated RNA, and generated long-read Iso-seq data. We integrated these data with protein sequence data from other species to infer gene models. We annotated 24,025 protein-coding genes, and 32.81% of the genome is CDS. We have not annotated non-coding RNAs, though they are likely to be interesting in this species. C. becei lacks the highly conserved miRNA let-7 and may be using other mechanisms to replace its function ( Nelson and Ambros 2021 ). In C. becei , introns and coding sequences (CDS) have very different proportions in chromosomal arms and centers: arms are heavily enriched for intronic DNA, while centers are dense with CDS ( Figure S6 ). In C. niphades , C. becei ’s closest relative with a published chromosomal assembly, introns and CDS are similarly extensive in the arms, but intronic DNA decreases and CDS increases in the centers ( Figure S6 ). Genomic GC Content Among species with chromosomal assemblies, C. becei has genomic GC content that is both high and unusually variable along the chromosomes ( Figure 5 ). The variance in GC content along chromosomes is much greater in C. becei than in the other species with chromosomal assemblies, independent of the scale over which GC% is measured ( Figure S7 ). In C. becei , chromosomes I-IV exhibit notably high GC content in their centers and lower GC content in their arms. In contrast, chromosomes V and X show a more uniform distribution of high GC content along both the center and the arms. Download figure Open in new tab Figure 5. GC content varies along chromosomes and among species. GC% is plotted for non-overlapping 100kb windows along the length of each chromosome, along with loess-fitted lines (degree 2, span 1/8). C. becei is unusual in its high GC content (a trait shared with C. niphades , the other Japonica Group species with a chromosomal assembly) and its high variance, most notably on chromosomes I-IV. In C. becei , the average GC content of features follows a descending order of exon > genomic average > repeat > introns/intergenic regions ( Figure 6 ). This ordering is conserved across species, but the differences are more pronounced in C. becei and Elegans Group species than in C. niphades or C. angaria ( Figure S8 ). In these latter species, GC content is relatively consistent across the chromosomes within each species and across annotation features. Download figure Open in new tab Figure 6. GC content of genomic features in C. becei . GC content was calculated from the counts of G+C divided by the total number of bases of the feature within non-overlapping 10 kb windows along the length of the chromosome with LOESS-fitted lines (span = 0.2). Codon and Amino Acid Usage Distinct patterns of codon usage are observed among Caenorhabditis species, potentially reflecting GC content biases. C. becei and C. niphades have high GC content and use codons with higher GC content, while C. angaria has lower GC content and uses codons with lower GC content ( Figure 7 ). Species in the Elegans group exhibit intermediate codon usage patterns, showing less pronounced deviations compared to the Japonica and Drosophilae groups. Download figure Open in new tab Figure 7. Codon usage and amino acid composition in Caenorhabditis species. A. Relative synonymous codon usage (RSCU). Rows correspond to species, and columns represent codons grouped by amino acid. Tiles represent the RSCU value for each codon in a given species. RSCU values greater than 1.0 indicate codons used more frequently than expected under uniform usage, with higher values shaded in orange and lower values shaded in purple. B. Amino acid usage: Rows correspond to species, with the last row displaying the mean percentage of each amino acid across all species. The mean is calculated by averaging the percentage of each amino acid in the CDS across species. Tiles represent the deviation from the mean amino acid percentage for each species, with the mean calculated separately for each amino acid. Fill colors indicate the direction and magnitude of the deviation: values above the mean are shaded in blue, and values below the mean in red. The intensity of the shading reflects the magnitude of the deviation. The top row shows the average GC% of codons encoding each amino acid. A similar trend is observed in amino acid usage, in which C. becei and C. niphades show positive deviations from the mean for amino acids associated with high GC codons and negative deviations for those linked to low GC codons. In contrast, C. angaria exhibits the opposite pattern, with positive deviations for amino acids associated with low GC codons and negative deviations for those linked to high GC codons ( Figure 7B ). These results suggest that GC content influences both codon and amino acid usage across Caenorhabditis species. Synteny We observe strong synteny between the chromosomes of C. becei and C. elegans ( Figure 8 ), as expected given the well-established conservation of ancestral linkage groups (Nigon elements) in Rhabditid nematodes ( Gonzalez de la Rosa et al. , 2021 ). The most striking feature of the synteny pattern is the absence of 1:1 orthologs in the arms of the C. becei X chromosome. The large size of the X is associated with a sizable increase in gene number on the X chromosome: 5,345 in C. becei compared to 2,877 in C. elegans . Download figure Open in new tab Figure 8. Synteny between C. elegans , C. becei, and C. niphades . Each line connects single-copy orthologues (n=1878). We compared synteny between C. becei and C. niphades, the closest species with a chromosomal assembly, using a set of 1,878 one-to-one orthologs. We found extensive collinearity across all chromosomes, though key differences remained. On Chromosome X, the C. niphades ends are inverted relative to C. becei (equivalently: the chromosomes differ by a giant inversion). The regions that lack single-copy orthologs between C. becei and C. elegans also lack single-copy orthologs in the smaller C. niphades X chromosome. This suggests that the gene duplication on C. becei Chromosome X is a recent, lineage-specific expansion rather than a shared feature of the Japonica group ( Figure 8 ). For Chromosomes I, II, III, and V, inversions were restricted to the central regions, while the arms remained highly collinear. Comparative ortholog analysis reveals widespread gene duplications in C. becei The gross similarities between the C. becei and C. niphades genomes allow us to probe the major differences we have identified between them: C. becei has a bigger genome, with more heterogeneity in GC and feature distribution, and its X has large regions that lack one-to-one orthologs. To understand how gene family evolution contributes to these patterns, we used gene annotations from eight high-quality chromosomal assemblies ( C. angaria, C. becei, C. briggsae, C. elegans, C. inopinata, C. niphades, C. remanei, and C. tropicalis ) to classify genes into orthogroups. Orthogroups were categorized as single-copy, multi-copy, or unassigned. Multi-copy orthogroups contained more than one gene within a species, while single-copy orthogroups included genes that were present as a single copy in a given species but had orthologs in other species. Unassigned orthogroups consisted of genes that were species-specific, with no detectable orthologs in other species. Single-copy genes were similar in number, distribution, and length across the chromosomes of both C. becei and C. niphades , with approximately 1,000 single-copy genes per chromosome, spanning an average length of 3.45 ± 0.24 Mb per chromosome in C. becei and 3.09 ± 0.29 Mb in C. niphades . However, the relative proportion of genome occupied by single-copy genes was lower in C. becei, because multi-copy orthogroups occupy a much larger proportion of its genome ( Figure S9 ). In both species, single-copy genes were most abundant in chromosome centers, less frequent in the arms, and slightly enriched at chromosome tips, following a consistent pattern across all chromosomes ( Figure 9 ). Download figure Open in new tab Figure 9. Distribution of duplicated, single-copy, and unassigned genes across the chromosomes of C. becei and C. niphades . Gene counts are plotted in 100 kb windows across the chromosomes of each species, with LOESS-fitted lines (span = 0.2). Genes are categorized based on orthogroup analysis: multi-copy (black), single-copy (red), and unassigned genes (blue). Multi-copy genes belong to orthogroups with more than one gene in a species. Single-copy genes belong to orthogroups with only one gene in a species. Unassigned genes are single-copy genes that are not assigned to any orthogroup shared with another species. GC content (gold) are the percentage of bases within a 100 kb window that are G+C, with LOESS-fitted lines (span = 0.2). Chromosome arm-center boundaries are plotted as dotted lines. Patterns for multi-copy genes differed among C. becei chromosomes, just as they do for GC content. Chromosomes I–IV are similar in their counts of multi-copy genes (∼1000), while chromosome V and X have substantially more: 1,673 and 2,192 ( Figure 9 ). In contrast, C. niphades has fewer multi-copy genes, ranging from 311 to 487 per chromosome ( Figure 9B ). In C. becei , multi-copy genes tend to be abundant in the transition regions between the arms and centers. The exceptionalism of C. becei chromosomes V and X extends to the unassigned (species-specific) orthogroups as well. The number of unclassified genes per chromosome is comparable between C. niphades and chromosomes I-IV of C. becei , while chromosomes V and X in C. becei carry about 60% more ( Figure 9 ). Overall, comparing the same chromosome between species, chromosomes I-IV differ proportionately in the fraction dedicated to single-copy and unassigned orthogroups and intergenic regions, all of which are longer in C. becei than in C. niphades , while each C. becei chromosome also has extra length due to much higher numbers of genes from multi-copy orthogroups. On C. becei chromosomes V and X, the contributions of unassigned and multi-copy orthogroups are magnified. While the distribution of genes along the chromosomes matches the single-copy distribution on chromosomes I-IV, the pattern on V and X deviates from the single-copy gene distribution due to the higher abundance of multi-copy and unassigned genes in the arms. Within C. becei ’s large X chromosome, genes belonging to orthogroups with the highest gene counts are often clustered, indicating localized expansions or tandem duplications within these gene families ( Figure S10 ). The duplication patterns on chromosome X involve multiple orthogroups, rather than being dominated by a single expanding gene family (Table S4). Functional analysis of the X-chromosome orthogroups identified specific common protein domains. These include “T-box transcription factor, DNA-binding domain,” indicating roles in transcriptional regulation, and “RNA exonuclease REXO1/REXO3/REXO4-like” domains, suggesting functions in RNA processing and turnover (Table S4). However, many orthogroups lacked functional annotations, highlighting substantial genomic novelty on the X, particularly among expanded gene families (Table S4). DISCUSSION Caenorhabditis becei is a promising model for studies of gonochoristic Caenorhabditis , and we here lay the genetic and genomic foundations for future studies. Part of its appeal is its type locality, the intensely studied forests of Barro Colorado Island, Panamá. Our phylogenetic analysis finds C. becei deeply nested within a neotropical radiation of species in the Japonica Group, with close relatives spread across Central and South America and the Caribbean. The Caenorhabditis clade provides a powerful lens into genome evolution, recombination, and species divergence, but most studies have focused on the Elegans group. Draft genomes from its sister, the Japonica group, have revealed generally high GC content and compact genomes ( Stevens et al. , 2019 ; Sun et al. , 2022 ). C. becei now joins C. niphades in representing the Japonica group with chromosomally contiguous assemblies. The C. becei genome is much larger than that of C. niphades , but the two remain highly syntenic and collinear for one-to-one orthologs, suggesting that genome expansion in C. becei is a recent event rather than a shared feature of the Japonica group. The structure of the C. becei genetic map, the first for a Caenorhabditis species outside the Elegans group, is very similar to that observed in the four species with available maps ( Barnes et al. , 1995 ; Noble et al. , 2021 ; Rockman & Kruglyak, 2009 ; Ross et al. , 2011 ; Stevens et al. , 2022 ; Teterina et al. , 2023 ). Recombination is structured into relatively discrete domains, with low recombination in the centers and high recombination in the arms. The most conspicuous departure from other species is the large extent of the low-recombination center on chromosome V, spanning 63% of the chromosome. Another familiar feature of Caenorhabditis genetics is also conserved: the skewed inheritance of autosomal indels with respect to segregation of the X chromosome in male meiosis, which we demonstrated using new strains carrying autosomally integrated fluorescent transgenes. Our genetic map, like those previously generated for the androdioecious Caenorhabditis species, was affected by strong segregation distortion on several chromosomes. We showed that the observed segregation distortion likely reflects the action of multiple Medea elements, which act in heterozygous mothers and cause developmental delays or lethality in offspring that do not inherit them ( Beeman et al. , 1992 ). This is the first demonstration of Medea elements in the Japonica group and in dioecious Caenorhabditis , and it suggests that the striking ubiquity of these genetic elements is a broadly shared feature of Caenorhabditis biology ( Ben-David et al. , 2017 , 2021 ; Noble et al. , 2021 ; Seidel et al. , 2008 ; Zdraljevic et al. , 2024 ), and not a quirk of the androdioecious mating system. In our study, the alternate alleles at the Medea loci are from isofemale lines collected within a few kilometers of one another in 2012, and their evolutionary dynamics are likely to depart substantially from those predicted for primarily selfing lineages ( Rockman 2025 ). At the DNA sequence level, the C. becei genome is distinctive for its high GC content, a feature shared with C. niphades . The elevated GC content influences codon usage bias in C. becei , as demonstrated by comparative analysis across Caenorhabditis : species with higher genomic GC content tend to preferentially use GC-rich codons, a pattern observed in both C. becei and C. niphades ( Figure 7 ). This bias extends beyond codon preferences to amino acid composition: both C. becei and C. niphades preferentially use amino acids encoded by GC-rich codons. Chromosomes I-IV (but not V or X) have dramatic heterogeneity in GC content, very high in centers and tips and very low in the chromosome arms. These arm regions are also dramatically depleted of coding sequences relative to other parts of the genome ( Figure S6 ), and coding sequences are substantially more GC-rich than other classes of sequence. However, the pattern is not driven solely by coding sequence density, as the intronic, intergenic, and repetitive classes of sequence have high GC content outside of the low-GC arms ( Figure 6 ). The extreme variation in GC content along chromosomes I-IV may reflect chromosome-specific mutational processes. Chromosomes V and X differ from the others. They have much more uniform GC content ( Figures 5 & 6 ) and also a more uniform density of coding sequences ( Figure S6 ), in part due to an unusually high number of gene duplications and orphan genes ( Figure 9 ). Orphan genes, which lack detectable homologs in other species, may arise through de novo evolution, rapid divergence, or duplication followed by functional divergence ( Tautz & Domazet-Lošo, 2011 ). Their enrichment on chromosomes V and X suggests that these chromosomes may act as hotspots for lineage-specific gene emergence ( Bouvarel et al. , 2024 ). Chromosomes V and X are also distinctive for their low recombination rates, due to both long physical lengths, a long central domain on V, and X hemizygosity in males. These features correlate with the high number of gene duplications and orphan genes. Gene duplications are most abundant around the arm-center boundaries on chromosome V and in the chromosome arms on the X ( Figure 9 ). The absence of large-scale duplications in chromosome centers does not imply that duplications never arise there but suggests that they may be less likely to be retained. This may be due to strong purifying selection acting on functionally constrained single-copy genes and orphan genes, which dominate these regions. Orphan genes persist in chromosome centers, perhaps via functional integration into essential pathways ( Tautz & Domazet-Lošo, 2011 ). Repeat elements are strongly enriched in chromosome arms and depleted in centers, matching recombination rate variation across the genome. The depletion of repeats in chromosome centers is likely due to strong purifying selection, which removes insertions in these functionally constrained regions ( Woodruff & Teterina, 2020 ). This is similar to the absence of gene duplications in centers, where functionally constrained genes dominate, and disruptive insertions are more likely to be deleterious ( Thomas, 2006 ). The arm-rich, center-poor repeat distribution is also observed in other Caenorhabditis species without recent repeat activity ( Woodruff & Teterina, 2020 ). The C. becei X chromosome is exceptionally large, 40% longer than that of C. elegans ( Figure 2 ) and contains more genes than any other chromosome ( Figure 9 ). The expansion of the X in C. becei suggests unique evolutionary pressures, perhaps involving reduced recombination, sex-specific selection, and dosage-sensitive gene accumulation. Because the X is hemizygous in males, it experiences distinct selection pressures ( Cutter, 2018 ). The absence of a homologous pairing partner prevents recombination in males, reducing the efficiency of purging deleterious mutations while exposing recessive variants to stronger selection. This could result in greater retention of beneficial mutations, including duplicated and orphan genes, if they provide an adaptive advantage ( Maciejowski et al. , 2005 ). The accumulation of duplicated genes in C. becei raises questions about their evolutionary significance and functional relevance. In C. becei , the clustering of gene expansions within orthogroups suggests non-random duplication events, possibly linked to selection for co-regulated gene networks or dosage effects ( Csankovszki et al. , 2004 ; Maciejowski et al. , 2005 ; Strome et al. , 2014 ). Functional analyses of X-linked duplicated genes revealed an overrepresentation of transcription factors and RNA-processing genes, suggesting that at least some of these duplications may play regulatory roles. The C. becei genome represents an appealing model for studies of genome evolution, with interactions between gene duplication, GC content heterogeneity, recombination rate variation, and codon usage biases. The nonrandom chromosomal distribution of gene duplications and orphan genes suggests that selection, recombination, mutation, and genome architecture play key roles in shaping gene retention. Future studies should focus on determining the functional significance of orphan and unclassified genes, particularly those located in chromosome centers and X-linked regions, to assess whether they contribute to adaptive processes, dosage compensation mechanisms, or reproductive functions. Understanding the role of recombination in shaping chromosomal architecture will also be critical, particularly in regions where gene duplications and transposons appear to be accumulating. Comparative analyses with additional Japonica species will provide further insight into which of these patterns are unique to C. becei and which reflect broader evolutionary trends within the clade. METHODS Phylogeny We collected protein sequence data for 57 species from published genomes and transcriptomes and, by permission, from the Caenorhabditis Genome Project ( caenorhabditis.org ). In addition, we generated new data for three undescribed species from Queensland, Australia ( C. sp. 51 , C. sp. 52 , and C. sp 67 ), using RNAseq and de novo transcriptome assembly, exactly as described for C. krikudae in Sloat et al . (2022) . The fastqs and transcriptome assemblies are deposited with NCBI in association with BioProject ID PRJNA1128046. The sources of data for all 60 species are provided in Table S5. To identify a set of single-copy orthologs for phylogenetic analysis, we used BUSCO 5.3.0, ( Seppey et al. , 2019 ), using the nematode_odb10 dataset on each of the protein fasta files. For each protein sequence in its database, BUSCO identifies homologous sequences in the input file and classifies them as single or multicopy. We identified the set of inferred single-copy orthologs present in at least 80% of the species in the dataset and generated multisequence fasta files for each, using busco2fasta ( https://github.com/lstevens17/busco2fasta ). We then used MAFFT 7.475 ( Katoh & Standley, 2013 ) to align the sequences, with default settings. We trimmed these alignments to eliminate poorly aligned regions using TrimAl 1.4.1 ( Capella-Gutiérrez et al. , 2009 ) with settings -gt 0.8 -st 0.001 -resoverlap 0.75 -seqoverlap 80. This process yielded 2,059 alignments. We estimated maximum-likelihood gene trees using IQ-TREE 1.6.12 ( Nguyen et al ., 2015 ) with the LG+I+G model ( Le & Gascuel, 2008 ; Yang, 1994 ). We then estimated a species tree from the collection of gene trees under the coalescent model implemented in ASTRAL-III 5.7.8 ( Zhang et al. , 2018 ). To estimate branchlengths, we used a concatenation of the 2,059 sequence alignments (806,191 amino acid positions), generated with catfasta2phyml ( https://github.com/nylander/catfasta2phyml ) to concatenate the alignments. We then IQ-TREE with the LG+I+G model to fit branch lengths to the ASTRAL tree. We rooted the phylogeny using the Auriculariae Group as the outgroup to the rest of Caenorhabditis ( Sloat et al. , 2022 ). Plots were generated using the ape package ( Paradis & Schliep, 2019 ) in R ( R Core Team, 2024 ). Genome Assembly QG2082 was grown on NGMA plates at 25°. A mixed-stage mixed-sex population was flash frozen in liquid nitrogen and the frozen worm pellet was shipped to the University of Oregon Genome and Cell Characterization Core Facility for HiFi sequencing. Flash-frozen worms were also shipped to Dovetail Genomics (Santa Cruz, CA; https://dovetailgenomics.com ) for Hi-C sequencing with 150bp Illumina reads. Short-read data for QG2082 (Illumina paired-end), QG2083 (Illumina paired-end and mate-paired), and for G 4 BC 2 lines (Illumina paired-end) are described in Lamelza et al . (2019) . We generated assemblies using PacBio HiFi reads (≥Q20) with assemblers Flye ( Kolmogorov et al ., 2019 ), Hifiasm ( Cheng et al ., 2021 ), and Hi-Canu (Nurk et al. , 2020), and Hi-C-scaffolded Flye and Hifiasm assemblies with Juicer ( Durand et al ., 2016 ). As in Noble et al . (2021) , we then evaluated each assembly for consistency with genetic linkage data (implemented in a Snakemake pipeline available at https://github.com/lukemn/becei ), and then closed gaps of estimated 0cM genetic distance where strand-consistent spanning reads from local mapping were available. The final assembly drew partially redundant sequences from two primary assemblies (Flye -m 10 -g 100Mb; Hifiasm -l 0). For chromosomes I, IV and X, sequences from Hi-C scaffolding of the Hifiasm assembly were used to span primary sequences. Each chromosome was iteratively polished with HiFi reads, using calls from DeepVariant ( Poplin et al ., 2018 ) and bcftools norm/consensus (Danacek et al ., 2021), until either no homozygous variants were called, or a local minimum in read mapping error rate was found. Telomeric sequences were counted using R library seqinr ( Charif & Lobry 2007 ). To assemble the C. becei mitochondrial genome, we first mapped Q20- and Q30-filtered PacBio HiFi reads to the C. becei nuclear reference genome using minimap2 (version 2.22; Li 2018 ), and extracted unmapped reads using samtools (version 1.14; Danecek et al. , 2021 ). We then aligned unmapped Q20 reads to the mitochondrial genome of C. nouraguensis (Accession: NC_035250.1 ), using minimap2 to identify mitochondrial reads. Subsequently, we de novo assembled the Q20 mitochondrial reads using Flye (version 2.9.5; Kolmogorov et al. , 2019 ) with a minimum overlap of 1,000 bp, and generated a single circular 13,708 bp contig with high coverage. This draft contig was then used as a reference to map the higher-accuracy Q30 HiFi reads, which we assembled using Flye with a 10 kb minimum overlap, producing a single high-confidence circular contig. This final assembly was annotated using MITOS2 ( Al Arab et al. , 2017 ; Donath et al. 2019 ) and manually curated. The nuclear and mitochondrial genome assemblies and underlying data are available from the NCBI at BioProject PRJNA989223. Genetic Map Data for genetic map construction are described in Lamelza et al . (2019) . For the map described here, we used short-read sequence data from 92 individual G 4 BC 2 populations. Each such population is a pool of worms carrying one unique set of recombinant chromosomes, each the product of several generations of meiosis. Reads were mapped to the QG2082 reference genome and ancestries inferred along each chromosome using MSG ( Andolfatto et al. , 2011 ). The data plotted in Figure 3A are in Table S2. Domain boundary positions for C. becei and other species were estimated by segmented linear regression using the segmented package ( Muggeo, 2008 ). We first interpolated genetic positions for 200 evenly spaced physical positions along each chromosome, then excluded 1 Mb from each end of each chromosome to avoid effects of tip regions, which generally have suppressed recombination and whose boundaries are poorly resolved in most species given the limited available data. We then regressed genetic position on physical position with the constraint that there be three linear segments. Note that domain boundary positions are imprecise, given the modest number of crossovers present in the data; as shown by simulations in ( Rockman & Kruglyak, 2009 ), even in the case of precise boundaries, uniform domains, and relatively large samples of crossovers, the confidence intervals for boundaries are on the order of a megabase. To generate null distributions for crossover counts under the hypothesis of complete interference, we simulated G 4 BC 2 crosses in R (File S1). For comparisons with other species (Table S3 and Figure S2 ), we used the following datasets: C. briggsae 99 F 2 RILs QX1410 x VX34 Stevens et al. , 2022 https://github.com/AndersenLab/briggsae_reference_genome_MS/blob/main/3_recombinationm ap/CB_genetic_map.Rda C. tropicalis 119 F 2 RILs NIC58xJU1373 Noble et al. , 2021 https://github.com/lukemn/tropicalis/blob/master/geneticMap/data/c_tropicalis_flye_geneticMap . rda C. remanei 341 F 2 s PX506 x PX553 Teterina et al. , 2023 https://figshare.com/ndownloader/files/41808561 C. elegans 1045 RIAILs CB4856 x N2 & CB4856 x QX1430 (N2 peel-1(ttTi12715) I npr-1(qg1) X) Brady et al. , 2019 https://github.com/AndersenLab/linkagemapping The X-chromosome map was re-estimated after excluding markers surrounding the npr-1 introgression qg1 in RIAIL sets 2 and 3, which cause a spurious map expansion otherwise. Pristionchus pacificus 93 F2s PS312 x PS1843 Rillo-Bohn et al. , 2021 https://cdn.elifesciences.org/articles/70990/elife-70990-fig8-data1-v2.xlsx We used the P. pacificus oocyte genetic map data only, due to strain-dependent crossover suppression in the male data, likely attributable to inversions. The X data are also distorted in a putatively strain-dependent fashion, as described in Rillo-Bohn et al . (2021) Autosomal Sex Linkage To create a strain with an integrated transgene insertion, we used Gibson cloning to generate plasmids pSAS02 ( Cbr-P plg-1 ::GFPnovo2::unc54utr with the pSM-GFPnovo2 backbone) and pSAS06 ( Cel-P fkh-6 ::mCherry::unc54utr in the pCFJ104 backbone). The backbone plasmids were acquired from Addgene and the final plasmids were verified by Oxford nanopore whole-plasmid sequencing (Plasmidsaurus.com). We PCR-amplified the reporters ( promoter::FP::UTR ) from the plasmids and injected them together into QG2082 and recovered lines transmitting both transgenes. Several hundred L4 animals of a transmitting line were UV irradiated at 500 J/m 2 . Those animals were passaged for 5 generations before backcrossing individuals to QG2082 to screen for Mendelian segregation of the integrated array. Lines positive for integration were backcrossed an additional 12x before homozygosing the integrated array as line QG4602 ( qgIs7 ). Plasmid sequences are provided in File S2. To test for skew, we performed reciprocal crosses between QG2082 and QG4602 under standard conditions at 25°C. We then crossed F 1 males to QG2082 females and collected and scored all progeny laid within timed windows. We observed 343 insertion + males, 278 insertion − males, 507 insertion + females, and 591 insertion − females. The biased sex ratios are consistent with the known bias in C. becei ( Huang et al. , 2023 ). Recombination frequency is estimated as the number of unpreferred-phase gametes (X+insertion or 0+wildtype) out of n = 1,719 total, and the 95% confidence interval is the normal approximation for binomial proportions. Segregation distortion To test for parental-by-offspring genetic interactions ( Medea or Peel ), we performed replicates of the sixteen possible pairwise crosses between four genotypes: QG2082, QG2083, and the F 1 s from each direction of the cross between QG2082 and QG2083. We included all possible F 1 s in order to account for possible effects of mt-DNA or X-linked interactors. The reciprocal F 1 females differ in their mitochondrial genotype, and the reciprocal F 1 males differ in which X chromosome they carry. Under a Medea hypothesis, the only affected individuals will be a subset of the progeny of heterozygous females, specifically those offspring homozygous for QG2082 alleles on the right arm of chromosome I or the center of chromosome III. Under a Peel hypothesis, the only affected individuals will be the comparable subset of the progeny of heterozygous males. A detailed accounting of the expected results under the Medea hypothesis are shown in Figure S3 . Worms were maintained on OP50 E. coli at 25°C during the experiments and for three generations beforehand. For each cross, 9 L4 females and 10 L4 males were transferred to a 6cm plate on day 1 and left to mature and mate overnight. The following day (day 2), females with mating plugs were transferred to individual plates for a 7-hour egg lay period. Crosses were handled in a random order and plates were blinded to genotype for subsequent scoring. After the egg lay, females were then removed and the embryos laid on the plate were counted. On day 3, 18 hours after the end of the egg lay, unhatched embryos and deformed, arrested L1 larvae were counted. The deformed larvae were characteristically arrested in a two- or three-fold posture as if unable to move after hatching. On day 4, 42-48 hours after the end of the egg lay period, wild-type males and females, L4 males and females, and active L1-L3 larvae were counted. At this timepoint all larvae are the product of the original egg lay, as eggs laid by the adult offspring have not yet hatched. Raw count data are reported in Table S6. To summarize the results, counts were pooled by cross and plotted as proportions, with the total being the number of embryos counted on day 2, immediately after the egg lay. In many cases, the sum of unhatched embryos, deformed L1s, developmentally delayed larvae, and wild-type adults was less than the number of embryos present initially. This gap is due in part to the difficulty in observing the small arrested L1 larvae, but it also reflects slight errors in counting each of the classes of embryos and worms. This gap between total embryos counted on day 2 and total offspring accounted for on days 3 and 4 is recorded as “missing” in Figure 4 . Under the two- Medea model, a greater proportion of QG2082-backcross progeny will be affected than F 2 progeny. More specifically, assuming the Medeas have independent (i.e, multiplicative) effects, the difference in affected proportions between these two classes of progeny is an estimator of 1/16 β I + 1/16 β III + 3/16 β I β III , where the β s are the penetrances of the Medea loci on chromosomes I and III. Pooling observations across relevant experiments, we count 517/827 affected offspring in the QG2082 backcrosses and 644/1544 in the F 2 s. The difference in affected proportions is 0.21±0.04 (95% confidence interval calculated via Agresti-Caffo method). If the two Medeas have the same penetrance, the data provide an estimate of the penetrance as 0.77±0.10. Alternatively, if one Medea is completely penetrant, the data imply the other has a penetrance ∼0.59±0.16. Repetitive Element Analysis We generated a redundant set of repetitive element libraries, identified de novo using the tools RepeatModeler ( Flynn et al. , 2020 ), TransposonPSI (B. Haas, 2007 ), LTRharvest ( Ellinghaus et al. , 2008 ), LTRdigest ( Steinbiss et al. , 2009 ), SINE-Scan ( Mao & Wang, 2017 ), SineFinder ( Wenke et al. , 2011 ), TirVish ( Gremme et al. , 2013 ), HelitronScanner ( Xiong et al. , 2014 ), MITE-Tracker ( Crescente et al. , 2018 ), MUSTv2 ( Ge et al. , 2017 ), and MiteFinderII ( Hu et al. , 2018 ). These libraries were merged with nematode-specific repeat libraries from Repbase ( Bao et al. , 2015 ) and Dfam ( Storer et al. , 2021 ) to create a single redundant repeat library. To remove redundancies, we used USEARCH ( Edgar, 2010 ) to cluster the sequences in the library. The resulting non-redundant library was further filtered for any potential non-repeat clusters by using BlastX ( Camacho et al. , 2009 ) to search against nematode-specific proteins and non-coding RNAs. The repeat discovery pipeline was adapted from a protocol previously used to characterize repeats in the C. inopinata genome ( Coghlan et al. , 2018 ; Woodruff & Teterina, 2020 ). To validate this pipeline, we replicated previously reported repeat contents for C. inopinata , C. elegans , C. briggsae , C. nigoni , C. remanei , and C. bovis ( Woodruff & Teterina, 2020 ). We used the hierarchical classification schema applied in other Caenorhabditis species ( Woodruff & Teterina, 2020 ). The non-redundant repetitive element library was classified using multiple tools: RepeatClassifier ( Flynn et al. , 2020 ), Dfam Classifier ( Storer et al. , 2021 ), TransposonUltimate RFSB Classifier (Riehl et al. , 2021), and Geneious Sequence Classifier ( https://www.geneious.com ). We assigned the consensus classification from these tools, with conflicting classifications labeled as “unknown.” Repeat libraries were generated independently for each genome assembly, and each genome was masked with RepeatMasker ( http://www.repeatmasker.org/ ), using only their specific repeat libraries. We used the final RepeatMasker-generated masking results to characterize the genomic repeat landscape at both the global and taxonomic levels. To account for nested repeats, we disjoined the GFF so that each base pair in the genome was assigned to only one TE copy. This allowed us to distinguish between the number of repeat insertions and the number of bases covered by a given repeat taxon ( Anderson et al. , 2019 ). We estimated the age of repetitive elements by calculating Kimura distances ( Kapusta et al. , 2017 ), which measure the divergence of individual repeat copies from their consensus sequence. Kimura distances were extracted from the “.align” file generated by RepeatMasker, and we calculated the mean Kimura distances across non-overlapping 10-kb windows for all repeat taxonomic ranks. Gene Structure QG2082 worms were raised under standard conditions with OP50 E. coli food and then split into five conditions, as described in Sloat et al . (2022) : 1) CemBio bacterial strains ( Dirksen et al. , 2020 ) as food; 2) OP50 and standard conditions; 3) OP50 plus heat stress; 4) OP50 plus cold stress; 5) starvation. Temperature stresses consisted of 35°C or 4°C for 2 hours followed by a 2-hour recovery prior to RNA extraction. Total RNA was isolated using TRIzol following the protocol described in Green & Sambrook (2020) . The mRNA libraries were constructed using the Illumina Stranded mRNA Prep Ligation protocol. These barcoded libraries were then pooled and sequenced using a NextSeq 500 MidOutput 2X150 for 300 cycles. For the Iso-seq RNA extraction, we grew two sets of mixed-stage worms. One was well fed and the other starved for 2 days to generate a mix of dauer, arrested L1s, and starved adults. Worms were washed 5x in M9 to remove bacteria. The resulting pellet was resuspended in a mortar and pestle tube with 100 µL of TriZol and flash frozen in liquid nitrogen. The frozen powder was ground and 900 µL of additional TRIzol was added. The frozen lysate was then repeatedly (x10) thawed at 37°C on a heat block, and vortexed for 30 seconds. Then, 200 µl of chloroform was added per 1 ml TRIzol. The sample was mixed by inversion for 15 seconds before incubation at room temperature for 3 minutes for phase separation. The sample was then spun at 12,000 g for 15 mins at 4°C. The upper aqueous phase was then transferred to a fresh tube. We next added an equal volume of 100% ethanol, mixed by pipetting, and transferred the whole to a Qiagen RNeasy spin column, which was processed according to the manufacturer’s instructions. The resulting RNA was measured with the Qubit and the samples were combined to equal concentrations. The RNA was sent to the Center for Genomic and Computational Biology at Duke University for PacBio Sequel Sequencing. We generated de novo gene models generally following the protocol of Doyle et al . (2020) . RNAseq reads were mapped to the genome using STAR ( Dobin & Gingeras, 2015 ). The resulting BAM was used as hints for BRAKER2 ( Brůna et al. , 2021 ), which trains AUGUSTUS ( Stanke et al. , 2006 ) using ab initio predictions generated by GeneMark-ES ( Ter-Hovhannisyan et al. , 2008 ). Attempts to use mapped Iso-Seq or proteins of closely related Nematodes as input for BRAKER2 yielded poor results. Therefore, only short read RNAseq was used. To better utilize the Iso-Seq data we mapped it to the genome using PASA ( Haas et al. , 2003 ). We then loaded the BRAKER2 annotation into PASA to iteratively update existing annotations based on alignment evidence. We performed two rounds of updates to merge the two annotations following the recommendations of the PASA authors. We incorporated further sources of evidence by mapping C. elegans proteins to the C. becei genome using Exonerate ( Slater & Birney, 2005 ) with an alignment score threshold of 50%. GFFs were subsequently extracted from the exonerate output with Exonerate_to_evm_gff3.pl from EvidenceModeler ( Haas et al. , 2008 ). BRAKER2, PASA, and exonerate annotations were combined using weights of 2, 5, and 2 respectively in EvidenceModeler. The evidence modeler annotations were updated one last time for two rounds in PASA to incorporate additional evidence from long-read transcripts adding any UTR and isoform information that may have been missed or discarded. Genomic GC Content We calculated the GC content with bedtools nuc ( Quinlan & Hall, 2010 ). For analyses by functional class, we used species-specific GFF annotation files and computed base composition for each genomic feature. A nested masking approach was employed, where genomes were first masked for exons and subsequently for repeats, allowing for the separation of intergenic and intronic regions from exonic and repetitive sequences. At each masking step, feature-specific GC content was calculated. To assess localized variations, GC content was then calculated in 10 kb windows across the genome for each feature. Codon and Amino Acid Usage To identify differences in codon preference among Caenorhabditis species, we analyzed the mean Relative Synonymous Codon Usage (RSCU) values ( Sharp & Li, 1986 ). RSCU is a measure of codon bias, indicating how frequently a given codon is used relative to the expected frequency if all synonymous codons for an amino acid were used equally. An RSCU value of 1 suggests that a codon is used at its expected frequency under no bias, whereas values greater than 1 indicate codon preference, and values less than 1 indicate underrepresentation of that codon. Coding sequences for each species were retrieved from FASTA files, and RSCU values were calculated using the uco function from the seqinr package in R ( Charif & Lobry, 2007 ). Amino acid composition was calculated by mapping codons to their corresponding amino acids and summing codon counts for each amino acid across all coding sequences (CDS) in a species. Synteny Analysis To visualize conserved gene order, we identified single-copy orthologs shared among C. becei , C. niphades , and C. elegans and then generated plots connecting the chromosomal positions of these orthologs across species. We found that chromosomes of C. niphades ( Sun et al. , 2022 ) were syntenic with their corresponding chromosomes in C. elegans and C. becei , but the order of the genes along five of the chromosomes (I, II, III, V, and X) was largely inverted, suggesting that the genome fasta for these chromosomes represents the reverse complement relative to the other species. Chromosome IV, in contrast, was highly collinear between C. becei and C. niphades . For the plots in Figure 8 , we reversed the orientation of the five C. niphades chromosomes to maximize the collinearity. Ortholog Identification & Functional Annotation Orthologous gene families were identified using OrthoFinder2 ( Emms & Kelly, 2019 ) with default parameters. The longest coding DNA sequence for each gene across multiple Caenorhabditis species was extracted and used as input. Genes were assigned to orthogroups, representing clusters of orthologous and paralogous genes shared among species. This enabled comparison of gene family expansions, contractions, and species-specific duplications. To assess chromosomal distributions, the positions of single-copy and duplicated orthologs were mapped using the C. becei genome annotation. Gene counts were binned into 100 kb windows, and the distribution of multi-copy, single-copy, and unassigned genes was analyzed across chromosomes. To characterize orthogroups, we calculated gene count and additive length, where additive length represents the sum of all gene lengths within an orthogroup. This approach was used to compare the overall genomic contribution of orthogroups with different copy numbers and to examine patterns of gene family expansion. Functional annotation of coding sequences was performed using InterProScan v5.65 ( Blum et al. , 2021 ), with parameters for nucleotide input, translation, domain prediction, Gene Ontology (GO) assignment, and pathway annotation (interproscan.sh -t n -dp -goterms -pa). InterProScan results were parsed into a non-redundant gene-level table containing the InterPro accession, type, and description, along with associated GO terms and functional descriptions. These annotations were then added to the corresponding gene features in the genome annotation (GFF) file. DATA AVAILABILITY STATEMENT Newly generated transcriptomes used to assemble the phylogeny in Figure 1 are associated with BioProject ID PRJNA1128046. QG2082 HiFi, HiC, Illumina RNAseq, and PacBioIsoseq data used to assemble and annotate the C. becei genome, and the assembly and annotation files, are associated with BioProject PRJNA989223. SUPPLEMENTARY FILES File S1. G 4 BC 2 Simulations. This R script generates samples of chromosomes under the experimental design used to build the genetic map, under the assumption of complete crossover interference. It then tests the fit of the observed crossover number to the simulation results. File S2. Reporter plasmid sequences. Fasta formatted DNA sequences for pSAS02 and pSAS06, plasmids for expression of male-specific GFP and female specific mCherry. SUPPLEMENTARY TABLES Table S1: C. becei nuclear genome assembly statistics. Table S2. The genetic map of C. becei , with physical positions of markers on the genome assembly. Table S3. Domains in C. becei and other species From genetic and physical maps for each chromosome, after excluding the terminal megabase from each end, we used segmented linear regression to identify three recombination-rate domains. The table records the positions of the boundaries (LC and CR, boundaries between the left arm and center and between the center and right arm, respectively), the percent of chromosome length that is in the left arm and tip, center domain, and right arm and tip, and then the recombination rates estimated for each domain from the regression slopes. Note that four of the 36 chromosome maps (6 chromosomes x 6 species) have recombination rate patterns that do not match the expectations of the regression, and the numbers in the table for these are not meaningful. These chromosomes – C. tropicalis X, C. remanei IV and X, and P. pacificus X – are indicated by “No” in the “Domains” column in the table. The P. pacificus X is likely affected by segregating inversions and so may not reflect the meiotic map in structural homozygotes. Table S4. Gene Count and Additive Length Table for top Orthogroups in chromosome X. This table provides the number of genes and the additive length per orthogroup for C. becei . The table includes the orthogroup ID and a brief functional description (if available). Table S5. Transcriptome data sources for the phylogenetic analysis in Figure 1 . Table S6. Medea data. Results of experimental crosses testing for Medea or Peel activity. These are the data underlying Figure 4B . Each row represents one worm’s progeny, indexed in column 1 to its randomly assigned plate number. Columns 2-10 count the numbers of embryos observed after egg lay, unhatched embryos and deformed larvae the next day, and then wild-type adult females, wild-type adult males, L4 females, L4 males, and L1-3 larvae on the subsequent day. Columns 11 and 12 record the genotypes of the parents of the cross, and column 13 records an identifier for which of the 16 classes of cross the row represents. SUPPLEMENTARY FIGURES Download figure Open in new tab Figure S1. Chromosomes end with oriented telomere sequences in most cases. The plot shows stacked histograms of the counts of TTAGGC (blue) and GCCTAA (red), in 100kb bins along each chromosome. The left ends of chromosomes I and III lack telomere sequences. Download figure Open in new tab Figure S2. Domains in C. becei and other species. Marey maps for each of the chromosomes in six species with genetic map data. Vertical lines mark the estimated positions of chromosome domain boundaries. The x-axis is the physical position along the chromosome, in Mb, and the y-axis is the genetic position, in cM, after rescaling each map to 50 cM total length. The x-axis runs from 0 to 26 Mb in each plot, with the exceptions of P. pacificus chromosomes I and IV, which are much longer. As described in Table S2, four chromosome maps (marked with asterisks) do not have the expected domain structure: C. tropicalis X, C. remanei IV and X, and P. pacificus X. Download figure Open in new tab Figure S3. Sixteen Punnett squares showing the expected frequencies of affected progeny under a model of Medea elements on chromosomes I and III in QG2083 that independently affect QG2082-homozygous progeny of heterozygous mothers. Download figure Open in new tab Figure S4. Transposable element superfamilies in C. becei . Each row represents a transposable element (TE) superfamily, grouped by higher-level taxonomic categories and colored by repeat order. Colored boxes next to each superfamily indicate the arm-center difference (Cohen’s d), calculated as the difference in mean repeat density between chromosome arms (normalized position ≥ 0.25) and centers (normalized position < 0.25), divided by the pooled standard deviation. Positive values (red) reflect higher repeat density in chromosome arms, negative values (blue) indicate enrichment in chromosome centers, and values near zero are shown in grey. Numbers within boxes show the percentage of the genome occupied by each superfamily. Download figure Open in new tab Figure S5. Global repetitive element landscape across 10-kb windows along the length of the chromosomes in C. becei . Blue lines show the smoothed trend in repeat density, generated by fitting a generalized additive model to the data. Download figure Open in new tab Figure S6. Genomic feature composition across the chromosomes of C. becei and C. niphades . The proportion of each 100-kb window occupied by coding (CDS, red), intronic (blue), repetitive (green), and intergenic (gray) bases is shown along each chromosome. Bars are stacked to sum to 100% per window. Intergenic regions represent sequence not annotated as CDS, intron, or repeat. Download figure Open in new tab Figure S7. The C. becei genome is unusually variable in its local GC percentage. Here the standard deviation of GC% across the genome is shown as a function of the length scale over which GC is measured, in bins of 1 to 500 kb. The spacing along the x-axis is logged. The nine species shown in comparison to C. becei are those plotted in Figure 5 . Download figure Open in new tab Figure S8. GC content of genomic features in Caenorhabditis species. GC content was calculated from the counts of G+C divided by the total number of bases of the feature within non-overlapping 10 kb windows along the length of the chromosome, with LOESS-fitted lines (span = 0.2). C. elegans here represents the relatively homogenous Elegans Group species. Download figure Open in new tab Figure S9. Chromosome size and ortholog classification of CDS and introns in C. becei and C. niphades . The total length of gene regions (CDS + introns) and intergenic DNA is shown for each chromosome. Gene regions were merged and classified based on orthogroup analysis into four categories: duplicated (red), single-copy (blue), unclassified (purple), and intergenic (gray). Percentages within bars indicate the proportion of each feature relative to chromosome size. Download figure Open in new tab Figure S10. Gene positions along Chromosome X for top orthogroups by count. The figure displays the positions of genes from the orthogroups with highest number of genes in chromosome X of C. becei . Each horizontal blue line represents the start and end positions of genes for a given orthogroup. The x-axis indicates the chromosomal position in megabases (Mb), while the y-axis shows the orthogroup identifiers, sorted by gene count. ACKNOWLEDGMENTS This work was supported by grants GM121828 and GM141906 from the National Institute for General Medical Sciences and HG013015 from National Human Genome Research Institute, and by support from the Zegar Foundation to the NYU GenCore facility. We thank the staff of NYU GenCore, the NYU IT High Performance Computing Team, Maggie Weitzman and the University of Oregon GC3 for HiFi data, Dovetail Genomics for Hi-C data, Duke University Genome Sequencing & Analysis Core for IsoSeq data, Arielle Martel for help in the lab, and the Caenorhabditis Genomes Project and WormBase for data. We thank Lewis Stevens for advice and suggestions. Funder Information Declared National Institute of General Medical Sciences, https://ror.org/04q48ey07 , GM121828 , GM141906 National Human Genome Research Institute, https://ror.org/00baak391 , HG013015 REFERENCES ↵ Adams , P. E. , Crist , A. B. , Young , E. M. , Willis , J. H. , Phillips , P. C. , & Fierst , J. L . ( 2022 ). Slow recovery from inbreeding depression generated by the complex genetic architecture of segregating deleterious mutations . Molecular Biology and Evolution , 39 , msab330 ↵ Al Arab , M. , Höner Zu Siederdissen , C. , Tout , K. , Sahyoun , A.H. , Stadler , P.F. , & Bernt , M. ( 2017 ). Accurate annotation of protein-coding genes in mitochondrial genomes . Mol Phylogenet Evol . 106 : 209 – 216 . OpenUrl CrossRef PubMed ↵ Andersen , E. C. , & Rockman , M. V . ( 2022 ). Natural genetic variation as a tool for discovery in Caenorhabditis nematodes . Genetics 220 , iyab156 ↵ Anderson , S. N. , Stitzer , M. C. , Brohammer , A. B. , Zhou , P. , Noshay , J. M. , O’Connor , C. H. , Hirsch , C. D. , Ross-Ibarra , J. , Hirsch , C. N. , & Springer , N. M . ( 2019 ). Transposable elements contribute to dynamic genome content in maize . The Plant Journal 100 , 1052 – 1065 . OpenUrl CrossRef PubMed ↵ Andolfatto , P. , Davison , D. , Erezyilmaz , D. , Hu , T. T. , Mast , J. , Sunayama-Morita , T. , & Stern , D. L . ( 2011 ). Multiplexed shotgun genotyping for rapid and efficient genetic mapping . Genome Research , 21 , 610 – 617 . OpenUrl Abstract / FREE Full Text ↵ Baer , C. F. , Joyner-Matos , J. , Ostrow , D. , Grigaltchik , V. , Salomon , M. P. , & Upadhyay , A . ( 2010 ). Rapid decline in fitness of mutation accumulation lines of gonochoristic (outcrossing) Caenorhabditis nematodes . Evolution 64 , 3242 – 3253 . OpenUrl CrossRef PubMed Web of Science ↵ Bao , W. , Kojima , K. K. , & Kohany , O . ( 2015 ). Repbase Update, a database of repetitive elements in eukaryotic genomes . Mobile DNA 6 , 11 . OpenUrl CrossRef PubMed ↵ Barnes , T. M. , Kohara , Y. , Coulson , A. , & Hekimi , S . ( 1995 ). Meiotic recombination, noncoding DNA and genomic organization in Caenorhabditis elegans . Genetics , 141 ( 1 ), 159 – 179 . OpenUrl Abstract / FREE Full Text ↵ Barrière , A. , & Félix , M.-A . ( 2005 ). High local genetic diversity and low outcrossing rate in Caenorhabditis elegans natural populations . Current Biology 15 , 1176 – 1184 . OpenUrl CrossRef PubMed Web of Science ↵ Beeman , R. W. , Friesen , K. S. , & Denell , R. E . ( 1992 ). Maternal-effect selfish genes in flour beetles . Science 256 , 89 – 92 . OpenUrl Abstract / FREE Full Text ↵ Ben-David , E. , Burga , A. , & Kruglyak , L . ( 2017 ). A maternal-effect selfish genetic element in Caenorhabditis elegans . Science 356 , 1051 – 1055 . OpenUrl Abstract / FREE Full Text ↵ Ben-David , E. , Pliota , P. , Widen , S. A. , Koreshova , A. , Lemus-Vergara , T. , Verpukhovskiy , P. , Mandali , S. , Braendle , C. , Burga , A. , & Kruglyak , L . ( 2021 ). Ubiquitous selfish toxin-antidote elements in Caenorhabditis species . Current Biology 31 , 990 – 1001 . OpenUrl CrossRef PubMed ↵ Blum , M. , Chang , H.-Y. , Chuguransky , S. , Grego , T. , Kandasaamy , S. , Mitchell , A. , Nuka , G. , Paysan-Lafosse , T. , Qureshi , M. , Raj , S. , Richardson , L. , Salazar , G. A. , Williams , L. , Bork , P. , Bridge , A. , Gough , J. , Haft , D. H. , Letunic , I. , Marchler-Bauer , A. , … Finn , R. D . ( 2021 ). The InterPro protein families and domains database: 20 years on . Nucleic Acids Research , 49 , D344 – D354 . OpenUrl CrossRef PubMed ↵ Bouvarel , L. , Liu , D. , & Zheng , C . ( 2024 ). Visualizing genomic evolution in Caenorhabditis through WormSynteny . BMC Genomics , 25 , 1009 . OpenUrl CrossRef PubMed ↵ Brůna , T. , Hoff , K. J. , Lomsadze , A. , Stanke , M. , & Borodovsky , M . ( 2021 ). BRAKER2: automatic eukaryotic genome annotation with GeneMark-EP+ and AUGUSTUS supported by a protein database . NAR Genomics and Bioinformatics , 3 , lqaa108. ↵ Camacho , C. , Coulouris , G. , Avagyan , V. , Ma , N. , Papadopoulos , J. , Bealer , K. , & Madden , T. L . ( 2009 ). BLAST+: architecture and applications . BMC Bioinformatics 10 , 421 . OpenUrl CrossRef PubMed ↵ Capella-Gutiérrez , S. , Silla-Martínez , J. M. , & Gabaldón , T . ( 2009 ). trimAl: a tool for automated alignment trimming in large-scale phylogenetic analyses . Bioinformatics 25 , 1972 – 1973 . OpenUrl CrossRef PubMed Web of Science ↵ Carelli , F. N. , Cerrato , C. , Dong , Y. , Appert , A. , Dernburg , A. , & Ahringer , J . ( 2022 ). Widespread transposon co-option in the Caenorhabditis germline regulatory network . Science Advances 8 , eabo4082. ↵ Charif , D. , & Lobry , J. R. ( 2007 ). SeqinR 1.0-2: A contributed package to the R project for statistical computing devoted to biological sequences retrieval and analysis . In Structural Approaches to Sequence Evolution (pp. 207 – 232 ). Springer Berlin Heidelberg . ↵ Cheng H , Concepcion GT , Feng X , Zhang H , Li H . ( 2021 ) Haplotype-resolved de novo assembly using phased assembly graphs with hifiasm . Nat Methods 18 , 170 – 175 . OpenUrl CrossRef PubMed ↵ Coghlan , A. , Coghlan , A. , Tsai , I. J. , & Berriman , M . ( 2018 ). Creation of a comprehensive repeat library for a newly sequenced parasitic worm genome . Protocol Exchange . doi: 10.1038/protex.2018.054 OpenUrl CrossRef ↵ Crescente , J. M. , Zavallo , D. , Helguera , M. , & Vanzetti , L. S . ( 2018 ). MITE Tracker: an accurate pproach to identify miniature inverted-repeat transposable elements in large genomes . BMC Bioinformatics , 19 , 348 . OpenUrl CrossRef PubMed ↵ Csankovszki , G. , McDonel , P. , & Meyer , B. J . ( 2004 ). Recruitment and spreading of the C. elegans dosage compensation complex along X chromosomes . Science 303 , 1182 – 1185 . OpenUrl Abstract / FREE Full Text ↵ Cutter , A. D . ( 2018 ). X exceptionalism in Caenorhabditis speciation . Molecular Ecology 27 , 3925 – 3934 . OpenUrl CrossRef ↵ Danecek P , Bonfield JK , Liddle J , Marshall J , Ohan V , Pollard MO , Whitwham A , Keane T , McCarthy SA , Davies RM , Li H . ( 2021 ) Twelve years of SAMtools and BCFtools . Gigascience 10 , giab008. ↵ Daul , A. L. , Andersen , E. C. , & Rougvie , A. E . ( 2019 ). The Caenorhabditis Genetics Center (CGC) and the Caenorhabditis elegans Natural Diversity Resource . In The Biological Resources of Model Organisms (pp. 69 – 94 ). CRC Press . ↵ Dayi , M. , Kanzaki , N. , Sun , S. , Ide , T. , Tanaka , R. , Masuya , H. , Okabe , K. , Kajimura , H. , & Kikuchi , T. ( 2021 ). Additional description and genome analyses of Caenorhabditis auriculariae representing the basal lineage of genus Caenorhabditis . Scientific Reports , 11 6720 . OpenUrl CrossRef PubMed ↵ Dirksen , P. , Assié , A. , Zimmermann , J. , Zhang , F. , Tietje , A.-M. , Marsh , S. A. , Félix , M.-A. , Shapira , M. , Kaleta , C. , Schulenburg , H. , & Samuel , B. S . ( 2020 ). CeMbio - The Caenorhabditis elegans Microbiome Resource . G3 10 , 3025 – 3039 . OpenUrl Abstract / FREE Full Text ↵ Dobin , A. , & Gingeras , T. R . ( 2015 ). Mapping RNA-seq reads with STAR . Current Protocols in Bioinformatics 51 , 11 – 14 . OpenUrl CrossRef ↵ Dolgin , E. S. , Charlesworth , B. , Baird , S. E. , & Cutter , A. D . ( 2007 ). Inbreeding and outbreeding depression in Caenorhabditis nematodes . Evolution 61 , 1339 – 1352 . OpenUrl CrossRef PubMed Web of Science ↵ Donath , A. , Jühling , F. , Al-Arab , M. , Bernhart , S.H. , Reinhardt , F. , Stadler , P.F. , Middendorf , M. , & Bernt , M . ( 2019 ). Improved annotation of protein-coding genes boundaries in metazoan mitochondrial genomes . Nucleic Acids Res . 47 , 10543 – 10552 . OpenUrl CrossRef PubMed ↵ Doyle , S. R. , Tracey , A. , Laing , R. , Holroyd , N. , Bartley , D. , Bazant , W. , Beasley , H. , Beech , R. , Britton , C. , Brooks , K. , Chaudhry , U. , Maitland , K. , Martinelli , A. , Noonan , J. D. , Paulini , M. , Quail , M. A. , Redman , E. , Rodgers , F. H. , Sallé , G. , … Cotton , J. A . ( 2020 ). Genomic and transcriptomic variation defines the chromosome-scale assembly of Haemonchus contortus , a model gastrointestinal worm . Communications Biology 3 , 656 . OpenUrl CrossRef PubMed ↵ Durand NC , Shamim MS , Machol I , Rao SS , Huntley MH , Lander ES , & Aiden EL . ( 2016 ). Juicer provides a one-click system for analyzing loop-resolution Hi-C experiments . Cell Syst . 3 , 95 – 8 . OpenUrl CrossRef PubMed ↵ Edgar , R. C . ( 2010 ). Search and clustering orders of magnitude faster than BLAST . Bioinformatics 26 , 2460 – 2461 . OpenUrl CrossRef PubMed Web of Science ↵ Ellinghaus , D. , Kurtz , S. , & Willhoeft , U . ( 2008 ). LTRharvest, an efficient and flexible software for de novo detection of LTR retrotransposons . BMC Bioinformatics 9 , 18 . OpenUrl CrossRef PubMed ↵ Emms , D. M. , & Kelly , S . ( 2019 ). OrthoFinder: phylogenetic orthology inference for comparative genomics . Genome Biology 20 , 238 . OpenUrl CrossRef PubMed ↵ Eurmsirilerd , E. , & Maduro , M. F . ( 2020 ). Evolution of developmental GATA factors in nematodes . Journal of Developmental Biology 8 , 27 . OpenUrl CrossRef PubMed ↵ Félix , M.-A. , Braendle , C. , & Cutter , A. D . ( 2014 ). A streamlined system for species diagnosis in Caenorhabditis (Nematoda: Rhabditidae) with name designations for 15 distinct biological species . PloS One 9 , e94723 . OpenUrl CrossRef PubMed ↵ Félix , M.-A. , Jovelin , R. , Ferrari , C. , Han , S. , Cho , Y. R. , Andersen , E. C. , Cutter , A. D. , & Braendle , C . ( 2013 ). Species richness, distribution and genetic diversity of Caenorhabditis nematodes in a remote tropical rainforest . BMC Evolutionary Biology 13 , 10 . OpenUrl CrossRef PubMed ↵ Ferrari , C. , Salle , R. , Callemeyn-Torre , N. , Jovelin , R. , Cutter , A. D. , & Braendle , C . ( 2017 ). Ephemeral-habitat colonization and neotropical species richness of Caenorhabditis nematodes . BMC Ecology 17 , 43 . OpenUrl CrossRef PubMed ↵ Flynn , J. M. , Hubley , R. , Goubert , C. , Rosen , J. , Clark , A. G. , Feschotte , C. , & Smit , A. F . ( 2020 ). RepeatModeler2 for automated genomic discovery of transposable element families . Proc Natl Acad Sci USA 117 , 9451 – 9457 . OpenUrl Abstract / FREE Full Text ↵ Fusca , D. D. , Kasimatis , K.R. , Zhu , H. V. , & Cutter , A.D . 2024 . Dynamic birth and death of Argonaute gene family functional repertoire across Caenorhabditis nematodes . bioRxiv doi: 10.1101/2024.10.27.620551 . OpenUrl Abstract / FREE Full Text ↵ Ge , R. , Mai , G. , Zhang , R. , Wu , X. , Wu , Q. , & Zhou , F . ( 2017 ). MUSTv2: an improved de novo detection program for recently active Miniature Inverted Repeat Transposable Elements (MITEs) . Journal of Integrative Bioinformatics 14 , 20170029 . OpenUrl PubMed ↵ Gonzalez de la Rosa , P. M. , Thomson , M. , Trivedi , U. , Tracey , A. , Tandonnet , S. , & Blaxter , M. ( 2021 ). A telomere-to-telomere assembly of Oscheius tipulae and the evolution of rhabditid nematode chromosomes . G3 11 , 1 – 17 . OpenUrl CrossRef PubMed ↵ Green , M. R. , & Sambrook , J . ( 2020 ). Total RNA extraction from Caenorhabditis elegans . Cold Spring Harbor Protocols 2020 , 101683 . OpenUrl CrossRef PubMed ↵ Gremme , G. , Steinbiss , S. , & Kurtz , S . ( 2013 ). GenomeTools: a comprehensive software library for efficient processing of structured genome annotations . IEEE/ACM Transactions on Computational Biology and Bioinformatics 10 , 645 – 656 . OpenUrl CrossRef ↵ Haas , B. ( 2007 ). TransposonPSI: an application of PSI-Blast to mine (retro-) transposon ORF homologies . Broad Institute , Cambridge, MA, USA . https://transposonpsi.sourceforge.net/ ↵ Haas , B. J. , Delcher , A. L. , Mount , S. M. , Wortman , J. R. , Smith , R. K. , Jr . , Hannick , L. I. , Maiti , R. , Ronning , C. M. , Rusch , D. B. , Town , C. D. , Salzberg , S. L. , & White , O . ( 2003 ). Improving the Arabidopsis genome annotation using maximal transcript alignment assemblies . Nucleic Acids Research 31 , 5654 – 5666 . OpenUrl CrossRef PubMed Web of Science ↵ Haas , B. J. , Salzberg , S. L. , Zhu , W. , Pertea , M. , Allen , J. E. , Orvis , J. , White , O. , Buell , C. R. , & Wortman , J. R . ( 2008 ). Automated eukaryotic gene structure annotation using EVidenceModeler and the Program to Assemble Spliced Alignments . Genome Biology 9 , R7 . OpenUrl CrossRef PubMed ↵ Huang , Y. , Lo , Y.-H. , Hsu , J.-C. , Le , T. S. , Yang , F.-J. , Chang , T. , Braendle , C. , & Wang , J . ( 2023 ). Widespread sex ratio polymorphism in Caenorhabditis nematodes . Royal Society Open Science 10 , 221636 . OpenUrl CrossRef PubMed ↵ Hu , J. , Zheng , Y. , & Shang , X . ( 2018 ). MiteFinderII: a novel tool to identify miniature inverted-repeat transposable elements hidden in eukaryotic genomes . BMC Medical Genomics 11 ( Suppl 5 ), 101 . OpenUrl CrossRef PubMed J. Johnson , A. , & F Gomez , D. ( 2020 ). General assembly and alignment in Geneious v1 . doi: 10.17504/protocols.io.bnvfme3n ↵ Kapusta , A. , Suh , A. , & Feschotte , C . ( 2017 ). Dynamics of genome size evolution in birds and mammals . Proc Natl Acad Sci USA 114 , E1460 – E1469 . OpenUrl Abstract / FREE Full Text ↵ Katoh , K. , & Standley , D. M . ( 2013 ). MAFFT multiple sequence alignment software version 7: improvements in performance and usability . Molecular Biology and Evolution 30 , 772 – 780 . OpenUrl CrossRef PubMed Web of Science ↵ Kiontke , K. C. , Félix , M.-A. , Ailion , M. , Rockman , M. V. , Braendle , C. , Pénigault , J.-B. , & Fitch , D. H. A . ( 2011 ). A phylogeny and molecular barcodes for Caenorhabditis , with numerous new species from rotting fruits . BMC Evolutionary Biology 11 , 339 . OpenUrl CrossRef PubMed ↵ Kiontke , K. , Gavin , N. P. , Raynes , Y. , Roehrig , C. , Piano , F. , & Fitch , D. H. A . ( 2004 ). Caenorhabditis phylogeny predicts convergence of hermaphroditism and extensive intron loss . Proc Natl Acad Sci USA 101 , 9003 – 9008 . OpenUrl Abstract / FREE Full Text ↵ Kolmogorov , M. , Yuan , J. , Lin , Y. , & Pevzner , P.A . ( 2019 ). Assembly of long, error-prone reads using repeat graphs . Nat Biotechnol . 37 , 540 – 546 . OpenUrl CrossRef PubMed ↵ Kursel , L. E. , Cope , H. D. , & Rog , O . ( 2021 ). Unconventional conservation reveals structure-function relationships in the synaptonemal complex . bioRxiv . doi: 10.1101/2021.06.16.448737 OpenUrl Abstract / FREE Full Text ↵ Lamelza , P. , Young , J. M. , Noble , L. M. , Caro , L. , Isakharov , A. , Palanisamy , M. , Rockman , M. V. , Malik , H. S. , & Ailion , M . ( 2019 ). Hybridization promotes asexual reproduction in Caenorhabditis nematodes . PLoS Genetics 15 , e1008520 . OpenUrl CrossRef ↵ Le , S. Q. , & Gascuel , O . ( 2008 ). An improved general amino acid replacement matrix . Molecular Biology and Evolution 25 , 1307 – 1320 . OpenUrl CrossRef PubMed Web of Science ↵ Le , T. S. , Yang , F.-J. , Lo , Y.-H. , Chang , T. C. , Hsu , J.-C. , Kao , C.-Y. , & Wang , J. ( 2017 ). Non-Mendelian assortment of homologous autosomes of different sizes in males is the ancestral state in the Caenorhabditis lineage . Scientific Reports 7 , 12819 . OpenUrl CrossRef PubMed ↵ Li , H . ( 2018 ) Minimap2: pairwise alignment for nucleotide sequences , Bioinformatics 34 , 3094 – 3100 . OpenUrl CrossRef PubMed ↵ Libuda , D. E. , Uzawa , S. , Meyer , B. J. , & Villeneuve , A. M . ( 2013 ). Meiotic chromosome structures constrain and respond to designation of crossover sites . Nature 502 , 703 – 706 . OpenUrl CrossRef PubMed Web of Science ↵ Maciejowski , J. , Ahn , J. H. , Cipriani , P. G. , Killian , D. J. , Chaudhary , A. L. , Lee , J. I. , Voutev , R. , Johnsen , R. C. , Baillie , D. L. , Gunsalus , K. C. , Fitch , D. H. A. , & Hubbard , E. J. A . ( 2005 ). Autosomal genes of autosomal/X-linked duplicated gene pairs and germ-line proliferation in Caenorhabditis elegans . Genetics 169 , 1997 – 2011 . OpenUrl Abstract / FREE Full Text ↵ Maduro , M. F . ( 2020 ). Evolutionary dynamics of the SKN-1 → MED → END-1,3 regulatory gene cascade in Caenorhabditis endoderm specification . G3 10 , 333 – 356 . OpenUrl Abstract / FREE Full Text ↵ Mao , H. , & Wang , H . ( 2017 ). SINE_scan: an efficient tool to discover short interspersed nuclear elements (SINEs) in large-scale genomic datasets . Bioinformatics 33 , 743 – 745 . OpenUrl CrossRef PubMed ↵ Memar , N. , Schiemann , S. , Hennig , C. , Findeis , D. , Conradt , B. , & Schnabel , R . ( 2019 ). Twenty million years of evolution: The embryogenesis of four Caenorhabditis species are indistinguishable despite extensive genome divergence . Developmental Biology 447 , 182 – 199 . OpenUrl CrossRef PubMed ↵ Muggeo , V. M. R. ( 2008 ). Segmented: An R package to fit regression models with broken-line relationships . R News 8 , 20 – 25 . OpenUrl ↵ Nelson , C. , & Ambros , V. ( 2021 ). A cohort of Caenorhabditis species lacking the highly conserved let-7 microRNA . G3 11 , jkab022 ↵ Nguyen , L.-T. , Schmidt , H. A. , von Haeseler , A. , & Minh , B. Q. ( 2015 ). IQ-TREE: a fast and effective stochastic algorithm for estimating maximum-likelihood phylogenies . Molecular Biology and Evolution 32 , 268 – 274 . OpenUrl CrossRef PubMed ↵ Noble , L. M. , Rockman , M. V. , & Teotónio , H . ( 2021 ). Gene-level quantitative trait mapping in Caenorhabditis elegans . G3 11 , jkaa061 Noble , L. M. , Yuen , J. , Stevens , L. , Moya , N. , Persaud , R. , Moscatelli , M. , Jackson , J. L. , Zhang , G. , Chitrakar , R. , Baugh , L. R. , Braendle , C. , Andersen , E. C. , Seidel , H. S. , & Rockman , M. V . ( 2021 ). Selfing is the safest sex for Caenorhabditis tropicalis . eLife 10 , e62587 . OpenUrl CrossRef PubMed Nurk S , Walenz BP , Rhie A , Vollger MR , Logsdon GA , Grothe R , Miga KH , Eichler EE , Phillippy AM , Koren S. ( 2019 ). HiCanu: accurate assembly of segmental duplications, satellites, and allelic variants from high-fidelity long reads . Genome Res . 30 , 1291 – 1305 . OpenUrl ↵ Paradis , E. , & Schliep , K . ( 2019 ). ape 5.0: an environment for modern phylogenetics and evolutionary analyses in R . Bioinformatics 35 , 526 – 528 . OpenUrl CrossRef PubMed ↵ Parée , T. , Noble , L. , Roze , D. , & Teotónio , H . ( 2025 ). Selection can favor a recombination landscape that limits polygenic adaptation . Molecular Biology and Evolution 42 , msae273 ↵ Poplin , R. , Chang , P.C. , Alexander , D. , Schwartz , S. , Colthurst , T. , Ku , A. , Newburger , D. , Dijamco , J. , Nguyen , N. , Afshar , P.T. , Gross , S.S. , Dorfman , L. , McLean , C.Y. , & DePristo , M.A . ( 2018 ). A universal SNP and small-indel variant caller using deep neural networks . Nat Biotechnol 36 , 983 – 987 . OpenUrl CrossRef PubMed ↵ Quinlan , A. R. , & Hall , I. M . ( 2010 ). BEDTools: a flexible suite of utilities for comparing genomic features . Bioinformatics 26 , 841 – 842 . OpenUrl CrossRef PubMed Web of Science ↵ R Core Team . ( 2024 ) R: A Language and Environment for Statistical Computing . R Foundation for Statistical Computing , Vienna, Austria . Riehl , K. , Riccio , C. , Miska , E. A. , & Hemberg , M . ( 2022 ). TransposonUltimate: software for transposon classification, annotation and detection . Nucleic Acids Research 50 , gkac136. ↵ Rillo-Bohn , R. , Adilardi , R. , Mitros , T. , Avşaroğlu , B. , Stevens , L. , Köhler , S. , Bayes , J. , Wang , C. , Lin , S. , Baskevitch , K. A. , Rokhsar , D. S. , & Dernburg , A. F . ( 2021 ). Analysis of meiosis in Pristionchus pacificus reveals plasticity in homolog pairing and synapsis in the nematode lineage . eLife 10 , e70990 . OpenUrl CrossRef PubMed ↵ Rockman , M. V . ( 2025 ). Parental-effect gene-drive elements under partial selfing, or why do Caenorhabditis genomes have hyperdivergent regions? Genetics 229 , iyae175. ↵ Rockman , M. V. , & Kruglyak , L . ( 2009 ). Recombinational landscape and population genomics of Caenorhabditis elegans . PLoS Genetics 5 , e1000419 . OpenUrl CrossRef PubMed ↵ Ross , J. A. , Koboldt , D. C. , Staisch , J. E. , Chamberlin , H. M. , Gupta , B. P. , Miller , R. D. , Baird , S. E. , & Haag , E. S . ( 2011 ). Caenorhabditis briggsae recombinant inbred line genotypes reveal inter-strain incompatibility and the evolution of recombination . PLoS Genetics 7 , e1002174 . OpenUrl CrossRef PubMed ↵ Seidel , H. S. , Rockman , M. V. , & Kruglyak , L . ( 2008 ). Widespread genetic incompatibility in C. elegans maintained by balancing selection . Science 319 , 589 – 594 . OpenUrl Abstract / FREE Full Text ↵ Seppey , M. , Manni , M. , & Zdobnov , E. M . ( 2019 ). BUSCO: Assessing genome assembly and annotation completeness . Methods in Molecular Biology 1962 , 227 – 245 . OpenUrl CrossRef PubMed ↵ Sharp , P. M. , & Li , W. H . ( 1986 ). An evolutionary perspective on synonymous codon usage in unicellular organisms . Journal of Molecular Evolution 24 , 28 – 38 . OpenUrl CrossRef PubMed Web of Science ↵ Shaw , C. L. , & Kennedy , D. A . ( 2022 ). Developing an empirical model for spillover and emergence: Orsay virus host range in Caenorhabditis . Proceedings Biological Sciences 289 , 20221165 . OpenUrl CrossRef PubMed ↵ Slater , G. S. C. , & Birney , E . ( 2005 ). Automated generation of heuristics for biological sequence comparison . BMC Bioinformatics 6 , 31 . OpenUrl CrossRef PubMed ↵ Sloat , S. A. , Noble , L. M. , Paaby , A. B. , Bernstein , M. , Chang , A. , Kaur , T. , Yuen , J. , Tintori , S. C. , Jackson , J. L. , Martel , A. , Salome Correa , J. A. , Stevens , L. , Kiontke , K. , Blaxter , M. , & Rockman , M. V . ( 2022 ). Caenorhabditis nematodes colonize ephemeral resource patches in neotropical forests . Ecology and Evolution 12 , e9124 . OpenUrl CrossRef ↵ Slos , D. , Sudhaus , W. , Stevens , L. , Bert , W. , & Blaxter , M . ( 2017 ). Caenorhabditis monodelphis sp. n .: defining the stem morphology and genomics of the genus Caenorhabditis. BMC Zoology 2 , 4 . OpenUrl ↵ Snoek , B. L. , Volkers , R. J. M. , Nijveen , H. , Petersen , C. , Dirksen , P. , Sterken , M. G. , Nakad , R. , Riksen , J. A. G. , Rosenstiel , P. , Stastna , J. J. , Braeckman , B. P. , Harvey , S. C. , Schulenburg , H. , & Kammenga , J. E . ( 2019 ). A multi-parent recombinant inbred line population of C. elegans allows identification of novel QTLs for complex life history traits . BMC Biology 17 , 24 . OpenUrl CrossRef PubMed ↵ Stanke , M. , Keller , O. , Gunduz , I. , Hayes , A. , Waack , S. , & Morgenstern , B . ( 2006 ). AUGUSTUS: ab initio prediction of alternative transcripts . Nucleic Acids Research 34 , W435 – W439 . OpenUrl CrossRef PubMed Web of Science ↵ Steinbiss , S. , Willhoeft , U. , Gremme , G. , & Kurtz , S . ( 2009 ). Fine-grained annotation and classification of de novo predicted LTR retrotransposons . Nucleic Acids Research 37 , 7002 – 7013 . OpenUrl CrossRef PubMed Web of Science ↵ Stevens , L. , Félix , M.-A. , Beltran , T. , Braendle , C. , Caurcel , C. , Fausett , S. , Fitch , D. , Frézal , L. , Gosse , C. , Kaur , T. , Kiontke , K. , Newton , M. D. , Noble , L. M. , Richaud , A. , Rockman , M. V. , Sudhaus , W. , & Blaxter , M . ( 2019 ). Comparative genomics of 10 new Caenorhabditis species . Evolution Letters 3 , 217 – 236 . OpenUrl CrossRef PubMed ↵ Stevens , L. , Moya , N. D. , Tanny , R. E. , Gibson , S. B. , Tracey , A. , Na , H. , Chitrakar , R. , Dekker , J. , Walhout , A. J. M. , Baugh , L. R. , & Andersen , E. C . ( 2022 ). Chromosome-level reference genomes for two strains of Caenorhabditis briggsae : An improved platform for comparative genomics . Genome Biology and Evolution 14 , evac042. ↵ Stevens , L. , Rooke , S. , Falzon , L. C. , Machuka , E. M. , Momanyi , K. , Murungi , M. K. , Njoroge , S. M. , Odinga , C. O. , Ogendo , A. , Ogola , J. , Fèvre , E. M. , & Blaxter , M . ( 2020 ). The genome of Caenorhabditis bovis . Current Biology 30 , 1023 – 1031 . OpenUrl CrossRef PubMed ↵ Storer , J. , Hubley , R. , Rosen , J. , Wheeler , T. J. , & Smit , A. F . ( 2021 ). The Dfam community resource of transposable element families, sequence models, and genome annotations . Mobile DNA 12 , 2 . OpenUrl CrossRef PubMed ↵ Strome , S. , Kelly , W. G. , Ercan , S. , & Lieb , J. D. ( 2014 ). Regulation of the X chromosomes in Caenorhabditis elegans . Cold Spring Harbor Perspectives in Biology 6 , a018366 . OpenUrl Abstract / FREE Full Text ↵ Sudhaus , W. , & Kiontke , K . ( 2007 ). Comparison of the cryptic nematode species Caenorhabditis brenneri sp. n. and C. remanei (Nematoda: Rhabditidae) with the stem species pattern of the Caenorhabditis Elegans group . Zootaxa 1456 , 45 – 62 . OpenUrl ↵ Sun , S. , Kanzaki , N. , Dayi , M. , Maeda , Y. , Yoshida , A. , Tanaka , R. , & Kikuchi , T . ( 2022 ). The compact genome of Caenorhabditis niphades n. sp ., isolated from a wood-boring weevil, Niphades variegatus . BMC Genomics 23 , 765 . OpenUrl CrossRef PubMed ↵ Tautz , D. , & Domazet-Lošo , T . ( 2011 ). The evolutionary origin of orphan genes . Nature Reviews Genetics 12 , 692 – 702 . OpenUrl CrossRef PubMed ↵ Ter-Hovhannisyan , V. , Lomsadze , A. , Chernoff , Y. O. , & Borodovsky , M . ( 2008 ). Gene prediction in novel fungal genomes using an ab initio algorithm with unsupervised training . Genome Research 18 , 1979 – 1990 . OpenUrl Abstract / FREE Full Text ↵ Teterina , A. A. , Willis , J. H. , Lukac , M. , Jovelin , R. , Cutter , A. D. , & Phillips , P. C . ( 2023 ). Genomic diversity landscapes in outcrossing and selfing Caenorhabditis nematodes . PLoS Genetics 19 , e1010879 . OpenUrl CrossRef PubMed ↵ Thomas , J. H . ( 2006 ). Analysis of homologous gene clusters in Caenorhabditis elegans reveals striking regional cluster domains . Genetics 172 , 127 – 143 . OpenUrl Abstract / FREE Full Text ↵ Wang , J. , Chen , P.-J. , Wang , G. J. , & Keller , L . ( 2010 ). Chromosome size differences may affect meiosis and genome size . Science 329 , 293 . OpenUrl Abstract / FREE Full Text ↵ Wenke , T. , Döbel , T. , Sörensen , T. R. , Junghans , H. , Weisshaar , B. , & Schmidt , T . ( 2011 ). Targeted identification of short interspersed nuclear element families shows their widespread existence and extreme heterogeneity in plant genomes . The Plant Cell 23 , 3117 – 3128 . OpenUrl Abstract / FREE Full Text ↵ Woodruff , G. C. , & Teterina , A. A . ( 2020 ). Degradation of the repetitive genomic landscape in a close relative of Caenorhabditis elegans . Molecular Biology and Evolution 37 , 2549 – 2567 . OpenUrl CrossRef PubMed ↵ Xiong , W. , He , L. , Lai , J. , Dooner , H. K. , & Du , C . ( 2014 ). HelitronScanner uncovers a large overlooked cache of Helitron transposons in many plant genomes . Proc Natl Acad Sci USA 111 , 10263 – 10268 . OpenUrl Abstract / FREE Full Text ↵ Yang , Z . ( 1994 ). Maximum likelihood phylogenetic estimation from DNA sequences with variable rates over sites: approximate methods . Journal of Molecular Evolution 39 , 306 – 314 . OpenUrl CrossRef PubMed Web of Science ↵ Yoshida , K. , Rödelsperger , C. , Röseler , W. , Riebesell , M. , Sun , S. , Kikuchi , T. , & Sommer , R. J . ( 2023 ). Chromosome fusions repatterned recombination rate and facilitated reproductive isolation during Pristionchus nematode speciation . Nature Ecology & Evolution 7 , 424 – 439 . OpenUrl PubMed ↵ Zdraljevic , S. , Walter-McNeill , L. , Bruni , G. N. , Bloom , J. S. , Leighton , D. H. W. , Collins , J. B. , Marquez , H. , Alexander , N. , & Kruglyak , L . ( 2024 ). Divergent C. elegans toxin alleles are suppressed by distinct mechanisms . bioRxiv doi: 10.1101/2024.04.26.591160 . OpenUrl Abstract / FREE Full Text ↵ Zhang , C. , Rabiee , M. , Sayyari , E. , & Mirarab , S . ( 2018 ). ASTRAL-III: polynomial time species tree reconstruction from partially resolved gene trees . BMC Bioinformatics 19 ( Suppl 6 ), 153 . OpenUrl CrossRef PubMed ↵ Zhao , Z. , Boyle , T. J. , Bao , Z. , Murray , J. I. , Mericle , B. , & Waterston , R. H . ( 2008 ). Comparative analysis of embryonic cell lineage between Caenorhabditis briggsae and Caenorhabditis elegans . Developmental Biology 314 , 93 – 99 . OpenUrl CrossRef PubMed Web of Science View the discussion thread. Back to top Previous Next Posted May 15, 2025. Download PDF Supplementary Material Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Conservative evolution of genetic and genomic features in Caenorhabditis becei, an experimentally tractable gonochoristic worm Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Conservative evolution of genetic and genomic features in Caenorhabditis becei , an experimentally tractable gonochoristic worm Jose Salome Correa , Luke M. Noble , Solomon A. Sloat , Tuc H. M. Nguyen , Matthew V. Rockman bioRxiv 2025.05.09.653148; doi: https://doi.org/10.1101/2025.05.09.653148 Share This Article: Copy Citation Tools Conservative evolution of genetic and genomic features in Caenorhabditis becei , an experimentally tractable gonochoristic worm Jose Salome Correa , Luke M. Noble , Solomon A. Sloat , Tuc H. M. Nguyen , Matthew V. Rockman bioRxiv 2025.05.09.653148; doi: https://doi.org/10.1101/2025.05.09.653148 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Evolutionary Biology Subject Areas All Articles Animal Behavior and Cognition (7640) Biochemistry (17706) Bioengineering (13902) Bioinformatics (41978) Biophysics (21465) Cancer Biology (18611) Cell Biology (25528) Clinical Trials (138) Developmental Biology (13387) Ecology (19920) Epidemiology (2067) Evolutionary Biology (24332) Genetics (15615) Genomics (22519) Immunology (17747) Microbiology (40424) Molecular Biology (17194) Neuroscience (88662) Paleontology (667) Pathology (2838) Pharmacology and Toxicology (4827) Physiology (7650) Plant Biology (15160) Scientific Communication and Education (2046) Synthetic Biology (4302) Systems Biology (9826) Zoology (2271)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00