Recovering ecological interactions by mining non-target data from whole genome re-sequencing projects

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 61,496 characters · extracted from preprint-html · click to expand
Recovering ecological interactions by mining non-target data from whole genome re-sequencing projects | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Recovering ecological interactions by mining non-target data from whole genome re-sequencing projects View ORCID Profile Mirkka Jones , View ORCID Profile Pasi Rastas , View ORCID Profile J. Camilo Chacón-Duque , View ORCID Profile Michelle F. DiLeo , Abhilash Nair , View ORCID Profile Vicencio Oostra , View ORCID Profile Marjo Saastamoinen , View ORCID Profile Anne Duplouy doi: https://doi.org/10.1101/2025.01.17.633498 Mirkka Jones 1 Organismal and Evolutionary Biology Research Program, Faculty of Biological and Environmental Sciences, University of Helsinki , Helsinki, Finland 2 Research services, Aalto University , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Mirkka Jones Pasi Rastas 3 Institute of Biotechnology, University of Helsinki , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Pasi Rastas J. Camilo Chacón-Duque 4 Centre for Palaeogenetics, Stockholm University , Stockholm, Sweden 5 Department of Zoology, Stockholm University , Stockholm, Sweden Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for J. Camilo Chacón-Duque Michelle F. DiLeo 6 Ontario Ministry of Natural Resources and Forestry , Ontario, Canada Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Michelle F. DiLeo Abhilash Nair 1 Organismal and Evolutionary Biology Research Program, Faculty of Biological and Environmental Sciences, University of Helsinki , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site Vicencio Oostra 7 School of Biological and Behavioural Sciences, Queen Mary University of London , London, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Vicencio Oostra Marjo Saastamoinen 1 Organismal and Evolutionary Biology Research Program, Faculty of Biological and Environmental Sciences, University of Helsinki , Helsinki, Finland 8 Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Marjo Saastamoinen Anne Duplouy 1 Organismal and Evolutionary Biology Research Program, Faculty of Biological and Environmental Sciences, University of Helsinki , Helsinki, Finland 8 Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Anne Duplouy For correspondence: anne.duplouy{at}helsinki.fi Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract The study of parasitic species can shed light on aspects of their host’s ecology. Such interactions are however often unknown or understudied due to the difficulty to detect and/or quantify many infections. Whole-genome sequencing and re-sequencing data have been generated at an increasing rate and reduced costs over the last two decades. Projects based on whole organisms, like whole insect specimens, provide genomic material for the target taxon, but may also include sequencing reads from associated microbes and other parasites. Here, we screened for the presence of non-host reads in a collection of whole-genome (re-) sequence projects from the Glanville fritillary butterfly, Melitaea cinxia, a model organism in research on the ecology and evolution of species in spatially structured and fragmented landscapes. We identified infections with different bacteria and eukaryotic parasites, which are shared between populations and underly both previously known and new biotic interactions for this butterfly species. The bacterial symbiont Wolbachia , usually common in insects, was found at relatively low prevalence, while Spiroplasma was ubiquitous across samples from several European populations of the butterfly. Additionally, we confirmed expected rates of larval parasitism by at least two parasitoid wasps. Such results provide proof of principle that key ecological interactions can be uncovered efficiently from existing data, an important first step to characterising the role host-associated organisms play in shaping the ecology and evolutionary history of their host species. Introduction Whether costly or beneficial, infections can have large impacts on their hosts’ life-histories, population dynamics and genetic diversity ( Glasl et al. 2016 ; Hochachka et al. 2021 ; Rogowski et al. 2020 ; Tollenaere et al. 2014 ). For example, In the Åland Islands, the infection of 10% or more of all available Melitaea cinxia butterfly larvae by the parasitoid wasp Cotesia melitaearum can severely affect local butterfly host populations (Lei et al. 1997a; Shaw et al. 2009 ), while neighbouring populations might remain unaffected by the parasitoid (Lei et al. 1997b; van Nouhuys 2016 ). Similarly, bacterial symbionts that are maternally transmitted, such as Wolbachia and Spiroplasma , can manipulate diverse host life-histories and other reproductive traits ( Correa & Ballard 2016 ; Duplouy & Hornett 2018 ). They can, for example, induce cytoplasmic incompatibility (CI) between infected males and uninfected females ( Charlat et al. 2006 ; Hornett et al. 2008 ; Koehncke et al. 2009 ; Pollmann et al. 2022 ), or protect their host against pathogens ( Teixeira et al. 2008 ; Łukasik et al. 2013 ), thus boosting the reproductive output of the symbiont-infected females compared to uninfected ones. These manipulations facilitate the spread of the symbiont through the host population, and in turn lead to a reduction in the genetic diversity of their host, as host infected mitochondrial haplotypes hitchhike successful infections ( Charlat et al. 2009 ; Deng et al. 2021 ; Graham & Wilson 2012 ). Such infections are, however, not always included in ecological and evolutionary studies of host species, as they often remain hidden because they may be tricky to detect and not always abundant across their host geographical distribution. The development of next-generation sequencing methods has allowed the birth of metagenomics, which aims to sequence and analyse the reads from both a targeted host and its diverse associated organisms. In insects, metagenomic analyses from whole-body sequencing projects have, for example, identified a wide diversity of previously hidden, or difficult to study or culture bacterial endosymbionts ( i.e ., microbes that live inside host cells or tissues)( Gibson et al. 2014 ; Twort et al. 2022 ; Vancaester & Blaxter 2023 ). These studies have revealed key ecological and evolutionary species-interactions ( Chellappan & Ranjith 2021 ; Liang et al. 2020 ; Vancaester & Blaxter 2023 ), and provide insights into many complex species-interactions, including the taxonomic identity and genetic diversity of associated species, their prevalence and biogeography, as well as their function ( Ghanavi et al. 2021 ; Susi et al. 2019 ; Zhang et al. 2018 ). Nonetheless, despite the dramatic effects that infections can have on their hosts, and despite the development of metagenomic approaches, whole-genome projects rarely include analyses investigating the metagenome of the targeted host species. Consequently, many infections remain uncharacterized, significantly limiting the conclusions drawn from studies of their host populations. The Glanville fritillary butterfly, Melitaea cinxia , is a well-known model-species for the study of the eco-evolutionary consequences of habitat fragmentation on wild species ( Duplouy et al. 2013 ; Hanski & Heino 2003 ; Kahilainen et al. 2018 ). The species is widespread across Eurasia, where it is known to feed on a few host plant species ( Hanski et al. 2004 ), including the ribwort plantain, Plantago lanceolata . In particular, a metapopulation of the butterfly in the Åland Islands, an archipelago between the coast of Finland and Sweden in the Baltic Sea, has been the focus of 30 years of ecological and evolutionary dynamics studies ( Ojanen et al. 2013 ; Saastamoinen 2022 ). Studies of this butterfly metapopulation have been complemented by studies of their associated community of specialized parasitoid wasps (Lei et al. 1997a; van Nouhuys et al. 2012 ), as well as a handful of recent microbiota studies ( Duplouy et al. 2018 ; Duplouy et al. 2020a ; Minard et al. 2019 ; Rosa et al. 2019 ). The rearing of field-collected M. cinxia larvae in the laboratory shows that parasitoid wasps emerge each year from about 30% of the larvae ( Montovan et al. 2015 ), and that the presence of a parasitoid infection affects the species composition of the larval gut microbiota ( Minard et al. 2019 ). Although these results have provided insights on trophic and symbiotic interactions within this ecological system (Lei et al. 1997a; van Nouhuys et al. 2012 ), several aspects of these interactions remain unclear. For example, it is unclear whether all parasitism attempts are successful, or whether the parasitoid emergence rate only represents a fraction of the parasitoid eggs laid. The exceptionally detailed understanding of the ecology of M. cinxia has recently been complemented with a large amount of genetic and genomic information, including three high-quality versions of the whole genome and chromosomal assembly of the butterfly species ( Ahola et al. 2014 ; Smolander et al. 2022 ; Vila et al. 2021 ), and ongoing population re-sequencing studies. Here, we analyse several M. cinxia genomic datasets as a source of non-target genomic material reflecting diverse prokaryotic and eukaryotic infections in larvae and adult butterflies from the Åland Islands (Finland), as well as from adults collected across Europe and North-Africa (France, Morocco, Spain, Switzerland). Specifically, we investigate presence, prevalence and geographical range of an array of parasites, including the common endosymbiotic bacteria Wolbachia and Spiroplasma , and the Cotesia and Hyposoter larval parasitoids. The detection of microbial symbiont species provides the foundation for further characterizing how they might affect the population dynamics and genetics of their host species. Detected parasitoid infection rates, in turn, provide information on both the prevalence and the potential amplitude of their impacts on butterfly host populations. Materials and Methods a) Origin of raw sequence data The Glanville fritillary butterfly, Melitaea cinxia (Linnaeus, 1758), is a widespread checkerspot species across Europe, and the model organism for 30 years of ecological and evolutionary studies on the effects of habitat fragmentation in the Åland Islands, an archipelago in the Baltic Sea region ( Ojanen et al. 2013 ). Across the butterfly’s geographical range, the species inhabits meadow habitats, where larvae feed on few host plants, including Plantago lanceolata (Linnaeus, 1753) and Veronica spicata (Linnaeus, 1753). The butterfly’s eggs, larvae and pupae are parasitised by several common parasitoid wasp species, including specialized species such as Hyposoter horticola (Gravenhorst, 1829) and Cotesia melitaearum (Wilkinson, 1937). These wasps belong to the Braconidae and Ichneumonidae groups, respectively, and are known to have important impacts on the butterfly’s population dynamics (Lei et al. 1997a). The bacterial microbiota associated with larvae collected in the field in the Åland islands, or reared in the laboratory, have been previously characterized through 16S rRNA gene metabarcoding approaches ( Duplouy et al. 2020a ; Minard et al. 2019 ). The first assembly of the genome of M. cinxia was released in 2014 ( Ahola et al. 2014 ), followed by two chromosome-level assemblies in 2021 ( Vila et al. 2021 ) and 2022 ( Smolander et al. 2022 ). We retrieved the raw sequence data from five whole genome sequence datasets, including two genomic assembly projects ( Ahola et al. 2014 ; Smolander et al. 2022 ) with NCBI references # PRJNA191594 and # PRJNA607899 , respectively, and from three additional independent projects comparing genomic characteristics of different local or regional populations (labelled Adults Europe #C; Åland larvae & adults #D; and Åland larvae #E). Dataset #D was derived from both larval and adult specimens collected in the Åland Islands in 2009 and 2010, dataset #E from wild larval samples collected in the Åland Islands in 2018 and 2019, while dataset #C included only wild adult specimens collected during summer 2020 in France, Morocco, Spain, and Switzerland. The sample preparation and sequencing techniques vary between projects, including NovaSeq, NovaSeq 150bp Paired-Ends, and NextSeq 170bp PE (as described in Table 1 ). View this table: View inline View popup Download powerpoint Table 1: Sample size, country of origin, developmental stage, and sex for each of the genomic project screened for non-host reads. The * samples were pooled without prior knowledge of the sex of the larvae. Unfortunately, the low coverage for each specimen in all projects compromised the deep characterization of the metagenome of each specimen individually. Thus, to improve our ability to detect non-host material, we pooled all samples from the same dataset, same population and same sex (when known) together. This reduced the total number of samples from the original N initial =425 specimens (plus the two full genome projects) to N final =166 samples (plus the two full genome projects). Details on the pooled sample size, country of origin, life stage and sex of the samples, as well as the sequencing method used for each project, are described in Table 1 . b) Sex characterization of larval samples Although we characterized the sex of the adult specimens through visual inspection of their external genitalia prior to dissections, the larvae of this butterfly species do not show any external sexually dimorphic traits, and thus their sex could only be determined after sequencing. Females were identified based on homozygosity across a set of 22 Z-chromosome specific single-nucleotide polymorphism loci ( Kahilainen et al. 2022 ). c) Screening for non-host genomic material We trimmed the Illumina paired-end reads to remove Illumina adapter sequences and any low-quality bases from the start and end of reads using Trimmomatic version 0.39 ( Bolger et al. 2014 ) with the ILLUMINACLIP adapter-clipping settings 2:30:10 LEADING:3 TRAILING:3 SLIDINGWINDOW:4:15 MINLEN:50. We then used the SPAdes assembly toolkit version 3.15.0 ( Bankevich et al. 2012 ) ( https://github.com/ablab/spades ) with the --meta (metagenomic) flag to denovo assemble the trimmed paired reads into contigs ( Nurk et al. 2017 ). To reduce heterozygosity, we applied the Redundans pipeline ( Pryszcz & Gabaldón 2016 ) to the assembled scaffolds, and later annotated them to NCBI TaxIDs using BLASTN searches (BLAST v. 2.12.0, https://docs.csc.fi/apps/blast/ ) against the NCBI non-redundant nucleotide database, retaining one aligned contig per scaffold (max_target_seqs 1). We only saved the best alignment for each query-subject pair (max_hsps 1), and with an E-value less than 1 × e−25. We then used BWA-MEM ( Li & Durbin 2009 ; Li & Durbin 2010 ) to map all the original trimmed and corrected reads to the reference scaffolds and converted the results into sorted bam format files containing sample, sequence and mapped read data with SAMtools ( Li & Durbin 2009 ). Finally, we generated BlobPlots and associated statistics at the genus taxonomic rank for each assembly with Blobtools v1.1 ( Laetsch & Blaxter 2017 ) based on the BLASTn similarity search results, and using coverage and GC content values to differentiate host genomic material (Table S1). Contamination with any non-host material was considered real, when the value of the ‘bam0_read_map_p’ output from the Blobtools analysis was above 0.5%. Three samples (from #D), were removed prior to subsequent analyses because of their overall lack of non-host data (all non-host hits <0.5% in AF10-173-6, AF10-7007-1, and 09-8544-001-1-5). Additionally, to check that our results were repeatable, we compared the outputs of our Blobtools analyses with the outputs from CC-Metagen analyses ( https://github.com/vrmarcelino/CCMetagen )( Clausen et al. 2018 ; Marcelino et al. 2020 ) for five randomly chosen samples (AF18_2155_1, AF19_48_1, AF19_57_1, AF10-13341-3 and AF19_1956_1). d) Non-host community composition analyses By combining the Blobtools results at the genus level from all the samples, and only selecting the non-host species with a total ‘bam0_read_map_p’ output equal to or above 1%, we created a community matrix of 78 non-host species. This included prokaryote species, as well as some eukaryote species. Hits to Diptera taxa and to Homo sapiens were considered to represent clear sample preparation contaminations and were manually removed before any further analyses. We tested for dissimilarities between treatments (Country, Dataset or Life stage) in this community matrix, using the ANOSIM statistic R test with N=9999 permutations in the VEGAN package in R v.2023.12.0+369 ( RCoreTeam 2020 ). e) Building genome assemblies of common parasites and symbionts We retrieved a representative list of high-quality Wolbachia and Spiroplasma genomes from the NCBI Genome Data Hub (by April 2022), to build independent reference databases of each microbial symbiont ( Valerio et al. 2024a ). The available NCBI genome projects were filtered to only include ‘Complete’ and/or ‘Reference’ genomes. Similarly, we built a reference database for the parasitoid wasp Cotesia sp. using only the two high-quality genomic projects available from NCBI (by April 2022), including the genome assembly of C. congregata (WGS project #CAJNRD03), and the genome assembly of C. glomerata (WGS project #JAHXZJ01). In an attempt to build the Wolbachia, Spiroplasma and Cotesia assemblies from our metagenomic analyses, we combined the reference Wolbachia , Spiroplasma and Cotesia genomes and two M. cinxia full genomes ( Smolander et al. 2022 ; Vila et al. 2021 ) into a single fasta file, after renaming their sequences with a prefix Wo, Sp, Co, or ci, respectively. We used BWA-MEM ( Li & Durbin 2009 ; Li & Durbin 2010 ) to map raw reads from all other projects to this multi species reference. Reads with an alignment score >= 240 (max score is 300, 150bp+150bp reads) were then assembled using the SPAdes software ( Bankevich et al. 2012 ), following the same protocol as in the Blobtools pipeline described above. Results a) Detection of infections from genomic material of M. cinxia Despite combining samples from the same population, year and sex (when possible), the depth of the non- M. cinxia genomic data and total amount of reads assigned to M. cinxia and non- cinxia organism per sample remained low for many samples (Table S2). The amount of non-host material from both host genome sequencing projects ( Ahola et al. 2014 ; Smolander et al. 2022 ) were too low to be confidently further examined (data not shown). The number of reads assigned to M. cinxia from the three re-sequencing projects varies from 7485 to 44687900 reads per sample (with an average=20540118.3), while the number of reads assigned to non-host varies from 4024 to 43524459 reads per sample (with an average=707841) (Table S2). Screening of these samples still provided information on several expected and unexpected infection patterns. The outputs of the Blobtools analyses were similar to those of CC-Metagen analyses on five replicated samples (Table S3). The larval samples AF18_2155_1 and AF19_1956_1 were poor in non-host material, while sample AF19_48_1 contained Spiroplasma reads, sample AF19_57_1 contained genomic material of Braconidae wasps and their polydnavirus, and sample AF10-13341-3 included reads from Pseudomonas , Enterobacter , Klebsiella , and Gluconobacter . The analysis of dissimilarity between the non-host communities associated with our samples indicated that both the source dataset (ANOSIM, R=0.124, p=1e-4, Figure 1A ), and butterfly life stage (ANOSIM, R=0.0222, p=0.0077, Figure 1B ) affected community composition. Country, however, had no significant effect on the composition of non-host communities (ANOSIM, R=-0.128, p=0.996, Figure 1C ). Our analyses, however, only investigate the non-host species community at the genus level, and analyses at the strain level could show different community patterns between countries. Download figure Open in new tab Download figure Open in new tab Figure 1: NMDS1 graph of the non-host community composition. Samples are coloured as (Top) per dataset, (Middle) per life stage, and (Bottom) per country of origin (Salmon ellipse for France covers all other ellipse, and is only shown partially in the graph; The Moroccan population only includes 1 sample and is not represented by any ellipse). Our analyses showed that four and six M. cinxia samples were contaminated with genomic material from two genera of parasitoid wasps: Cotesia sp. and Hyposoter sp. , respectively ( Duplouy et al. 2015 ; van Nouhuys 2016 ). Such contamination was found in both female and male larvae, but never from adult specimens. Genomic reads (ie. N=186432 reads or above) from the braconid Cotesia sp . wasp, as well as from the wasp-associated bracovirus ( Benoist et al. 2017 ; Savary et al. 1999 ), were identified in four larval samples, from the Eckerö and Hammarland communes in Åland (patch #572, 1646, 57, and 1056). Genomic reads from the Ichneumonid Hyposoter sp. wasp, as well as reads from the wasp-associated ichnovirus ( Clavijo et al. 2011 ; Dorémus et al. 2013 ), were detected from six larvae (Table S1) collected from the communes of Saltvik, Hammarland and Sund in the Åland Islands (patch #123, 535×2, 9620, 9025, 9051). We also detected genomic material from the bacterial endosymbionts Wolbachia , Spiroplasma , and Rickettsiella , which are generally ubiquitous in insects ( Duplouy & Hornett 2018 ; Raina et al. 2018 ; Weinert et al. 2015 ). Spiroplasma infections were encountered in 23/86 (26.7%) larval and 22/83 (26.5%) of adult host samples, from both female and male specimens. Spiroplasma was detected from specimens from all source countries, except from Morocco, which is only represented by one sample in our dataset. Despite its high prevalence in our samples, Spiroplasma always represented less than 10% of the total reads per sample (ie. 9400 or more reads/sample). In contrast, Wolbachia was represented by 3.7% to 43.4% of the non-host reads per sample (155526 or more reads/sample), and occurred at a lower prevalence in our datasets, with only five adult samples found infected (5/166, 3%) (Table S1). These Wolbachia -infected samples include three pools of females and two of males, from either Spain or Switzerland. The other endosymbiotic bacterium Rickettsiella was detected in a unique larval sample, and was represented by 54% of the non-host reads of that sample. Many other bacterial species were also found sporadically, including Erwinia (one French adult and one Finnish larval samples, 7%, and 80% of the non-host reads, respectively), Rhanella (two larval samples, 5% and 58% of the non-host reads), Serratia (one French adult sample, 63.5% of the non-host reads), and Yersinia (one adult and five larval samples from the Åland Islands, 1.6% to 50.4% of the non-host reads respectively). One adult sample from the commune of Vall d’Estos in Spain was highly dissimilar to all others (Table S1). This Spanish sample was almost fully contaminated with the bacterium Proteus (96.9% of the non-host reads), and it was the only sample carrying this bacterium in our dataset. This sample was not excluded from the analyses but was excluded as a visual outlier from Figure 1 . Four microbial genera, Gluconobacter, Enterobacter, Actobacter and Alphabaculovirus were only found in the adult and larval Åland dataset #D, while all other microbes were identified from several datasets. b) Genomic assemblies of identified non-host organisms By combining all reads from Åland, we were only able to assemble a 11.2Mb genomic assembly of Cotesia (eg. expected whole genome size >180Mb), and a 65Kb genomic assembly of Spiroplasma (ie. expected whole genome size ≈1.2Mb). We also assembled a 95Kb assembly of Wolbachia genome, by combining reads from the five infected specimens (ie. expected whole genome size ≈1.2Mb, Table 2 ). The covered regions spanned several host genomic scaffolds, and each at a very low abundance ( Figure S1 ). We were unable to retrieve and compare sequences of commonly characterized loci of Cotesia , Spiroplasma or Wolbachia strains to our partial assemblies ( Duplouy et al. 2015 ; Kankare et al. 2005 ). The comparison of the largest contigs from each partial assembly against the NCBI nucleotide database (Blastn search conducted in December 2024, Table 2 ) however supports the assigned identities of our three partial assemblies. Notably, although the GC contents of both the Cotesia and Spiroplasma partial assemblies correlate with previous genomic analyses on these organisms (36% and 25%, respectively), our Wolbachia partial assembly exhibits a much higher GC content than other Wolbachia genomic projects (49% instead of the usual 34%) ( Table 2 ). View this table: View inline View popup Table 2: Statistics and features of three partial genomic assemblies, and best match output (i.e. blastn) between the largest contig of each assembly and the nucleotide NCBI database (December 2024). Discussion Our screening for non-host genomic material in five independent whole genome sequencing datasets of the butterfly M. cinxia revealed the presence of genomic material from different non-host micro- and macro-organisms. Our approach of exploring the non-host genomic material from whole genome sequencing projects for evidence of other species is not novel, and has previously provided insights into a hidden diversity of microbes associated with diverse insect species ( Ghanavi et al. 2021 ; Twort et al. 2022 ; Vancaester & Blaxter 2023 ). However, this is, to our knowledge, the first time that the method is used on datasets from across different life stages, and on several populations from across a large portion of the natural geographical range of a single host species, revealing new details about the ecology and evolution of interactions between M. cinxia butterflies and their diverse parasites. Previous studies have identified the butterfly M. cinxia as the host of several parasitoid species, including specialist and generalist parasitoids attacking the eggs, larvae or pupae of M. cinxia (Lei et al. 1997b; van Nouhuys 2016 ). We present evidence that some of our M. cinxia larvae were parasitized by either Braconidae or Ichneumonidae parasitoid wasps, most likely Cotesia melitaearum and Hyposoter horticola , which are both common in the Åland Islands ( van Nouhuys 2016 ; van Nouhuys et al. 2012 ). The detected parasitism rates, however, (12% of our larval samples) remain under the expected 30% emergence rate by H. horticola alone in the Åland population ( Duplouy et al. 2015 ; Montovan et al. 2015 ). Although, it is possible that this result denotes the low detection ability of the screening method, this result might still suggest that the parasitoids indeed only parasitize a 30% fraction of the available larval hosts ( Montovan et al. 2015 ), rather than a much higher rate but experiencing some degree of mortality before emergence. Additionally, the lack of detection of parasitoid DNA from the sequenced adult butterflies is concordant with the idea that Hyposoter and Cotesia parasitoids are specialists of the M. cinxia larval stage, and that parasitism is fatal for the larvae ( Montovan et al. 2015 ). Our results provide the first evidence that M. cinxia is host to bacterial endosymbionts, including Spiroplasma and Wolbachia . Spiroplasma is a common symbiont of insects, infecting about 10% of species worldwide ( Duplouy & Hornett 2018 ). The bacterium induces diverse phenotypes in its hosts ( Jiggins et al. 2000 ; Pollmann et al. 2022 ), but its effects on the ecology and evolution of M. cinxia remain unknown ( Duplouy et al. 2020a ). As Spiroplasma was found at an intermediate prevalence (i.e. 45/169 samples, 26.6%) and conserved in all populations screened, we suggest that the symbiont may be of relevance for the fitness and/or ecology of its M. cinxia host. Several previous microbiota studies focusing on the Åland population have failed to highlight the presence of the symbiont ( Duplouy et al. 2018 ; Duplouy et al. 2020a ; Minard et al. 2022 ; Minard et al. 2019 ). We suggest that Spiroplasma is present at such low densities in larval and adult M. cinxia hosts, that its detection through metabarcoding approaches might not always be successful. This hypothesis is supported by the fact that, even after pooling all our samples, we could only produce a short partial Spiroplasma assembly (65KB) with very low read coverage. Future studies specifically investigating Spiroplasma in M. cinxia are needed to clarify the prevalence, titer, tropism and role of the symbiont in this butterfly species. In contrast, Wolbachia , perhaps the most common symbiont in insects worldwide ( Duplouy & Hornett 2018 ; O’Neill et al. 1992 ; Zug & Hammerstein 2012 ), was rarely detected in M. cinxia . Spiroplasma and Wolbachia can sometimes co-infect their hosts ( Mathé-Hubert et al. 2019 ), however, as both symbionts are thought to compete for the same resources, they might also exclude each other, which would explain the high prevalence of Spiroplasma and the low prevalence of Wolbachia in our system. Wolbachia and Spiroplasma symbionts are predominantly transmitted maternally, but evidence of horizontal transfers of the symbionts is available from other host systems ( Brown & Lloyd 2015 ; Duplouy et al. 2020b ; Vavre et al. 1999 ). Parasitoid species in particular are described as potential vectors of Wolbachia to naïve hosts ( Vavre et al. 1999 ). In the Åland Islands, 50% of the population of H. horticola is infected with a strain of the bacterial symbiont Wolbachia ( Duplouy et al. 2015 ; Duplouy et al. 2021 ; van Nouhuys et al. 2016 ). The lack of infection in these particular wasps ( Duplouy et al. 2015 ; Duplouy et al. 2021 ), or alternatively, the low sequencing coverage of our samples, combined with the possibly low density of Wolbachia in young parasitoid larvae, could explain why this Wolbachia strain was not detected in any of the six Finnish larvae parasitized by Hyposoter . Unfortunately, because of low coverage, we could not compare the partial Wolbachia assembly from the Spanish and Swiss M. cinxia samples to previously sequenced material from the Wolbachia strains infecting H. horticola from Åland or France ( Duplouy et al. 2015 ). In contrast, we have no evidence of Spiroplasma infection in parasitoids of M. cinxia ( Valerio et al. 2024b ). Overall, the analysis of metagenomes from different life-stages and populations revealed details of the interactions between the butterfly M. cinxia and its parasitoids, as well as with various symbiotic species. Although this study demonstrates the power of such analyses, applicable to any study system ( Vancaester & Blaxter 2023 ), they also generate several new questions and avenues for further research on species interactions. For example, in addition to Wolbachia and Spiroplasma , other microbial infections, such as Yersinia bacteria and baculoviruses, were detected. The detection of such possibly pathogenic species is exciting, and their possible role in host population decline ( Kahilainen et al. 2018 ) deserves further investigation. Finally, although the development of more affordable whole-genome sequencing methods now supports the wider use of those methods in evolutionary biology, the overall coverage and total number of reads obtained from these sequencing projects may often be too low to allow the comprehensive and reliable detection of infections in the targeted host. In our case, even after merging individual sequencing files, we were only able to produce partial assemblies of the genomes of some of the symbiotic strains present in the different populations of M. cinxia . Furthermore, because of the overall low coverage of our samples, we remain cautious about some of our results. For example, the estimated prevalence of many infections should be interpreted carefully, as especially false negatives might still occur despite merging of the data. Similarly, because of the merging of specimen data, we cannot tell exactly how many individual specimens were truly infected per population. Nonetheless, as the outputs from two independent tools, Blobtool ( Laetsch & Blaxter 2017 ) and CC-Metagen, ( Marcelino et al. 2020 ), converged in their taxonomic assignments of the non-host genomic material, we are confident in the provided genus-level taxonomic identifications. But higher coverage would have provided us with better quality assemblies of all species, and would have provided additional population genetic information on the different parasites ( Kankare et al. 2005 ). In conclusion, even if represented at low coverage, available whole-genome sequencing projects not only provide the research community with genomic material from the target species, but also allow the discovery and potential monitoring of diverse pathogenic, parasitic, and symbiotic organisms associated with the target host. In the future, the results of our metagenomic analyses will guide the design of target experimental assays to reveal the role of each detected infection on the fitness and population dynamics of M. cinxia , as well as their importance for the butterfly’s ecology and evolutionary trajectory. Data availability Supplementary material (Table S1-S3 and genomic assemblies) can be found in Zenodo under the DOI 10.5281/zenodo.14673566 . Raw sequence reads from the three re-sequencing datasets will only be made publicly available in NCBI upon publication of the research. Supplementary material Download figure Open in new tab Figure S1: The coverage of Spiroplasma genome (top), Wolbachia genome (middle), and the first 1.4Mb of first Cotesia chromosome (bottom). The top row (coverage=1) of each graph shows the low coverage across the chromosomes. Only very few positions have been covered explaining the resulting partial assemblies obtained in the present study. Table S1: Outputs from the Blobtool analyses. Data can be found under Zenodo DOI 10.5281/zenodo.14673566 . Table S2: Number of reads assigned to each of three parasites (ie. Cotesia, Spiroplasma, Wolbachia ) for each sample. Data can be found under Zenodo DOI 10.5281/zenodo.14673566 . Table S3: Output from the CCMetagen analyses on five selected samples. Data can be found under Zenodo DOI 10.5281/zenodo.14673566 . Acknowledgments We thank F. Valerio for providing reference genome databases for Wolbachia , Spiroplasma and Cotesia . The project was funded by the Academy of Finland (grant #321543 to AD, #316227 to MFD) and Helsinki Institute of Life Science (HiLIFE) start up package to M.S., M.M.J. and P.R., as members of the University of Helsinki Biodata Analytics Unit, were supported by the Academy of Finland’s ‘Thriving Nature’ research profiling action. Thank you to Constanti Stefanescu, Alma Oksanen, Debra DiLeo, Sandra Fagan, Antoni Mariné, and Rachel de Marco for assistance with sample collection in Spain, Switzerland, and Morocco. Footnotes https://zenodo.org/records/14673567 References ↵ Ahola V , Lehtonen R , Somervuo P , Salmela L , Koskinen P , Rastas P , Välimäki N , Paulin L , Kvist J , Wahlberg N , Tanskanen J , Hornett EA , Ferguson LC , Luo S , Cao Z , de Jong MA , Duplouy A , Smolander OP , Vogel H , McCoy RC , Qian K , Chong WS , Zhang Q , Ahmad F , Haukka JK , Joshi A , Salojärvi J , Wheat CW , Grosse-Wilde E , Hughes D , Katainen R , Pitkänen E , Ylinen J , Waterhouse RM , Turunen M , Vähärautio A , Ojanen SP , Schulman AH , Taipale M , Lawson D , Ukkonen E , Mäkinen V , Goldsmith MR , Holm L , Auvinen P , Frilander MJ , and Hanski I. 2014 . The Glanville fritillary genome retains an ancient karyotype and reveals selective chromosomal fusions in Lepidoptera . Nat Commun 5 : 4737 . doi: 10.1038/ncomms5737 OpenUrl CrossRef PubMed ↵ Bankevich A , Nurk S , Antipov D , Gurevich AA , Dvorkin M , Kulikov AS , Lesin VM , Nikolenko SI , Pham S , Prjibelski AD , Pyshkin AV , Sirotkin AV , Vyahhi N , Tesler G , Alekseyev MA , and Pevzner PA . 2012 . SPAdes: a new genome assembly algorithm and its applications to single-cell sequencing . J Comput Biol 19 : 455 – 477 . doi: 10.1089/cmb.2012.0021 OpenUrl CrossRef PubMed ↵ Benoist R , Chantre C , Capdevielle-Dulac C , Bodet M , Mougel F , Calatayud PA , Dupas S , Huguet E , Jeannette R , Obonyo J , Odorico C , Silvain JF , Le Ru B , and Kaiser L. 2017 . Relationship between oviposition, virulence gene expression and parasitism success in Cotesia typhae nov. sp. parasitoid strains . Genetica 145 : 469 – 479 . doi: 10.1007/s10709-017-9987-5 OpenUrl CrossRef PubMed ↵ Bolger AM , Lohse M , and Usadel B . 2014 . Trimmomatic: a flexible trimmer for Illumina sequence data . Bioinformatics 30 : 2114 – 2120 . doi: 10.1093/bioinformatics/btu170 OpenUrl CrossRef PubMed Web of Science ↵ Brown AN , and Lloyd VK. 2015 . Evidence for horizontal transfer of Wolbachia by a Drosophila mite . Experimental and Applied Acarology 66 : 301 – 311 . doi: 10.1007/s10493-015-9918-z OpenUrl CrossRef PubMed ↵ Charlat S , Duplouy A , Hornett EA , Dyson EA , Davies N , Roderick GK , Wedell N , and Hurst GD . 2009 . The joint evolutionary histories of Wolbachia and mitochondria in Hypolimnas bolina . BMC Evol Biol 9 : 64 . doi: 10.1186/1471-2148-9-64 OpenUrl CrossRef PubMed ↵ Charlat S , Engelstädter J , Dyson EA , Hornett EA , Duplouy A , Tortosa P , Davies N , Roderick GK , Wedell N , and Hurst GD . 2006 . Competing selfish genetic elements in the butterfly Hypolimnas bolina . Curr Biol 16 : 2453 – 2458 . doi: 10.1016/j.cub.2006.10.062 OpenUrl CrossRef PubMed Web of Science ↵ Omkar Chellappan M , and Ranjith MT . 2021 . Metagenomic Approaches for Insect Symbionts . In: Omkar , ed. Microbial Approaches for Insect Pest Management . Singapore : Springer , 271 – 313 . ↵ Clausen PTLC , Aarestrup FM , and Lund O . 2018 . Rapid and precise alignment of raw reads against redundant databases with KMA . BMC Bioinformatics 19 : 307 . doi: 10.1186/s12859-018-2336-6 OpenUrl CrossRef PubMed ↵ Clavijo G , Dorémus T , Ravallec M , Mannucci MA , Jouan V , Volkoff AN , and Darboux I . 2011 . Multigenic families in Ichnovirus: a tissue and host specificity study through expression analysis of vankyrins from Hyposoter didymator Ichnovirus . PLoS One 6 : e27522 . doi: 10.1371/journal.pone.0027522 OpenUrl CrossRef PubMed ↵ Correa CC , and Ballard JWO . 2016 . Wolbachia associations with insects: Winning or losing against a master manipulator . Frontiers in Ecology and Evolution 3 : 153 . doi: 10.3389/fevo.2015.00153 OpenUrl CrossRef ↵ Deng J , Assandri G , Chauchan P , Futahashi R , Galimberti A , Hansson B , Lancaster LT , Takahashi Y , Svensson EI , and Duplouy A . 2021 . Wolbachia- driven selective sweep in a range expanding insect species . BMC Ecology and Evolution 21 . doi: 10.1186/s12862-021-01906-6 OpenUrl CrossRef ↵ Dorémus T , Jouan V , Urbach S , Cousserans F , Wincker P , Ravallec M , Wajnberg E , and Volkoff AN . 2013 . Hyposoter didymator uses a combination of passive and active strategies to escape from the Spodoptera frugiperda cellular immune response . J Insect Physiol 59 : 500 – 508 . doi: 10.1016/j.jinsphys.2013.02.010 OpenUrl CrossRef PubMed ↵ Duplouy A , Couchoux C , Hanski I , and van Nouhuys S. 2015 . Wolbachia Infection in a Natural Parasitoid Wasp Population . PLoS One 10 : e0134843 . doi: 10.1371/journal.pone.0134843 OpenUrl CrossRef PubMed ↵ Duplouy A , and Hornett EA . 2018 . Uncovering the hidden players in Lepidoptera biology: the heritable microbial endosymbionts . PeerJ 6 : e4629 . doi: 10.7717/peerj.4629 OpenUrl CrossRef PubMed ↵ Duplouy A , Ikonen S , and Hanski I . 2013 . Life history of the Glanville fritillary butterfly in fragmented versus continuous landscapes . Ecol Evol 3 : 5141 – 5156 . doi: 10.1002/ece3.885 OpenUrl CrossRef PubMed ↵ Duplouy A , Minard G , Lähteenaro M , Rytteri S , and Saastamoinen M . 2018 . Silk properties and overwinter survival in gregarious butterfly larvae . Ecol Evol 8 : 12443 – 12455 . doi: 10.1002/ece3.4595 OpenUrl CrossRef PubMed ↵ Duplouy A , Minard G , and Saastamoinen M . 2020a . The gut bacterial community affects immunity but not metabolism in a specialist herbivorous butterfly . Ecol Evol 10 : 8755 – 8769 . doi: 10.1002/ece3.6573 OpenUrl CrossRef PubMed ↵ Duplouy A , Nair A , Nyman T , and van Nouhuys S. 2021 . Long-term spatiotemporal genetic structure of an accidental parasitoid introduction, and local changes in prevalence of its associated Wolbachia symbiont . Mol Ecol 30 : 4368 – 4380 . doi: 10.1111/mec.16065 OpenUrl CrossRef ↵ Duplouy A , Pranter R , Warren-Gash H , Tropek R , and Wahlberg N . 2020b . Towards unravelling Wolbachia global exchange: a contribution from the Bicyclus and Mylothris butterflies in the Afrotropics . BMC Microbiol 20 : 319 . doi: 10.1186/s12866-020-02011-2 OpenUrl CrossRef PubMed ↵ Ghanavi HR , Twort VG , and Duplouy A . 2021 . Exploring bycatch diversity of organisms in whole genome sequencing of Erebidae moths (Lepidoptera) . Sci Rep 11 : 24499 . doi: 10.1038/s41598-021-03327-3 OpenUrl CrossRef PubMed ↵ Gibson J , Shokralla S , Porter TM , King I , van Konynenburg S , Janzen DH , Hallwachs W , and Hajibabaei M. 2014 . Simultaneous assessment of the macrobiome and microbiome in a bulk sample of tropical arthropods through DNA metasystematics . Proc Natl Acad Sci U S A 111 : 8007 – 8012 . doi: 10.1073/pnas.1406468111 OpenUrl Abstract / FREE Full Text ↵ Glasl B , Herndl GJ , and Frade PR . 2016 . The microbiome of coral surface mucus has a key role in mediating holobiont health and survival upon disturbance . ISME J 10 : 2280 – 2292 . doi: 10.1038/ismej.2016.9 OpenUrl CrossRef ↵ Graham RI , and Wilson K . 2012 . Male-killing Wolbachia and mitochondrial selective sweep in a migratory African insect . BMC Evolutionary Biology 12 . doi: 10.1186/1471-2148-12-204 OpenUrl CrossRef PubMed ↵ Ehrlich PR , and Hanski I Hanski I , Ehrlich PR , Nieminen M , Murphy DD , Hellmann JJ , Boggs CL , and McLaughlin JF . 2004 . Checkerspots and conservation biology . In: Ehrlich PR , and Hanski I , eds. On the wings of checkerspots: A model system for population biology . Oxford University Press . ↵ Hanski I , and Heino M . 2003 . Metapopulation-level adaptation of insect host plant preference and extinction-colonization dynamics in heterogeneous landscapes . Theor Popul Biol 64 : 281 – 290 . doi: 10.1016/s0040-5809(03)00093-5 OpenUrl CrossRef PubMed ↵ Hochachka WM , Dobson AP , Hawley DM , and Dhondt AA . 2021 . Host population dynamics in the face of an evolving pathogen . J Anim Ecol 90 : 1480 – 1491 . doi: 10.1111/1365-2656.13469 OpenUrl CrossRef ↵ Hornett EA , Duplouy AM , Davies N , Roderick GK , Wedell N , Hurst GD , and Charlat S . 2008 . You can’t keep a good parasite down: evolution of a male-killer suppressor uncovers cytoplasmic incompatibility . Evolution 62 : 1258 – 1263 . doi: 10.1111/j.1558-5646.2008.00353.x OpenUrl CrossRef PubMed ↵ Jiggins FM , Hurst GD , Jiggins CD , v d Schulenburg JH , and Majerus ME. 2000 . The butterfly Danaus chrysippus is infected by a male-killing Spiroplasma bacterium . Parasitology 120 : 439 – 446 . doi: 10.1017/s0031182099005867 OpenUrl CrossRef PubMed Web of Science ↵ Kahilainen A , Oostra V , Somervuo P , Minard G , and Saastamoinen M . 2022 . Alternative developmental and transcriptomic responses to host plant water limitation in a butterfly metapopulation . Mol Ecol 31 : 5666 – 5683 . doi: 10.1111/mec.16178 OpenUrl CrossRef ↵ Kahilainen A , van Nouhuys S , Schulz T , and Saastamoinen M. 2018 . Metapopulation dynamics in a changing climate: Increasing spatial synchrony in weather conditions drives metapopulation synchrony of a butterfly inhabiting a fragmented landscape . Glob Chang Biol 24 : 4316 – 4329 . doi: 10.1111/gcb.14280 OpenUrl CrossRef ↵ Kankare M , van Nouhuys S , and Hanski I. 2005 . Genetic Divergence Among Host-Specific Cryptic Species in Cotesia melitaearum Aggregate (Hymenoptera: Braconidae), Parasitoids of Checkerspot Butterflies . Annals of the Entomological Society of America 98 : 382 – 394 . doi: 10.1603/0013-8746(2005)098[0382:GDAHCS]2.0.CO;2 OpenUrl CrossRef ↵ Koehncke A , Telschow A , Werren JH , and Hammerstein P . 2009 . Life and death of an influential passenger: Wolbachia and the evolution of CI-modifiers by their hosts . PLoS One 4 : e4425 . doi: 10.1371/journal.pone.0004425 OpenUrl CrossRef PubMed ↵ Laetsch DR , and Blaxter ML . 2017 . KinFin: Software for Taxon-Aware Analysis of Clustered Protein Sequences . G3 (Bethesda) 7 : 3349 – 3357 . doi: 10.1534/g3.117.300233 OpenUrl Abstract / FREE Full Text Lei GCV , V. , Nieminen M , and Kuusaari M . 1997a . The parasitoid complex attacking Finnish populations of the Glanville fritillary Melitaea cinxia (Lep:Nymphalidae), and endangered butterfly . Journal of Natural History 31 : 635 – 648 . doi: 10.1080/00222939700770301 OpenUrl CrossRef Lei G-C , and Hanski I . 1997b . Metapopulation structure of Cotesia melitaearum , a specialist parasitoid of the butterfly Melitaea Cinxia . Oikos 78 ( 1 ): 91 – 100 . doi: 10.2307/3545804 OpenUrl CrossRef Web of Science ↵ Li H , and Durbin R . 2009 . Fast and accurate short read alignment with Burrows-Wheeler transform . Bioinformatics 25 : 1754 – 1760 . doi: 10.1093/bioinformatics/btp324 OpenUrl CrossRef PubMed Web of Science ↵ Li H , and Durbin R . 2010 . Fast and accurate long-read alignment with Burrows-Wheeler transform . Bioinformatics 26 : 589 – 595 . doi: 10.1093/bioinformatics/btp698 OpenUrl CrossRef PubMed Web of Science ↵ Liang Q , Bible PW , Liu Y , Zou B , and Wei L . 2020 . DeepMicrobes: taxonomic classification for metagenomics with deep learning . NAR Genom Bioinform 2 : lqaa009 . doi: 10.1093/nargab/lqaa009 OpenUrl CrossRef ↵ Marcelino VR , Clausen PTLC , Buchmann JP , Wille M , Iredell JR , Meyer W , Lund O , Sorrell TC , and Holmes EC . 2020 . CCMetagen: comprehensive and accurate identification of eukaryotes and prokaryotes in metagenomic data . Genome Biol 21 : 103 . doi: 10.1186/s13059-020-02014-2 OpenUrl CrossRef PubMed ↵ Mathé-Hubert H , Kaech H , Hertaeg C , Jaenike J , and Vorburger C . 2019 . Nonrandom associations of maternally transmitted symbionts in insects: The roles of drift versus biased cotransmission and selection . Mol Ecol 28 : 5330 – 5346 . doi: 10.1111/mec.15206 OpenUrl CrossRef ↵ Minard G , Kahilainen A , Biere A , Pakkanen H , Mappes J , and Saastamoinen M . 2022 . Complex plant quality—microbiota–population interactions modulate the response of a specialist herbivore to the defence of its host plant . Functional Ecology 36 : 2873 – 2888 . doi: 10.1111/1365-2435.14177 OpenUrl CrossRef ↵ Minard G , Tikhonov G , Ovaskainen O , and Saastamoinen M . 2019 . The microbiome of the Melitaea cinxia butterfly shows marked variation but is only little explained by the traits of the butterfly or its host plant . Environ Microbiol 21 : 4253 – 4269 . doi: 10.1111/1462-2920.14786 OpenUrl CrossRef ↵ Montovan KJ , Couchoux C , Jones LE , Reeve HK , and van Nouhuys S. 2015 . The puzzle of partial resource use by a parasitoid wasp . Am Nat 185 : 538 – 550 . doi: 10.1086/680036 OpenUrl CrossRef PubMed ↵ Nurk S , Meleshko D , Korobeynikov A , and Pevzner PA . 2017 . metaSPAdes: a new versatile metagenomic assembler . Genome Res 27 : 824 – 834 . doi: 10.1101/gr.213959.116 OpenUrl Abstract / FREE Full Text ↵ O’Neill SL , Giordano R , Colbert AM , Karr TL , and Robertson HM . 1992 . 16S rRNA phylogenetic analysis of the bacterial endosymbionts associated with cytoplasmic incompatibility in insects . Proc Natl Acad Sci U S A 89 : 2699 – 2702 . doi: 10.1073/pnas.89.7.2699 OpenUrl Abstract / FREE Full Text ↵ Ojanen SP , Nieminen M , Meyke E , Pöyry J , and Hanski I . 2013 . Long-term metapopulation study of the Glanville fritillary butterfly ( Melitaea cinxia ): survey methods, data management, and long-term population trends . Ecol Evol 3 : 3713 – 3737 . doi: 10.1002/ece3.733 OpenUrl CrossRef PubMed ↵ Pollmann M , Moore LD , Krimmer E , D’Alvise P , Hasselmann M , Perlman SJ , Ballinger MJ , Steidle JLM , and Gottlieb Y . 2022 . Highly transmissible cytoplasmic incompatibility by the extracellular insect symbiont Spiroplasma . iScience 25 : 104335 . doi: 10.1016/j.isci.2022.104335 OpenUrl CrossRef PubMed ↵ Pryszcz LP , and Gabaldón T . 2016 . Redundans: an assembly pipeline for highly heterozygous genomes . Nucleic Acids Res 44 : e113 . doi: 10.1093/nar/gkw294 OpenUrl CrossRef PubMed ↵ Raina JB , Eme L , Pollock FJ , Spang A , Archibald JM , and Williams TA . 2018 . Symbiosis in the microbial world: from ecology to genome evolution . Biol Open 7 . doi: 10.1242/bio.032524 OpenUrl Abstract / FREE Full Text ↵ RCoreTeam . 2020 . R: A language and environment for statistical computing . R Foundation for Statistical Computing , Vienna, Austria ↵ Rogowski ELB , Van Alst AD , Travis J , Reznick DN , Coulson T , and Bassar RD. 2020 . Novel parasite invasion leads to rapid demographic compensation and recovery in an experimental population of guppies . Proc Natl Acad Sci U S A 117 : 22580 – 22589 . doi: 10.1073/pnas.2006227117 OpenUrl Abstract / FREE Full Text ↵ Rosa E , Minard G , Lindholm J , and Saastamoinen M . 2019 . Moderate plant water stress improves larval development, and impacts immunity and gut microbiota of a specialist herbivore . PLoS One 14 : e0204292 . doi: 10.1371/journal.pone.0204292 OpenUrl CrossRef PubMed ↵ Saastamoinen M . 2022 . What can the long-term ecological monitoring of the Åland islands meadow network tell us about changes in Finnish nature? Memoranda Soc Fauna Flora Fennica 98 : 27 – 33 . OpenUrl ↵ Savary S , Drezen JM , Tan F , Beckage NE , and Periquet G . 1999 . The excision of polydnavirus sequences from the genome of the wasp Cotesia congregata (Braconidae, microgastrinae) is developmentally regulated but not strictly restricted to the ovaries in the adult . Insect Mol Biol 8 : 319 – 327 . doi: 10.1046/j.1365-2583.1999.83130.x OpenUrl CrossRef PubMed Web of Science ↵ Settele J , Shreeve TG , Konvicka M , and Van H Shaw MR , Stefanescu C , and van Nouhuys S . 2009 . Parasitoids of European Butterflies . In: Settele J , Shreeve TG , Konvicka M , and Van H , eds. Ecology of Butterflies of Europe . Cambridge : Cambridge University Press , 130 – 156 . ↵ Smolander OP , Blande D , Ahola V , Rastas P , Tanskanen J , Kammonen JI , Oostra V , Pellegrini L , Ikonen S , Dallas T , DiLeo MF , Duplouy A , Duru IC , Halimaa P , Kahilainen A , Kuwar SS , Kärenlampi SO , Lafuente E , Luo S , Makkonen J , Nair A , de la Paz Celorio-Mancera M , Pennanen V , Ruokolainen A , Sundell T , Tervahauta AI , Twort V , van Bergen E , Österman-Udd J , Paulin L , Frilander MJ , Auvinen P , and Saastamoinen M. 2022 . Improved chromosome-level genome assembly of the Glanville fritillary butterfly ( Melitaea cinxia ) integrating Pacific Biosciences long reads and a high-density linkage map . Gigascience 11 . doi: 10.1093/gigascience/giab097 OpenUrl CrossRef PubMed ↵ Susi H , Filloux D , Frilander MJ , Roumagnac P , and Laine AL . 2019 . Diverse and variable virus communities in wild plant populations revealed by metagenomic tools . PeerJ 7 : e6140 . doi: 10.7717/peerj.6140 OpenUrl CrossRef PubMed ↵ Teixeira L , Ferreira A , and Ashburner M . 2008 . The bacterial symbiont Wolbachia induces resistance to RNA viral infections in Drosophila melanogaster . PLoS Biol 6 : e2 . doi: 10.1371/journal.pbio.1000002 OpenUrl CrossRef PubMed ↵ Tollenaere C , Pernechele B , Mäkinen HS , Parratt SR , Németh MZ , Kovács GM , Kiss L , Tack AJ , and Laine AL . 2014 . A hyperparasite affects the population dynamics of a wild plant pathogen . Mol Ecol 23 : 5877 – 5887 . doi: 10.1111/mec.12908 OpenUrl CrossRef ↵ Twort VG , Blande D , and Duplouy A . 2022 . One’s trash is someone else’s treasure: sequence read archives from Lepidoptera genomes provide material for genome reconstruction of their endosymbionts . BMC Microbiol 22 : 209 . doi: 10.1186/s12866-022-02602-1 OpenUrl CrossRef PubMed ↵ Valerio F , Twort VG , and Duplouy A . 2024a . Screening Host Genomic Data for Wolbachia Infections . Methods Mol Biol 2739 : 251 – 274 . doi: 10.1007/978-1-0716-3553-7_16 OpenUrl CrossRef PubMed ↵ Valerio F , Martel C , Stefanescu C , van Nouhuys S , Kankare M , Duplouy A. 2024b . Wolbachia strain diversity in a complex group of sympatric cryptic parasitoid species . BMC Microbiology 24 : 319 . doi: 10.1186/s12866-024-03470-7 OpenUrl CrossRef PubMed ↵ van Nouhuys S. 2016 . Diversity, population structure, and individual behaviour of parasitoids as seen using molecular markers . Curr Opin Insect Sci 14 : 94 – 99 . doi: 10.1016/j.cois.2016.02.006 OpenUrl CrossRef PubMed ↵ van Nouhuys S , Kohonen M , and Duplouy A. 2016 . Wolbachia increases the susceptibility of a parasitoid wasp to hyperparasitism . J Exp Biol 219 : 2984 – 2990 . doi: 10.1242/jeb.140699 OpenUrl Abstract / FREE Full Text ↵ van Nouhuys S , Niemikapee S , and Hanski I. 2012 . Variation in a Host-Parasitoid Interaction across Independent Populations . Insects 3 : 1236 – 1256 . doi: 10.3390/insects3041236 OpenUrl CrossRef PubMed ↵ Vancaester E , and Blaxter M . 2023 . Phylogenomic analysis of Wolbachia genomes from the Darwin Tree of Life biodiversity genomics project . PLoS Biol 21 : e3001972 . doi: 10.1371/journal.pbio.3001972 OpenUrl CrossRef PubMed ↵ Vavre F , Fleury F , Lepetit D , Fouillet P , and Boulétreau M . 1999 . Phylogenetic evidence for horizontal transmission of Wolbachia in host-parasitoid associations . Mol Biol Evol 16 : 1711 – 1723 . doi: 10.1093/oxfordjournals.molbev.a026084 OpenUrl CrossRef PubMed Web of Science ↵ Vila R , Hayward A , Lohse K , Wright C , Barcoding DToL, collective, programme WSIToL, Wellcome, collective SISODP, Tree, collective oLCI, and Consortium DToL . 2021 . The genome sequence of the Glanville fritillary, Melitaea cinxia (Linnaeus, 1758) . Wellcome Open Research 6 . doi: 10.12688/wellcomeopenres.17283.1 OpenUrl CrossRef PubMed ↵ Weinert LA , Araujo-Jnr EV , Ahmed MZ , and Welch JJ . 2015 . The incidence of bacterial endosymbionts in terrestrial arthropods . Proc Biol Sci 282 : 20150249 . doi: 10.1098/rspb.2015.0249 OpenUrl CrossRef PubMed ↵ Zhang YZ , Shi M , and Holmes EC . 2018 . Using Metagenomics to Characterize an Expanding Virosphere . Cell 172 : 1168 – 1172 . doi: 10.1016/j.cell.2018.02.043 OpenUrl CrossRef PubMed ↵ Zug R , and Hammerstein P . 2012 . Still a host of hosts for Wolbachia : analysis of recent data suggests that 40% of terrestrial arthropod species are infected . PLoS One 7 : e38544 . doi: 10.1371/journal.pone.0038544 OpenUrl CrossRef PubMed ↵ Łukasik P , Guo H , van Asch M , Ferrari J , and Godfray HC. 2013 . Protection against a fungal pathogen conferred by the aphid facultative endosymbionts Rickettsia and Spiroplasma is expressed in multiple host genotypes and species and is not influenced by co-infection with another symbiont . J Evol Biol 26 : 2654 – 2661 . doi: 10.1111/jeb.12260 OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted January 21, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Recovering ecological interactions by mining non-target data from whole genome re-sequencing projects Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Recovering ecological interactions by mining non-target data from whole genome re-sequencing projects Mirkka Jones , Pasi Rastas , J. Camilo Chacón-Duque , Michelle F. DiLeo , Abhilash Nair , Vicencio Oostra , Marjo Saastamoinen , Anne Duplouy bioRxiv 2025.01.17.633498; doi: https://doi.org/10.1101/2025.01.17.633498 Share This Article: Copy Citation Tools Recovering ecological interactions by mining non-target data from whole genome re-sequencing projects Mirkka Jones , Pasi Rastas , J. Camilo Chacón-Duque , Michelle F. DiLeo , Abhilash Nair , Vicencio Oostra , Marjo Saastamoinen , Anne Duplouy bioRxiv 2025.01.17.633498; doi: https://doi.org/10.1101/2025.01.17.633498 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Ecology Subject Areas All Articles Animal Behavior and Cognition (7642) Biochemistry (17715) Bioengineering (13907) Bioinformatics (42003) Biophysics (21470) Cancer Biology (18624) Cell Biology (25533) Clinical Trials (138) Developmental Biology (13390) Ecology (19935) Epidemiology (2067) Evolutionary Biology (24356) Genetics (15617) Genomics (22529) Immunology (17753) Microbiology (40432) Molecular Biology (17200) Neuroscience (88681) Paleontology (667) Pathology (2840) Pharmacology and Toxicology (4828) Physiology (7653) Plant Biology (15171) Scientific Communication and Education (2046) Synthetic Biology (4304) Systems Biology (9826) Zoology (2271)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00