Full text
45,102 characters
· extracted from
preprint-html
· click to expand
Mammalian Uteri Contain a Diverse Virome: Insights from Healthy Mares | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Mammalian Uteri Contain a Diverse Virome: Insights from Healthy Mares Lulu Guo , G. Reed Holyoak , Udaya DeSilva doi: https://doi.org/10.1101/2025.02.26.640264 Lulu Guo 1 Department of Veterinary Clinical Sciences, Oklahoma State University , Stillwater, Oklahoma, United States Find this author on Google Scholar Find this author on PubMed Search for this author on this site G. Reed Holyoak 1 Department of Veterinary Clinical Sciences, Oklahoma State University , Stillwater, Oklahoma, United States Find this author on Google Scholar Find this author on PubMed Search for this author on this site Udaya DeSilva 2 Department of Animal and Food Sciences, Oklahoma State University , Stillwater, Oklahoma, United States Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: udaya.desilva{at}okstate.edu Abstract Full Text Info/History Metrics Preview PDF ABSTRACT The Earth’s estimated 10 31 virions, primarily phages, significantly impact microbial ecosystems. Despite their abundance, viromes remain relatively understudied. This is especially the case in domestic animals. Although recent studies have described the presence of a dynamic commensal microbiome in mammalian uteri, no studies have attempted to characterize the commensal virome in a mammalian uterus. In this study we have established for the first time the presence of a sparse, but diverse native virome in the equine uterus. The resulting virome database consists of 513 non-redundant viral genomes (>2 kb). Taxonomic annotations revealed a diverse virome dominated by Gammaretrovirus, Mamastrovirus, Sapovirus and Rosenblumvirus. Notably, 75% of the assembled genomes represented novel species. The phylogenetic tree unveiled distinct clades suggesting unexplored viral diversity with the uterine environment. Furthermore, bacterial hosts for equine uterine phages were predicted, aligning with previous studies’ findings. Most notably, the study identified antibiotic resistance genes within the virome, hinting at potential gene transfer mechanisms between bacteria and viruses. This study establishes the first uterine virome of any mammal, shedding light on a previously unexplored domain. The findings highlight the potential for phage therapy in reproductive infectious diseases and the importance of understanding the maternal gestational environment. Moreover, the study underscores the need for further studies to expand the uterine viromes, paving the way to deeper understanding of uterine microbiome and its implications for animal and human health. Introduction There are an estimated 10 31 virions on earth 1 . Most of these viruses are thought to be phages that infect prokaryotes and compete with their hosts by at least an order of magnitude 2 . Based on the half-life of free viruses ∼(48h), it is estimated that 10 27 viruses are produced per minute, and 10 25 microorganisms - about 100 million metric tons – of bacteria are destroyed per minute 1 . Although bacterial and fungal biomes of most environments have been thoroughly investigated, viromes have not been deeply studied. Most sequence data in typical virome studies remain unidentifiable, and referred to as unexplored viral “dark matter” 3 . According to the National Center for Biotechnology Information (NCBI) Genomes database, only 11,673 complete viral genome sequences have been reported as of January 2024. This number represents a very small fraction of the total viral genetic diversity. Reproductive tract virome studies have focused mainly within the vagina because of accessibility and ease of sampling without cross contamination 4 . Additionally, the uterine environment has long been considered a sterile environment as early as Henry Tissier’s 1900 study 5 . However, this assumption started to be challenged in the mid-to-late 1980s, with reports indicating culturable bacteria from the uterus of healthy asymptomatic women 6789 . With the advent of high-throughput bacterial genomic analyses, many reports of uterine microbiomes of different species have been published, such as human 10 , dairy cow 11 , canine 12 , and equine 13 . Published virome studies on female reproductive tract mostly focuses on human vaginal environment, such as comparing the vaginal viromes of pregnant women with or without vaginitis 14 and the differences between health and dysbiotic vaginal DNA virome 15 etc. Human vaginal virome analyses led scientists to believe that vaginal viromes are able to balance female genital tract bacteriome, mucosal immunity, sexual and reproductive health and disease 16 , and that change of cervicovaginal DNA virome will affect genital inflammation and microbiota composition 17 . However, understanding the role of virome in animal gynecological health is also important because they are an essential part of the entire ecosystem. Our previous metagenomic analyses of the equine uterine microbiome suggested the existence of a commensal virome. Here we report the identification of a native virome of the equine uterus, the host prediction for those viruses, and the presence of antibiotic resistance in the uterine environment. To the best of our knowledge, this is the first comprehensive analysis of the uterine virome of a mammal. Equine Uterine Virome Database We obtained 272,710,338 clean reads (∼4 billion nucleotides with an average read length of 140 bp) with Phred scores higher than 40. These assembled into 32,084 contigs with an average lengt∼h 550 bp. Minimum contig length wa∼s 200 bp. 2789 contigs were over 10 kb in length. 1750 of the larger contigs were determined to be high-quality for containing majority (>70%) of the organism’s predicted genome 18 . The N50 length, defined as the shortest contig length that covers at least half of the total base content was ∼500 bp and the N90 length defined as the shortest contig length that ensures that the contigs of that length, or longer contains at least 90% of the sum lengths of the contigs was∼310 kb (data not shown). The GC content of the contigs were ∼40% GC and none of them had gaps. 66 contigs were complete circular genomes. No detectable DNA was observed in either negative control in a bioanalyzer and were not sequenced. To predict viral sequences, all the contigs were filtered through DeepVirFinder 19 , which takes advantages of deep learning to build convolutional neural networks to identify viral contigs without using reference databases 462 contigs were recognized as virus. VirSorter 20 , which relies on comparing sequence to known virus and viral-like features was also used to identify viral contigs and 78 contigs were identified. Twenty-seven of these contigs were recognized by both tools. We then filtered sequences at a 95% average nucleotide identity (ANI) threshold and 70% aligned fraction threshold obtaining a database of 513 uterine viral sequences, referred to here as the equine uterine virome database. Equine Uterus Harbors Diverse Range of Novel Virome Sequences Taxonomic annotations of the contigs were performed by CAT 21 , which classifies contigs according to genes, open reading frames (ORFs) prediction, and protein mapping. The IMG/VR database was used during annotation. The most plausible abundance in different levels based on viral contigs is shown in Figures 2(a)-2(f) . The mare endometrium is dominated by Gammaretrovirus, Mamastrovirus, Sapovirus and Rosenblumvirus at genus level. Gammaretrovirus, Mamastrovirus and Sapovirus are RNA viruses while Rosenblumvirus is a dsDNA virus. Most abundant predicted Phyla are depicted in Figure 3 . As shown, 11 classes, 11 orders, 14 families, 8 genera, 7 phyla and 29 species were identified. To represent richness, evenness, and statistical significance (p-adj <0.05), the alpha diversity was calculated by R vegan package. Alpha rarefaction of observed metrices showing species richness in samples reached near-saturation, but it only considers observed OTUs. However, chao1 considers not only observed OTUs, but also non-observed rare species. The results show the sequence coverage is sufficient. The non-parametric Kruskal-Wallis test was used for Shannon index and Simpson index ( Figures 4(a) & 4(b) ). Simpson index focuses more on relative abundance while Shannon index focuses more on species richness. Alpha diversity indices at different phylogenetic classifications are shown in Table 1 . View this table: View inline View popup Download powerpoint Table 1. Alpha diversity indices at different phylogenetic classifications. Download figure Open in new tab Figure 1. Overview of experimental workflow. Download figure Open in new tab Figure 2. The abundance profiles are depicted across various taxonomic levels, ranging from phylum to species. Each figure provides insight into the distribution and prevalence of taxa within the analyzed dataset, shedding light on the taxonomic composition and diversity present. Through comprehensive examination at different taxonomic resolutions, from broad classifications such as phylum down to specific species, these figures offer a nuanced understanding of the microbial community structure within the uterus. The dominance of Gammaretrovirus, Mamastrovirus, Sapovirus, and Rosenblumvirus at the genus level in the mare endometrium underscores the diversity of viral populations within this biological niche. Notably, Gammaretrovirus, Mamastrovirus, and Sapovirus are RNA viruses, whereas Rosenblumvirus belongs to the dsDNA virus group. Download figure Open in new tab Figure 3. A contig-based abundance analysis unveils a detailed representation of the genomic content within the assembled sequences. Additionally, the identification of 11 classes, 11 orders, 14 families, 8 genera, 7 phyla, and 29 species underscores the taxonomic richness and diversity present in the microbial community. Download figure Open in new tab Figure 4. (a) The alpha diversity of the analyzed ecosystem was assessed using the Shannon index. This metric provides a comprehensive measure of biodiversity within a specific community, taking into account both the abundance and evenness of different taxa. A higher Shannon index value signifies greater diversity, reflecting a more balanced distribution of species and indicating a richer and more complex ecological landscape. (b) The alpha diversity of the studied ecosystem is evaluated through the Simpson index. This index offers a complementary perspective on biodiversity, focusing on the dominance or concentration of species within the community. A lower Simpson index indicates higher diversity, emphasizing the presence of a more evenly distributed array of species. Phylogeny of Uterine Viruses To discover more details about viruses within the uterine lumen, we performed comprehensive virome profiling of the uterine samples by mapping 2789 contigs against the NR-V database to make sure we covered prophages. 513 previously predicted viral contigs were utilized to build a phylogenetic tree by MATLAB software and ITOL 22 . Two main branches were generated, and trees were built for both (data not shown). This further indicates there are many unknown viral species in the uterine environment. The relationships between some viruses are close, suggesting that they probably evolved from the same organism or mutated into a new virus. Bacterial Host Prediction for Equine Uterine Phages We predicted the most likely bacterial host for the phages we obtained from equine uteri. First, we screened our contigs with the CRISPRCasdb spacer database to select all potential host information. Then, the phage-bacteria interaction database, Microbe Versus Phage (MVP) was used to arrange the similarities between contigs and known virus sequences. Finally, correlation was applied to predict the bacterial host for the contigs. The core hosts we found were Clostridiales at order level, and Streptococcus and Staphylococcus at genus level, which parallels our previous equine uterine microbiome study 13 . Presence of Antibiotic Resistance Genes in Equine Uterine Virome Investigating the uterine viral sequences further, we employed a method based on ORFs annotation for subsequent analysis of related community functions 23 . Using BWA-MEME 24 , the effective data of each sample after removing the host sequence were compared to the initial ORFs set of each sample. The number of reads of a gene in each sample were calculated. According to the comparison results, ORFs of each sample were filtered. Dereplication was performed with CD-HIT 25 using global identity threshold of 99%. A total of 463 ORFs were predicted by Prokka 26 . Antibiotic resistance genes were annotated by Comprehensive Antibiotic Research Database (CARD) and Resistance Gene Identifier 27 . Although antibiotics do not have direct effect on viruses, studies have found that viromes from a variety of environments carry antibiotic resistance genes 28 . As suggested by multiple studies 29 , 30 , bacteriophages may play a role in horizontal transfer of genes conferring antibiotic resistance to bacteria. Therefore, it is particularly important to detect drug resistance factors within viral functional genes. The core antibiotic resistance genes detected in the uterine viruses were gene 88 and gene 163, being involved with resistance to one or more antibiotics ( Figures 5(a) & 5(d) ) by target modification mechanisms ( Figures 5(b) & 5(e) ). The most predicted antibiotic resistance is to lincosamides, macrolides, and streptogramin ( Figure 5(c) ). Download figure Open in new tab Download figure Open in new tab Figure 5. (a) The resistance mechanism of antibiotic genes illuminating the strategies employed by these genes to confer resistance to antimicrobial agents. The identification of core antibiotic genes in uterine viruses associated with target modification mechanisms indicates a prevalent strategy within the microbial community to evade the effects of antibiotics. (b) The abundance of antibiotic genes within the viral genome is highlighted, providing a comprehensive view of the prevalence and distribution of these resistance determinants among viral elements. The identification of core antibiotic genes, specifically gene 88 and gene 163, within the uterine viruses signifies their prominent role in conferring antibiotic resistance within the microbial community associated with the uterus. (c) An exploration is undertaken to identify the most likely resistant drugs associated with the antibiotic genes under consideration. The most predicted antibiotic resistance in the study is to lincosamides, macrolides, and streptogramin, highlighting the prevalence of resistance mechanisms against these classes of antibiotics within the analyzed microbial community. (d) Antibiotic Resistance Ontology. (e) An exploration is undertaken to identify the most likely resistant drugs associated with the antibiotic genes under consideration. The most predicted antibiotic resistance in the study is to lincosamides, macrolides, and streptogramin, highlighting the prevalence of resistance mechanisms against these classes of antibiotics within the analyzed microbial community. Discussion To date, genome sequencing has made remarkable contributions to the fields of microbiology, biology, and physiology, leading some to state that all organisms are metaorganisms 31 . The microbiota, microbial communities within and on the animal body, are regarded as an integral part of the metaorganism blueprint and play important roles in determining the health of animals 4 . The population and diversity of the virome has a major impact on the community of hostile microbes and pathobionts. In this study, we have obtained and analyzed more than 500 high-quality equine uterine viral contigs. To the best of our knowledge, we present the first uterine virome in a mammal. As expected, majority of the viral contigs (n=462) were identified using DeepVirFinder 19 that predicts viral sequences using deep learning and building convoluted neural networks without relying on reference databases. We identified 78 contigs using VirSorter, that relies on comparing sequences to known virus and virus-like sequences. Only 27 contigs were identified by both programs. As it is estimated that a vast majority of viruses that exist are yet to be identified 32 , this result was expected and was the experience of a few other studies 33 , 34 . The uterus has traditionally been considered a sterile environment. Although being far less robustly populated than the gut or the vagina, uterine microbiomes have been previously described. Our approach ( Figure 1 ) allowed us to capture viral genomes from this comparatively sparse, yet more diversly colonized environment. Since the uterus is relatively understudied, we were unable to classify many contigs below Family level, although we have assigned several contigs to different genera and species, they represented only a fraction of the identified viruses. Over 75% of the assembled genomes represented novel species. The uterine endometrium hosts a highly diverse and novel viral population. The most abundant family found is Papillomavirus, a double strand DNA virus. This virus has previously been reported in cutaneous lesions on the horse 35 , and this is the first report of it being found in the uterus. It should be noted that this virus, and closely related (almost identical) bovine papilloma virus, have been associated with sarcoid, squamous cell carcinoma/genital papillomatosis in the horse 36 and associated with similar lesions in the human uterine environment 37 . This is the first time the single strand RNA virus families of Astroviridae and Caliciviridae, have been identified in horses. We believe there are still many other viruses within the uterus remaining to be identified and studied. There are also abundant phage families that have been discovered in this study, such as Microviridae, Siphoviridae, Podoviridae and others, which suggest the possibility of the use of these native phages in targeted non-antibiotic therapy of reproductive infectious diseases in the future. This opens the door to further studies in this area. Multiple Displacement Amplification (MDA) that was used to amplify viral DNA is known to preferentially amplify certain DNA sequences over others 38 , 39 . Consequentially, the relative composition of different viral families identified in this study may have been influenced by our methodology. We limited our samples to healthy animals at a single stage of estrous cycle that minimizes ascending migration of vaginal microorganisms. We only sampled 12 animals and they were all from the same facility and in the same geographical area. As such, we are certain that the uterine virome of horses is much more diverse than is reported in this study. Our goal was to establish that a diverse and complex native virome exists in a mammalian uterus and we have successfully accomplished that goal. We were surprised by the prevalence and diversity of antibiotic resistance genes we found in viral genomes. Although having antibiotic resistance genes does not directly affect the virus, antibiotic disease gene prevalence among viral genomes has been observed before 28 , 29 , 30 . Although it was outside the scope of this work, checking if any of the uterine bacteria had acquired the same resistance elements would be interesting. Antibiotic resistant microbes are threatening the treatment of infectious diseases. At present, the identification of drug resistance genes can help us understand drug resistance mechanisms and provide references for disease treatment and drug development. Our study reveals that antibiotic resistance genes also reside in viral genomes. The predicted resistance mechanism of the antibiotic gene family reflects the co-evolution between bacteria and viruses. This suggests the existence of gene flow networks between phylogenetically distinct bacterial and viral species in the uterus. In this study, we also found that the uterine viral contigs were separated into 2 main clades. This result highlights the importance of building a well-established uterine virome database, as the combined effect sizes of highly related phage genomes can help reveal the association of specific clades with their bacterial hosts and animal health 40 . Methods Topical subheadings are allowed. Authors must ensure that their Methods section includes adequate experimental and characterization data necessary for others in the field to reproduce their work. Animals and Sample Collection Twelve healthy mares from Oklahoma were selected for sample collection in this study. Mares were between 3 and 14 years of age, with clinically normal reproductive tracts. Mares were sampled in a single day during the normal breeding season (mid-spring in the northern hemisphere) during the luteal phase of their estrous cycle (diestrus) between day 7 and 10 post-ovulation. At this time, under the influence of progesterone the cervix is closed and sulfomucins significantly reduces the potential for transcervical migration of vaginal bacteria. All mares had the same diet for at least 2 months before sample collection. None of the mares had recent antiviral or antibiotic exposure. All mares had uterine luminal endometrial microbiota samples collected via 150 ml of saline infused through a triple guarded system, where the sample collection catheters were protected from the vestibular and vaginal environment and brought to the external os of the cervix inside a sterile disposable vaginal speculum. The sample collection catheter was a stallion urinary catheter (Jorgensen Labs, Loveland, CO, USA) inserted within a 36 Fr. 70 cm equine embryo flush catheter (IMV Technologies, Holland, MI, USA) which served as the second guard to prevent contamination from the cervical external os and lumen. The embryo flush catheter was inserted into the cervix to the level of the internal cervical os, the balloon inflated with∼50 mL of air to seal the cervix, and then the urinary catheter advanced into the uterine lumen. Saline was infused, massaged within the lumen, and collected from the uterus via gravity flow. A mid-stream catch of approximately 50 mL was collected into sterile 50 mL conical tubes and immediately capped and placed on ice. The urinary catheter was then retracted into the flush catheter, and both retracted into the speculum, before removal back through the vaginal vault. This small volume lavage sampling technique has been shown to have the highest return rate for microbial collection 41 . We enhanced the guarded protection from potential vestibulovaginal contamination by adding the disposable speculum to the collection process. All samples were collected on a single day in the same facility and processed together to eliminate a batch effect. A saline sample was flushed through the catheter at the time of collection as well as a second aliquot of the same batch of saline was processed alongside regular samples throughout the experimental protocol as negative controls. Animal use and sample collection procedures were approved by the Oklahoma State University Institutional Animal Care and Use Committee. An overview of the experimental workflow described in this manuscript is provided in ( Figure 1 ). Viral Nucleic Acid Isolation and Amplification Lavage samples were decanted and sequentially filtered through a 0.45 µ m and 0.22 µ m filter by using Vacuum Driven Sterile Filter (Millipore Steriflip, Burlington, MA, USA). Viral particles were enriched by using ultracentrifuge and Pellet Paint ® Co-Precipitant (Novagen, Madison, WI). Viral enrichments were nuclease treated at 37°C for 90 minutes to remove contaminating free floating DNA and RNA. Nucleic acid was extracted from viral enrichments using the QIAamp UltraSens Virus Kit (Qiagen, Germantown, MD, USA) and following the manufacturer’s protocol. Quantifying the purified Viral nucleic acids was done using a NanoDrop ND-1000 spectrophotometer (NanoDrop Technologies, Wilmington, DE, USA). A 25-ng aliquot of purified nucleic acid was used as template for amplification using the REPLI-g Mini Kit (Qiagen, Germantown, MD, USA). Nucleic acid quantification was done using a Qubit 3.0 Fluorometer (Thermo Fisher Scientific, Waltham, MA, USA). Amplified samples were kept at 4°C for short-term storage. cDNA Synthesis and Library Preparation Up to 1 µ g template RNA and ProtoScript ® II First Strand cDNA Synthesis Kit (New England Biolabs, Ipswich, MA, USA) were used in first strand cDNA synthesis following kit protocols. The second strand cDNA synthesis was done using NEBNext Ultra II Non-Directional RNA Second Strand Synthesis Module (New England Biolabs Inc.) according to the kit protocols. Metagenomic library preparation was performed using the NEBNext Ultra II Library Prep Kit (#E7645L) and Index Primers (#E7500S and #E7335L) from New England Biolabs. The protocol associated with these kits was used. Briefly, each library sample was quantified and run on a bioanalyzer to establish library molarity (nM) for sequencing. Samples were diluted to equivalent molarities and pooled for sequencing via Illumina HiSeq 2500 platform. The raw sequencing data used in this study is available at the Sequence Read Archive (SRA) of NCBI under the Project number PRJNA1122187 and accession numbers SAMN41777987-993. Quality Control and Metagenomic Assembly To ensure data quality and avoid erroneous results, sequencing data needs to be quality filtered and preprocessed before use in subsequent analyses. FastQC 42 software was used to evaluate the quality of sequencing data. Then, a common NGS quality control tool, Trimmomatic 43 was used for pretreatment including filtering low-quality reads, removing low-quality bases and unrecognized base (N) at the end of reads, removing sequencing adapters, removing short sequences etc. In order to avoid host contamination, sequence were further quality-filtered with the latest equine database EquCab3 by using Bowtie 2 44 and Samtools 45 to remove the host sequences. MetaSPAdes 46 was then used to assemble the paired-end reads. Viral Sequence Prediction VIBRANT 18 was used to analyze the contigs larger than 10kb and predict viral sequences since it can process large metagenomic assemblies based on combined machine learning and protein similarity approach. VirSorter 20 was used to identify the virus contigs and to detect prophages by aligning a clean read with the NT (Nucleotide Sequence Database) library of non-redundant sequences through BLAST and aligned sequences that are homologous to viruses and bacteria. Groups included were dsDNAphage, NCLDV, RNA, ssDNA and lavidaviridae. A minimum score of 0.5 was used. Category 1, 2, 4, 5 were considered from VirSorter prediction. DeepVirFinder 19 ] was used for deep learning to distinguish viral from bacterial contigs. Contigs with score > 0.9 and p-value < 0.01 were considered from DeepVirFinder prediction. Contigs Annotation, Clustering and Taxonomy Viral genomes were annotated with Prokka 26 ] by using viral kingdom. Based on identifying coordinates of genomic features within contigs, Prokka can annotate genes and save the information in standards-compliant output files. vConTACT2 47 was used to form clusters by creating mapping file as it has been widely used to group phage sequences into clusters roughly corresponding to the genus level. Comparative Annotation Toolkit (CAT) 21 , using long read for taxonomic classification was used to provide taxonomic context of contigs. The function of the dereplicated genes were annotated by eggNOG database 48 , KEGG 49 and CAZy database 50 . Kraken2 and Bracken was used to calculate species abundance 51 . Abundance was calculated by first classifying the sequence using Kraken2 and then estimating the abundance of each species with Bracken. Contig-based analyses were performed using Contig Annotation Tool (CAT) 52 . Bacterial Host Prediction and Antibiotic Resistance Gene Detection Bacterial hosts were predicted by using the spacer sequence library from the CRISPRCasdb database and conducting a blastn-short comparison on assembled contig sequences to identify potential phage hosts 53 . Microbe versus Phage (MVP) database was used to build the database of phage-prokaryotic interactions 54 . Author contributions statement Must include all authors, identified by initials, for example: A.A. conceived the experiment(s), A.A. and B.A. conducted the experiment(s), C.A. and D.A. analysed the results. All authors reviewed the manuscript. Additional information To include, in this order: Accession codes (where applicable); Competing interests (mandatory statement). The corresponding author is responsible for submitting a competing interests statement on behalf of all authors of the paper. This statement must be included in the submitted article file. Acknowledgements (not compulsory) Acknowledgements should be brief, and should not include thanks to anonymous referees and editors, or effusive comments. Grant or contribution numbers may be acknowledged. References 1. ↵ Rohwer , F. , Prangishvili , D. & Lindell , D. Roles of viruses in the environment ( 2009 ). 2. ↵ Krupovic , M. , Prangishvili , D. , Hendrix , R. W. & Bamford , D. H. Genomics of bacterial and archaeal viruses: dynamics within the prokaryotic virosphere . Microbiol. molecular biology reviews 75 , 610 – 635 ( 2011 ). OpenUrl CrossRef 3. ↵ Liang , G. & Bushman , F. D. The human virome: assembly, composition and host interactions . Nat. Rev. Microbiol . 19 , 514 – 527 ( 2021 ). OpenUrl CrossRef PubMed 4. ↵ García-Velasco , J. A. , Menabrito , M. & Catalán , I. B. What fertility specialists should know about the vaginal microbiome: a review . Reproductive biomedicine online 35 , 103 – 112 ( 2017 ). OpenUrl CrossRef PubMed 5. ↵ Wolfrom , M. L. Clamp , J. R. , Hough , L. , Hickson , J. L. & Whistler , R. L. Lactose . In Wolfrom , M. L. (ed.) Advances in Carbohydrate Chemistry , vol. 16 , 159 – 206 , DOI: 10.1016/S0096-5332(08)60262-3 ( Academic Press , 1962 ). OpenUrl CrossRef 6. Heinonen , P. et al. Anatomic sites of upper genital tract infection . Obstet. & Gynecol . 66 , 384 – 390 ( 1985 ). OpenUrl PubMed Web of Science 7. Eschenbach , D. A. , Rosene , K. , Tompkins , L. , Watkins , H. & Gravett , M. G. Endometrial cultures obtained by a triple-lumen method from afebrile and febrile postpartum women . J. Infect. Dis . 153 , 1038 – 1045 ( 1986 ). OpenUrl CrossRef PubMed 8. Hemsell , D. , Obregon , V. , Heard , M. & Nobles , B. Endometrial bacteria in asymptomatic, nonpregnant women . The J. reproductive medicine 34 , 872 – 874 ( 1989 ). OpenUrl 9. Møller , B. R. , Kristiansen , F. V. , Thorsen , P. , Frost , L. & Mogensen , S. C. Sterility of the uterine cavity . Acta obstetricia et gynecologica Scand . 74 , 216 – 219 ( 1995 ). OpenUrl CrossRef 10. ↵ Verstraelen , H. et al. Characterisation of the human uterine microbiome in non-pregnant women through deep sequencing of the v1-2 region of the 16s rrna gene . PeerJ 4 , e1602 ( 2016 ). OpenUrl CrossRef PubMed 11. ↵ Wang , M.-L. et al. Uterine microbiota of dairy cows with clinical and subclinical endometritis . Front. microbiology 9 , 2691 ( 2018 ). OpenUrl CrossRef 12. ↵ Lyman , C. et al. Canine endometrial and vaginal microbiomes reveal distinct and complex ecosystems . PLoS One 14 , e0210157 ( 2019 ). OpenUrl CrossRef PubMed 13. ↵ Holyoak , G. et al. The healthy equine uterus harbors a distinct core microbiome plus a rich and diverse microbiome that varies with geographical location . Sci. reports 12 , 14790 ( 2022 ). OpenUrl 14. ↵ Zhang , H.-T. , Wang , H. , Wu , H.-S. , Zeng , J. & Yang , Y. Comparison of viromes in vaginal secretion from pregnant women with and without vaginitis . Virol. J . 18 , 1 – 9 ( 2021 ). OpenUrl CrossRef PubMed 15. ↵ Jakobsen , R. R. et al. Characterization of the vaginal dna virome in health and dysbiosis . Viruses 12 , 1143 ( 2020 ). OpenUrl CrossRef PubMed 16. ↵ Happel , A.-U. , Varsani , A. , Balle , C. , Passmore , J.-A. & Jaspan , H. The vaginal virome—balancing female genital tract bacteriome, mucosal immunity, and sexual and reproductive health outcomes? Viruses 12 , 832 ( 2020 ). OpenUrl CrossRef PubMed 17. ↵ Kaelin , E. A. et al. Cervicovaginal dna virome alterations are associated with genital inflammation and microbiota composition . Msystems 7 , e00064 – 22 ( 2022 ). OpenUrl PubMed 18. ↵ Kieft , K. , Zhou , Z. & Anantharaman , K. Vibrant: automated recovery, annotation and curation of microbial viruses, and evaluation of viral community function from genomic sequences . Microbiome 8 , 1 – 23 ( 2020 ). OpenUrl CrossRef PubMed 19. ↵ Ren , J. et al. Identifying viruses from metagenomic data using deep learning . Quant. Biol . 8 , 64 – 77 ( 2020 ). OpenUrl CrossRef PubMed 20. ↵ Roux , S. , Enault , F. , Hurwitz , B. L. & Sullivan , M. B. Virsorter: mining viral signal from microbial genomic data . PeerJ 3 , e985 ( 2015 ). OpenUrl CrossRef PubMed 21. ↵ Fiddes , I. T. et al. Comparative annotation toolkit (cat)—simultaneous clade and personal genome annotation . Genome research 28 , 1029 – 1038 ( 2018 ). OpenUrl Abstract / FREE Full Text 22. ↵ Letunic , I. & Bork , P. Interactive tree of life (itol) v5: an online tool for phylogenetic tree display and annotation . Nucleic acids research 49 , W293 – W296 ( 2021 ). OpenUrl CrossRef PubMed 23. ↵ Hu , Q. et al. Effects of low-dose antibiotics on gut immunity and antibiotic resistomes in weaned piglets . Front. Immunol . 11 , 903 ( 2020 ). OpenUrl CrossRef PubMed 24. ↵ Jung , Y. & Han , D. Bwa-meme: Bwa-mem emulated with a machine learning approach . Bioinformatics 38 , 2404 – 2413 ( 2022 ). OpenUrl CrossRef PubMed 25. ↵ Fu , L. , Niu , B. , Zhu , Z. , Wu , S. & Li , W. Cd-hit: accelerated for clustering the next-generation sequencing data . Bioinformatics 28 , 3150 – 3152 ( 2012 ). OpenUrl CrossRef PubMed Web of Science 26. ↵ Seemann , T. Prokka: rapid prokaryotic genome annotation . Bioinformatics 30 , 2068 – 2069 ( 2014 ). OpenUrl CrossRef PubMed Web of Science 27. ↵ Alcock , B. P. et al. Card 2020: antibiotic resistome surveillance with the comprehensive antibiotic resistance database . Nucleic acids research 48 , D517 – D525 ( 2020 ). OpenUrl CrossRef PubMed 28. ↵ Colombo , S. et al. Viromes as genetic reservoir for the microbial communities in aquatic environments: a focus on antimicrobial-resistance genes . Front. microbiology 8 , 1095 ( 2017 ). OpenUrl CrossRef 29. ↵ Muniesa , M. , Colomer-Lluch , M. & Jofre , J. Potential impact of environmental bacteriophages in spreading antibiotic resistance genes . Futur. microbiology 8 , 739 – 751 ( 2013 ). OpenUrl CrossRef 30. ↵ Chen , Q. et al. Bacteriophage and bacterial susceptibility, resistance, and tolerance to antibiotics . Pharmaceutics 14 , 1425 ( 2022 ). OpenUrl CrossRef PubMed 31. ↵ Sieber , M. et al. Neutrality in the metaorganism . PLoS Biol . 17 , e3000298 ( 2019 ). OpenUrl CrossRef PubMed 32. ↵ Paez-Espino , D. et al. Uncovering earth’s virome . Nature 536 , 425 – 430 ( 2016 ). OpenUrl CrossRef PubMed 33. ↵ Alcalá Briseño , R. I. et al. Translating virome analyses to support biosecurity, on-farm management, and crop breeding . Front. Plant Sci . 14 , 1056603 ( 2023 ). OpenUrl CrossRef PubMed 34. ↵ Hegarty , B. et al. Benchmarking informatics approaches for virus discovery: caution is needed when combining in silico identification methods . Msystems 9 , e01105 – 23 ( 2024 ). OpenUrl CrossRef PubMed 35. ↵ Postey , R. C. , Appleyard , G. D. & Kidney , B. A. Evaluation of equine papillomas, aural plaques, and sarcoids for the presence of equine papillomavirus dna and papillomavirus antigen . Can. journal veterinary research 71 , 28 ( 2007 ). OpenUrl 36. ↵ Peters-Kennedy , J. , Lange , C. , Rine , S. & Hackett , R. Equus caballus papillomavirus 8 (ec pv 8) associated with multiple viral plaques, viral papillomas, and squamous cell carcinoma in a horse . Equine veterinary journal 51 , 470 – 474 ( 2019 ). OpenUrl CrossRef PubMed 37. ↵ Olusola , P. , Banerjee , H. N. , Philley , J. V. & Dasgupta , S. Human papilloma virus-associated cervical cancer and health disparities . Cells 8 , 622 ( 2019 ). OpenUrl CrossRef PubMed 38. ↵ Ahsanuddin , S. et al. Assessment of repli-g multiple displacement whole genome amplification (wga) techniques for metagenomic applications . J. biomolecular techniques: JBT 28 , 46 ( 2017 ). OpenUrl CrossRef 39. ↵ Borgström , E. , Paterlini , M. , Mold , J. E. , Frisen , J. & Lundeberg , J. Comparison of whole genome amplification techniques for human single cell exome sequencing . PloS one 12 , e0171566 ( 2017 ). OpenUrl CrossRef PubMed 40. ↵ Camarillo-Guerrero , L. F. , Almeida , A. , Rangel-Pineros , G. , Finn , R. D. & Lawley , T. D. Massive expansion of human gut bacteriophage diversity . Cell 184 , 1098 – 1109 ( 2021 ). OpenUrl CrossRef PubMed 41. ↵ Dezzutti , C. S. et al. Performance of swabs, lavage, and diluents to quantify biomarkers of female genital tract soluble mucosal mediators . PloS one 6 , e23136 ( 2011 ). OpenUrl CrossRef PubMed 42. ↵ Andrews , S. Fastqc: A quality control tool for high throughput sequence data [online].” fastqc,” ( 2015 ). 43. ↵ Bolger , A. M. , Lohse , M. & Usadel , B. Trimmomatic: a flexible trimmer for illumina sequence data . Bioinformatics 30 , 2114 – 2120 ( 2014 ). OpenUrl CrossRef PubMed Web of Science 44. ↵ Langdon , W. B. Performance of genetic programming optimised bowtie2 on genome comparison and analytic testing (gcat) benchmarks . BioData mining 8 , 1 – 7 ( 2015 ). OpenUrl CrossRef PubMed 45. ↵ Etherington , G. J. , Ramirez-Gonzalez , R. H. & MacLean , D. bio-samtools 2: a package for analysis and visualization of sequence and alignment data with samtools in ruby . Bioinformatics 31 , 2565 – 2567 ( 2015 ). OpenUrl CrossRef PubMed 46. ↵ Aw , T. G. , Howe , A. & Rose , J. B. Metagenomic approaches for direct and cell culture evaluation of the virological quality of wastewater . J. virological methods 210 , 15 – 21 ( 2014 ). OpenUrl CrossRef 47. ↵ Bolduc , B. et al. vcontact: an ivirus tool to classify double-stranded dna viruses that infect archaea and bacteria . PeerJ 5 , e3243 ( 2017 ). OpenUrl CrossRef PubMed 48. ↵ Huerta-Cepas , J. et al. eggnog 5.0: a hierarchical, functionally and phylogenetically annotated orthology resource based on 5090 organisms and 2502 viruses . Nucleic acids research 47 , D309 – D314 ( 2019 ). OpenUrl CrossRef PubMed 49. ↵ Kanehisa , M. & Goto , S. Kegg: kyoto encyclopedia of genes and genomes . Nucleic acids research 28 , 27 – 30 ( 2000 ). OpenUrl CrossRef PubMed Web of Science 50. ↵ Drula , E. et al. The carbohydrate-active enzyme database: functions and literature . Nucleic acids research 50 , D571 – D577 ( 2022 ). OpenUrl CrossRef PubMed 51. ↵ Dimopoulos , E. A. et al. Haystac: A bayesian framework for robust and rapid species identification in high-throughput sequencing data . PLOS Comput. Biol . 18 , e1010493 ( 2022 ). OpenUrl CrossRef PubMed 52. ↵ Cambuy , D. D. , Coutinho , F. H. & Dutilh , B. E. Contig annotation tool cat robustly classifies assembled metagenomic contigs and long sequences . BioRxiv 072868 ( 2016 ). 53. ↵ Pourcel , C. et al. Crisprcasdb a successor of crisprdb containing crispr arrays and cas genes from complete genome sequences, and tools to download and query lists of repeats and spacers . Nucleic acids research 48 , D535 – D544 ( 2020 ). OpenUrl CrossRef PubMed 54. ↵ Gao , N. L. et al. Mvp: a microbe–phage interaction database . Nucleic acids research 46 , D700 – D707 ( 2018 ). OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted February 28, 2025. Download PDF Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Mammalian Uteri Contain a Diverse Virome: Insights from Healthy Mares Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Mammalian Uteri Contain a Diverse Virome: Insights from Healthy Mares Lulu Guo , G. Reed Holyoak , Udaya DeSilva bioRxiv 2025.02.26.640264; doi: https://doi.org/10.1101/2025.02.26.640264 Share This Article: Copy Citation Tools Mammalian Uteri Contain a Diverse Virome: Insights from Healthy Mares Lulu Guo , G. Reed Holyoak , Udaya DeSilva bioRxiv 2025.02.26.640264; doi: https://doi.org/10.1101/2025.02.26.640264 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Microbiology Subject Areas All Articles Animal Behavior and Cognition (7635) Biochemistry (17691) Bioengineering (13892) Bioinformatics (41937) Biophysics (21452) Cancer Biology (18589) Cell Biology (25504) Clinical Trials (138) Developmental Biology (13378) Ecology (19899) Epidemiology (2067) Evolutionary Biology (24320) Genetics (15609) Genomics (22506) Immunology (17736) Microbiology (40394) Molecular Biology (17181) Neuroscience (88605) Paleontology (666) Pathology (2832) Pharmacology and Toxicology (4824) Physiology (7641) Plant Biology (15156) Scientific Communication and Education (2045) Synthetic Biology (4294) Systems Biology (9825) Zoology (2271)
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.