A Simple and Cost-Effective Protocol for Enriching ’Ca. Saccharimonadia’ from Human Saliva to Enable Efficient Genome Sequencing

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 41,644 characters · extracted from preprint-html · click to expand
A Simple and Cost-Effective Protocol for Enriching ’Ca. Saccharimonadia’ from Human Saliva to Enable Efficient Genome Sequencing | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results A Simple and Cost-Effective Protocol for Enriching ’ Ca . Saccharimonadia’ from Human Saliva to Enable Efficient Genome Sequencing Clara Bonaiti , Simona Panelli , Giorgia Bettoni , Lodovico Sterzi , Diego Marco Minore , Stella Papaleo , Enza D’Auria , Gianvincenzo Zuccotti , Francesco Comandatore doi: https://doi.org/10.1101/2025.07.17.665291 Clara Bonaiti 1 Department of Biomedical and Clinical Sciences, “Romeo ed Enrica Invernizzi” Pediatric Clinical Research Center, University of Milan , Milan, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site Simona Panelli 1 Department of Biomedical and Clinical Sciences, “Romeo ed Enrica Invernizzi” Pediatric Clinical Research Center, University of Milan , Milan, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site Giorgia Bettoni 1 Department of Biomedical and Clinical Sciences, “Romeo ed Enrica Invernizzi” Pediatric Clinical Research Center, University of Milan , Milan, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site Lodovico Sterzi 1 Department of Biomedical and Clinical Sciences, “Romeo ed Enrica Invernizzi” Pediatric Clinical Research Center, University of Milan , Milan, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site Diego Marco Minore 1 Department of Biomedical and Clinical Sciences, “Romeo ed Enrica Invernizzi” Pediatric Clinical Research Center, University of Milan , Milan, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site Stella Papaleo 1 Department of Biomedical and Clinical Sciences, “Romeo ed Enrica Invernizzi” Pediatric Clinical Research Center, University of Milan , Milan, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site Enza D’Auria 1 Department of Biomedical and Clinical Sciences, “Romeo ed Enrica Invernizzi” Pediatric Clinical Research Center, University of Milan , Milan, Italy 2 Department of Pediatrics, Vittore Buzzi Children’s Hospital, University of Milan , Milan, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site Gianvincenzo Zuccotti 1 Department of Biomedical and Clinical Sciences, “Romeo ed Enrica Invernizzi” Pediatric Clinical Research Center, University of Milan , Milan, Italy 2 Department of Pediatrics, Vittore Buzzi Children’s Hospital, University of Milan , Milan, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site Francesco Comandatore 1 Department of Biomedical and Clinical Sciences, “Romeo ed Enrica Invernizzi” Pediatric Clinical Research Center, University of Milan , Milan, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: francesco.comandatore{at}unimi.it Abstract Full Text Info/History Metrics Preview PDF Abstract Background “Candidatus Saccharimonadia”, a lineage within the Candidate Phyla Radiation (CPR), is characterized by small cell size, reduced genomes, and an epibiotic lifestyle dependent on bacterial hosts. Despite their presence in diverse environments, including the human oral microbiota, their role in human health remains largely unexplored. Observational studies have linked increased “ Ca . Saccharimonadia” abundance in human saliva with inflammatory conditions such as periodontitis and inflammatory bowel disease, while recent in vivo evidence suggests potential anti-inflammatory properties. Investigating “ Ca . Saccharimonadia” is challenging due to their fastidious nature, making standard culturing methods impractical. Current genomic studies rely on either co-cultivation with bacterial hosts or shotgun metagenomics, both requiring advanced technical expertise and costly resources. To address this limitation, we developed an affordable and efficient protocol for enriching “ Ca . Saccharimonadia” from human saliva samples, facilitating genome sequencing. Our protocol, termed the “ Ca . Saccharimonadia” Enrichment (SE) protocol, consists of two mandatory phases (detachment from host bacteria and weight/size-based separation) along with an optional DNA degradation phase. We validated this method on two human saliva samples. Results After SE protocol, the two saliva showed a substantial increase in “ Ca . Saccharimonadia” DNA concentration. The enriched samples enabled high-quality metagenome-assembled genomes (MAGs) to be obtained via shotgun metagenomics. Conclusions This study presents a cost-effective and scalable approach to studying “ Ca . Saccharimonadia”, overcoming prior limitations and expanding opportunities for future research on their role in human health and disease. Background “Candidatus Saccharimonadia” (formerly known as TM7 or Saccharibacteria) is one of the most studied lineages within the Candidate Phyla Radiation (CPR), a largely unexplored bacterial group which is estimated to encompass approximately 25% of all bacterial genetic variability [ 1 ]. “ Ca . Saccharimonadia” are characterised by[ 1 ] small cell size and reduced genomes, which lack several metabolic pathways [ 2 ]. Electron microscopy studies have evidenced that “ Ca . Saccharimonadia” have an epibiotic lifestyle, living on the surface of host Actinobacteriota [3, 4] . This suggests a strict metabolic relationship between “ Ca . Saccharimonadia” and the bacterial host. “ Ca . Saccharimonadia” inhabit diverse environments, including water, soil, animals, and are also a recognized component of the human microbiota, residing in the oral cavity, skin, and the gastrointestinal tract [ 5 ]. Various studies have shown that “ Ca . Saccharimonadia” abundance in the oral cavity increases in dysbiotic microbiomes associated with various human inflammatory diseases, including periodontitis, vaginosis and inflammatory bowel diseases [ 6 – 8 ]. On the other hand, experimental evidence revealed that “ Ca . Saccharimonadia” exhibit anti-inflammatory activities [ 9 ], also by inhibiting Tumour Necrosis Factor (TNF)-α production in human macrophages [ 3 ]. Coherently, D’Auria and colleagues (2023) found that “ Ca . Saccharimonadia” are enriched in the oral microbiota of children suffering from food allergy, in comparison to healthy controls [ 10 ]. Unfortunately, “ Ca . Saccharimonadia”, as the other CPR bacteria, are fastidious to culture in standard laboratory conditions [ 11 ]. At the state of the art, only a few successful cultivations are reported in literature [ 3 , 12 , 13 ]. This strongly hampers the investigation of “ Ca . Saccharimonadia” physiology and its impact on human health. Comparative genomics can aid in reconstructing the metabolic pathways of “ Ca . Saccharimonadia” and provide insights into their evolution. Currently, genome sequences of these bacteria can be obtained through two approaches: either by co-culturing “ Ca . Saccharimonadia” with their Actinobacteriota host or by using shotgun metagenomics [ 3 , 12 , 14 ]. Both approaches require advanced skills and expensive equipment. The co-cultivation of “ Ca . Saccharimonadia” can be performed only in very specific conditions, very challenging to achieve. Furthermore, considering that “ Ca . Saccharimonadia” represents ∼5% in the human oral microbiota [ 5 ], the sequencing of their entire genomes by shotgun metagenomics can require a remarkable sequencing depth, increasing the cost and the informatic effort. At the state of the art, protocols relying on vortexing, filtering and concentrating CPR cells with a final ultra-centrifugation, have been used as preparatory steps for the co-culturing of “ Ca . Saccharimonadia” with their hosts [ 12 , 13 ]. However, these approaches have never been used as a culture-independent way to obtain “Ca. Saccharimonadia” genomes. Building on these protocols, we developed an affordable and efficient protocol for the enrichment of “ Ca . Saccharimonadia” from human saliva, for genome sequencing purposes. We tested the protocol on two human saliva samples, resulting in a substantial enrichment of the “ Ca . Saccharimonadia” and the generation of two high-quality genome assemblies, without requiring deep metagenomics sequencing. Methods Ethics statement The two saliva samples used in this study were obtained from two children recruited as part of the control population in a study aimed at describing the alteration of oral microbiota in children suffering from food allergies [ 10 ]. Participants to the study were recruited at the Pediatric Clinic of the Vittore Buzzi Children’s Hospital (Milan, Italy). The study was conducted according to the Declaration of Helsinki, and all the methods followed the relevant guidelines and regulations. The Ethical Committee of ASST-Fatebenefratelli-Sacco approved the study (Ref. 2021/ST/041). The privacy rights of subjects have been observed. The parents of the recruited children signed an informed consent. Human saliva sampling and collection For each child, two ml of saliva were collected in a sterile container upon awakening, prior to any drinking, eating or teeth brushing. The fresh saliva samples conferred to the hospital were immediately subjected to the “Ca . Saccharimonadia ” enrichment protocol (from here “SE protocol”) described below. “Ca. Saccharimonadia” enrichment protocol To enrich “ Ca . Saccharimonadia” from human saliva samples, we leverage two distinctive traits of these bacteria: the ability to survive on the surface of other bacteria and the small size, along with a resilient cell wall that withstands chemical and physical stresses [ 15 ]. The SE protocol is composed of three phases: two mandatory (Phase I and Phase II) and one optional (Phase III). Phase I: detachment of “Ca . Saccharimonadia ” from the surface of host bacteria; Phase II: weight and size-based separation of cells by centrifugation and filtering; Phase III (optional): final removal of free DNA. All these steps are performed manually, prior to DNA extraction. Phase I (the detachment of “ Ca . Saccharimonadia”) consists in vortexing one ml of fresh saliva in a two-ml tube for 10 minutes. Phase II (separation of the cells on the basis of weight and size) consists in three main steps: 1) Centrifuge at 2600 x g for 15 minutes; 2) Discard the pellet and filter the supernatant through a 0.45 μm filter; 3) Centrifuge the filtrate at 16,900 x g for 1 hour at 4 ° C. These steps are expected to lead to the lysis of several cells, in particular those having a less resistant wall, including eukaryotic cells and gram negative bacteria. To eliminate free DNA, we added an optional third phase using Propidium Monoazide (PMA), a DNA intercalator that degrades DNA upon exposure to 465–475 nm light [ 16 ]. Phase III is composed by three steps: 1) the pellet obtained from the centrifugation in Phase II-step 3 is resuspended in 150µl of sterile water by pipetting and vortexing, and left at room temperature for 5 minutes (this step is expected to osmotically lyse mammalian cells); 2) PMA is added to a final concentration of 10µM (7.5µl of the 0.2mM stock) and samples are briefly vortexed, then incubated in the dark at room temperature for 5 minutes; 3) samples are finally placed horizontally on ice, 20cm away from a standard bench top fluorescent light (we used the WESTLITE Flashlight LED Blue 470 nm) for 25 minutes, with rotation every 5 minutes. The two samples included in the study underwent both a protocol which included only Phase 1 and Phase 2 (from here “SE-short protocol”) and a “SE-long protocol”, which included all three phases. Each SE experiment was performed on two technical replicates for each of the two subjects, and the samples were subsequently stored at -20 ° C. A graphical representation of the protocols are reported in Figure 1 . Download figure Open in new tab Figure 1. The “Ca. Saccharimonadia” Enrichment (SE) protocol Graphical representation of the “Ca. Saccharimonadia” Enrichment (SE) protocol, which consists of three phases following fresh saliva sampling: Phase I involves vortexing saliva to detach the target cells; Phase II separates cells by centrifugation and filtration based on size and weight; Phase III (optional) uses Propidium Monoazide (PMA) to eliminate free DNA through light exposure (465–475 nm). The SE-long protocol contains all the three phases, while SE-short only the first two phases. Both SE-short and SE-long protocols are followed by DNA extracted, Multiple Displacement Amplification (MDA), Next Generation Sequencing and genome assembly. DNA extraction, quantification and normalization DNA extractions were performed on original samples (i.e., saliva samples not subjected to the SE protocols), as well as on the samples after SE-short and SE-long protocols. DNA was extracted using the MasterPure™ Gram Positive DNA Purification Kit, following the manufacturer’s instructions, except for the Proteinase K incubation, which lasted one hour instead of 15 minutes. The lysozyme incubation lasted 30 minutes. DNA concentration was assayed with Qubit Fluorometer (Invitrogen, Waltham, Massachusetts, USA). “ Ca . Saccharimonadia” enrichments obtained by the SE-short and SE-long protocols were then evaluated by V3-V4 16S rRNA sequencing. “ Ca . Saccharimonadia” quantification by V3-V4 16S rRNA amplicon sequencing Amplicon production was performed as previously described [ 17 ]. Libraries were subjected to paired-end sequencing (2 × 300 bp format) on an Illumina MiSeq platform at BMR Genomics (Padova, Italy). The bioinformatics analysis of microbiota sequencing data was based on the Mothur pipeline [ 18 ]. Raw FASTQ files were quality-filtered using Trimmomatic [ 19 ] and high-quality reads were analysed following the SOP Mothur procedure [ 20 ]. Shotgun metagenomics One of the primary objectives of the SE protocols is to facilitate the sequencing of “ Ca . Saccharimonadia” genomes by significantly enriching them in the sample. To evaluate the efficiency of SE protocols in achieving this aim, we performed shotgun metagenomics on the most enriched “ Ca . Saccharimonadia” sample for each individual included in the study, to assemble the relative “ Ca . Saccharimonadia” strain genome. As expected, both the SE-short and SE-long protocols resulted in a substantial reduction of DNA concentration. To mitigate this issue, the DNA extracted after SE protocols was amplified using Multiple Displacement Amplification (MDA) with the Repli-g Single Cell Kit (Qiagen, Hilden, Germany), following the manufacturer’s instructions. The amplified DNA was then sequenced on an Illumina NovaSeq platform (2 × 150 bp paired-end) by Novogene (Munich, Germany). The low quality reads were trimmed out using the Trimmomatic software [ 19 ] and Metagenome-Assembled Genomes (MAGs) were obtained using the MetaWRAP pipeline [ 21 ]. The contamination and completeness of the obtained MAGs were then evaluated using the CheckM tool [ 22 ]. Then, MAGs were taxonomically assigned using the Forestax tool [ 23 ]. The gene content of the MAGs was then compared with a large collection of genome assemblies of the same genus from the Genome Taxonomy Database (GTDB) [ 24 ]. The comparison was carried out by orthologues analysis performed using the OrhoFinder tool [ 25 ]. Lastly, the metabolic capabilities of the MAGs were investigated by Clusters of Orthologous Groups (COG)-based annotation [ 26 ]. To determine the minimum number of reads required to obtain high quality “Ca. Saccharimonadia” MAGs, we repeated the MetaWRAP and Forestax pipelines on four random subsets of 5, 10, 20 and 30 million reads. Once the Saccharimonadia MAGs were obtained, the completeness, contamination, genome coverage, contig number, total length and normalized N50 (i.e. N50/total length) were compared. Results Enrichment of “Ca. Saccharimonadia” from human saliva The saliva samples collected from the two individuals were subjected to the SE-short and SE-long protocols as described above. DNA from the original samples and after the two protocols were then extracted and subjected to V3-V4 16S rRNA amplicon sequencing to quantify “ Ca . Saccharimonadia” in the samples ( Table 1 ). View this table: View inline View popup Download powerpoint Table 1. Percentage of “ Ca . Saccharimonadia” in the samples determined via V3-V4 16S rRNA amplicon sequencing The “Original” column refers to “ Ca . Saccharimonadia” percentage in the collected human saliva samples, while “SE-short” and “SE-long” columns refers to the values obtained after the SE-short and SE-long protocols, respectively. “Rep. 1” and “Rep. 2” refer to the technical replicates. Metagenome-assembled genomes (MAGs) As reported in Table 1 , the samples showing the highest “ Ca . Saccharimonadia” enrichment were the replicate 2 of the SE-long of the individual 1 (hereafter ‘sample-ind1’) and the replicate 2 of the SE-short of the individual 2 (hereafter ‘sample-ind2’). These two samples were selected for metagenomics. A total of 53,085,080 and 38,116,642 paired-end reads were obtained for sample-ind1 and sample-ind2, respectively. In the initial stage of the MetaWRAP pipeline, reads were mapped to the human reference genome assembly (Genome Reference Consortium Human Build 38, hg38, GCA_000001405) to distinguish human-derived sequences from those of other organisms, including “ Ca . Saccharimonadia”. This analysis identified 52,720,686 non-human reads for sample-ind1 (99.3% of the total) and 34,645,562 for sample-ind2 (90.8% of the total). Then, MetaWRAP pipeline subjected the non-human reads to metagenome assembly and Metagenome-Assembled Genomes (MAGs) binning, returning a total of five bins for sample-ind1 and one bin for sample-ind2. For sample-ind1, two out of five bins resulted to have completeness higher than 70% and contamination below 3%: one with completeness 95.35% and contamination 2.3%, the other with completeness 100% and contamination 2.3%. The taxonomic profiling of the two bins assigned the first one to the genus Anaeroplasma (class Bacilli) and the second one to the genus Nanosynbacter (class Saccharimonadia ). For sample-ind2, the only bin obtained resulted in the genus Nanosyncoccus (class Saccharimonadia ), with 97.67% of completeness and 0% of contamination. The gene content and quality of the Nanosynbacter genome assembly (MAG sample-ind1) was further assessed by comparing it with 36 Nanosynbacter genome assemblies from the GTDB database (Supplementary Table 1). The same was done for the Nanosyncoccus genome assembly (MAG sample-ind2), comparing it with 137 assemblies of the same genus present in GTDB (Supplementary Table 1). The results are reported in Supplementary Table 2 and Supplementary Table 3. For the Nanosynbacter genome assembly (MAG sample-ind1) (Supplementary Table 2), most parameters show values around the median of the other assemblies of the same genus in GTDB. About the Nanosyncoccus genome assembly (MAG sample-ind2) (Supplementary Table 3), the parameter values are comparable to the highest quality genome assemblies of this genus available in the GTDB database. Membrane/Wall proteins annotation The Clusters of Orthologous Genes (COG)-based annotation of the Nanosynbacter and Nanosyncoccus MAGs showed differences in the gene content related to bacterial cell wall biosynthesis (Supplementary Table 4). Specifically, the Nanosynbacter MAG (sample_ind1) lacked six genes that were present in the Nanosyncoccus MAG (sample_ind2), whereas the latter lacked 11 genes found in the former. Metagenome-assembled genomes (MAGs) quality and number of reads For each of the two samples (sample-ind1 and sample-ind2), the MAGs binning and taxonomic profiling were repeated on a random subset of 5 million, 10 million, 20 million and 30 million reads and MAG qualities were compared. The results are shown in Figure 2 . Download figure Open in new tab Figure 2. Statistics of MAGs obtained with random subset of metagenomics reads The plots report completeness (a and b), contamination (c and d), log10 of coverage (e and f), number of contigs (g and h), log10 of MAG total length (i and l), N50 normalized (N50/MAG total length) (m and m), for MAGs obtained by MetaWRAP pipeline using a random subset of 5/10/20/30 millions reads. For each plot, the last value on the right refers to all the sequenced reads (i.e. ∼53 million for Nanosymbacter MAG sample-ind1 and ∼38 million for Nanosyncoccus MAG sample-ind2). The plots a, c, e, g, i, m refer to the MAG obtained from the saliva of the individual 1, after the “Ca. Saccharimonadia” Enrichment (SE) -long protocol. Plots b, d, f, h, i and n, refer to the MAG of the individual 2, even after saliva was subjected to the SE-short protocol. The Nanosynbacter MAG (sample-ind1) reached high completeness and low contamination until 10 million reads. This is also the number of reads that gave the minimum number of contigs, without a strong reduction in the MAG total length and maintaining the coverage above 1,000X. For the Nanosyncoccus MAG (sample-ind2), a minimum of 10 million reads were sufficient to obtain high completeness (>95%), ∼50X genome coverage and an assembly total length comparable to the other assemblies obtained with more reads. Discussion Candidate Phyla Radiation (CPR) is a very large but poorly investigated bacterial lineage, found in several ecological niches, ranging from soil to the human body [ 15 ]. Observational and experimental studies suggest that CPR bacteria possess immuno-modulating properties [ 3 , 9 , 27 ]. Additionally, D’Auria et al. (2023) found CPR bacteria enriched in allergic children, indicating a potential role in the development of this immune-mediated pathology [ 10 ]. The most studied CPR class is “ Ca . Saccharimonadia”, which is commonly part of the human oral microbiota, even if with frequency ∼5% [ 5 ]. This low abundance makes deep and costly metagenomic sequencing necessary to achieve high-quality genome assemblies. In this work we present a protocol for the enrichment of “ Ca . Saccharimonadia” from fresh human saliva: “ Ca . Saccharimonadia ” Enrichment” protocol, or SE protocol. This protocol drew inspiration from existing procedures for enrichment of CPR from fresh saliva samples, which rely on vortexing, filtering and concentrating CPR cells with a final ultra-centrifugation. The difference is that, while in these previous works the enrichment was generally preparatory to co-culturing “ Ca . Saccharimonadia” with their hosts, in our protocol, it is the first step of a procedure that is completely culture-independent and ends in the genomic sequencing of “ Ca . Saccharimonadia” directly from saliva samples. Another noteworthy point is that we simplified existing protocols by performing the last centrifugation step of Phase II using a standard benchtop microcentrifuge instead of an ultra-centrifuge. This point makes the protocol feasible by any laboratory equipped with basic instruments. Another original implementation of our protocol is the step of free DNA degradation through PMA-mediated photolysis. This procedure, originally conceived for achieving the depletion of host DNA to increase the rate of bacterial reads in shotgun metagenomics of saliva samples [ 16 ], has been tested by us as a way to further increase the “ Ca . Saccharimonadia” representation in the fresh saliva sample. The protocol consists of three main phases (two mandatory and one optional) and we propose two protocol variants, called SE-short (which includes the first two phases only) and SE-long (including the three phases). We validated the protocols on two children’s saliva samples, measuring the “ Ca . Saccharimonadia” enrichment by V3-V4 16S rRNA amplicon sequencing. Then, we assembled two high quality “ Ca . Saccharimonadia” MAGs using DNA extracted after the SE protocols. Lastly, we evaluated the minimum number of reads required to obtain good quality “ Ca . Saccharimonadia” MAGs after the enrichment. Our findings showed that both SE protocols (SE-short and SE-long) effectively enriched “Ca . Saccharimonadia ” from human saliva samples ( Table 1 and Table 2), rising up the percentages from ∼5% to ∼50-80%. However, we found that the two individuals carried two different genera of “ Ca . Saccharimonadia” (i.e. Nanosynbacter and Nanosyncoccus ), that gave a different enrichment response after SE-short and SE-long protocols. For the Individual 1 a successfully “ Ca . Saccharimonadia ” enrichment was observed after both the SE-short and SE-long protocols, and sequencing revealed the presence of a bacterium belonging to the genus Nanosynbacter . In contrast, for the Individual 2, which harboured a “ Ca . Saccharimonadia” bacterium belonging to the genus Nanosyncoccus , the SE-long protocol resulted in significantly lower enrichment compared to SE-short. Both protocols share the first two phases, during which the “ Ca . Saccharimonadia” are detached from the host bacterial cells (Phase I) and cells with less resistant walls (i.e. eukaryotic and gram negative cells) are expected to be lysed, and removed by filtration (Phase II). At the end of these two phases, DNA from cells with less resistant walls can however remain and be sequenced. The Phase III of the SE-long protocol removes this free-DNA. At the end of the two phases (for the SE-short), or three phases (for SE-long), the sample is subjected to whole DNA extraction and amplification by MDA. The observed decrease (from 52% to 8.5%) of the “ Ca . Saccharimonadia” (genus Nanosyncoccus ) in sample-ind2 after free-DNA removal (Phase III of the SE-long protocol) suggests that a significant portion of the “ Ca . Saccharimonadia ” free-DNA (likely released during cell lysis in Phase II) was eliminated in Phase III. This indicates that the “ Ca . Saccharimonadia ” species present in Individual 2’s saliva have a non highly resistant cell wall. Conversely, in sample-ind1, the final step of the SE-long protocol had no significant I mpact on “ Ca . Saccharimonadia ” (genus Nanosynbacter ) representation (rising slightly from ∼79% to 88%), suggesting the absence of free DNA from Nanosynbacter after Phase II, possibly due to a resistant cell wall. The metabolic characterization of the “ Ca . Saccharimonadia ” MAGs obtained from the two samples is coherent with this hypothesis: indeed, MAGs obtained from the individual 2 (which belong to the Nanosyncoccus genus) lack several genes involved in the wall biosynthesis. The MAG obtained after the SE protocols were both of high quality, exhibiting a high level of completeness (>95%) and low contamination (<3%). Additionally, the assembly statistics were comparable or better than those of the “Ca. Saccharimonadia ” genome assemblies of the genera Nanosyncoccus or Nanosynbacter available in public databases. The MAGs obtained using a subset of 10 million 150×2 paired-end Illumina reads maintained a high level of quality, suggesting that increasing the number of reads would not have a significant impact on the results. This finding is particularly interesting, as this read depth is comparable to that used for Whole-Genome Sequencing (WGS) of bacterial isolates, one order of magnitude lower than what is typically required for metagenomics. Conclusions The protocol presented in this study enables the successful generation of high-quality “ Ca . Saccharimonadia ” genome assemblies without the high economic and computational demands of shotgun metagenomics. Moreover, it requires only standard laboratory equipment commonly available in microbiology and molecular biology labs, making it easily implementable. Lastly, the significantly lower sequencing depth needed after applying this protocol further reduces both the computational resources and expertise required for data analysis. In conclusion, this study presents an easy-to-use, cost-effective protocol for the enrichment of “ Ca . Saccharimonadia ” , designed to facilitate the genomic characterization of this elusive bacterial group. List of abbreviations SE protocol “Ca. Saccharimonadia” enrichment protocol PMA Propidium Monoazide MDA Multiple Displacement Amplification MAG Metagenome-Assembled Genome GTDB Genome Taxonomy Database COG Clusters of Orthologous Group Declarations Ethics approval and consent to participate Participants to the study were recruited at the Pediatric Clinic of the Vittore Buzzi Children’s Hospital (Milan, Italy). The study was conducted according to the Declaration of Helsinki, and all the methods followed the relevant guidelines and regulations. The Ethical Committee of ASST-Fatebenefratelli-Sacco approved the study (Ref. 2021/ST/041). The privacy rights of subjects have been observed. The parents of the recruited children signed an informed consent. Funding The project was funded by Grandi Sfide di Ateneo (GSA) of the University of Milan. Authors’ contributions Made substantial contributions to conception and design of the study: Simona Panelli and Francesco Comandatore; Performed the experiments: Clara Bonaiti, Simona Panelli, Giorgia Bettoni, Stella Papaleo; Performed data analysis: Lodovico Sterzi, Diego Marco Minore; Drafted the manuscript: Francesco Comandatore, Simona Panelli, Lodovico Sterzi, Enza D’Auria, Gianvincenzo Zuccotti Acknowledgements We acknowledge the support of the APC Central Fund of the University of Milano”. We would like to thank Prof. Raffaele De Francesco for his valuable advice during the experimental design. References 1. ↵ Parks DH , Rinke C , Chuvochina M , Chaumeil P-A , Woodcroft BJ , Evans PN , et al. Recovery of nearly 8,000 metagenome-assembled genomes substantially expands the tree of life . Nature Microbiology . 2017 ; 2 : 1533 – 42 . OpenUrl CrossRef PubMed 2. ↵ McLean JS , Bor B , Kerns KA , Liu Q , To TT , Solden L , et al. Acquisition and Adaptation of Ultra-small Parasitic Reduced Genome Bacteria to Mammalian Hosts . Cell Rep . 2020 ; 32 : 107939 . OpenUrl CrossRef PubMed 3. ↵ He X , McLean JS , Edlund A , Yooseph S , Hall AP , Liu S-Y , et al. Cultivation of a human-associated TM7 phylotype reveals a reduced genome and epibiotic parasitic lifestyle . Proceedings of the National Academy of Sciences . 2015 ; 112 : 244 – 9 . OpenUrl Abstract / FREE Full Text 4. Nie J , Utter DR , Kerns KA , Lamont EI , Hendrickson EL , Liu J , et al. Strain-Level Variation and Diverse Host Bacterial Responses in Episymbiotic Saccharibacteria . mSystems . 2022 ; 7 : e0148821 . OpenUrl CrossRef PubMed 5. ↵ Naud S , Valles C , Abdillah A , Abou Chacra L , Mekhalif FZ , Ibrahim A , et al. Preliminary landscape of Saccharibacteria in the human microbiome . Front Cell Infect Microbiol . 2023 ; 13 : 1195679 . OpenUrl PubMed 6. ↵ Bor B , Bedree JK , Shi W , McLean JS , He X. Saccharibacteria (TM7) in the Human Oral Microbiome . J Dent Res . 2019 ; 98 : 500 – 9 . OpenUrl CrossRef PubMed 7. Kuehbacher T , Rehman A , Lepage P , Hellmig S , Fölsch UR , Schreiber S , et al. Intestinal TM7 bacterial phylogenies in active inflammatory bowel disease . Journal of Medical Microbiology . 2008 ; 57 : 1569 – 76 . OpenUrl CrossRef PubMed Web of Science 8. ↵ Brinig MM , Lepp PW , Ouverney CC , Armitage GC , Relman DA . Prevalence of Bacteria of Division TM7 in Human Subgingival Plaque and Their Association with Disease . Applied and Environmental Microbiology . 2003 . doi: 10.1128/AEM.69.3.1687-1694.2003 . OpenUrl Abstract / FREE Full Text 9. ↵ Chipashvili O , Utter DR , Bedree JK , Ma Y , Schulte F , Mascarin G , et al. Episymbiotic Saccharibacteria suppresses gingival inflammation and bone loss in mice through host bacterial modulation . Cell Host Microbe . 2021 ; 29 : 1649 – 62.e7 . OpenUrl CrossRef PubMed 10. ↵ D’Auria E , Cattaneo C , Panelli S , Pozzi C , Acunzo M , Papaleo S , et al. Alteration of taste perception, food neophobia and oral microbiota composition in children with food allergy . Scientific Reports . 2023 ; 13 : 1 – 13 . OpenUrl CrossRef PubMed 11. ↵ Naud S , Ibrahim A , Valles C , Maatouk M , Bittar F , Alou MT , et al. Candidate Phyla Radiation, an Underappreciated Division of the Human Microbiome, and Its Impact on Health and Disease . Clinical Microbiology Reviews . 2022 . doi: 10.1128/cmr.00140-21 . OpenUrl CrossRef PubMed 12. ↵ Murugkar PP , Collins AJ , Chen T , Dewhirst FE . Isolation and cultivation of candidate phyla radiation Saccharibacteria (TM7) bacteria in coculture with bacterial hosts . Journal of Oral Microbiology . 2020 . doi: 10.1080/20002297.2020.1814666 . OpenUrl CrossRef PubMed 13. ↵ Ibrahim A , Maatouk M , Rajaonison A , Zgheib R , Haddad G , Khalil JB , et al. Adapted Protocol for Saccharibacteria Cocultivation: Two New Members Join the Club of Candidate Phyla Radiation . Microbiology Spectrum . 2021 . doi: 10.1128/spectrum.01069-21 . OpenUrl CrossRef 14. ↵ Eloe-Fadrosh EA , Ivanova NN , Woyke T , Kyrpides NC . Metagenomics uncovers gaps in amplicon-based detection of microbial diversity . Nature Microbiology . 2016 ; 1 : 1 – 4 . OpenUrl CrossRef 15. ↵ Ji Y , Zhang P , Zhou S , Gao P , Wang B , Jiang J. Widespread but Poorly Understood Bacteria: Candidate Phyla Radiation . Microorganisms . 2022 ; 10 . 16. ↵ Marotz CA , Sanders JG , Zuniga C , Zaramela LS , Knight R , Zengler K. Improving saliva shotgun metagenomics by chemical host DNA depletion . Microbiome . 2018 ; 6 : 1 – 9 . OpenUrl CrossRef PubMed 17. ↵ Mameli C , Cattaneo C , Panelli S , Comandatore F , Sangiorgio A , Bedogni G , et al. Taste perception and oral microbiota are associated with obesity in children and adolescents . PLoS One . 2019 ; 14 : e0221656 . OpenUrl PubMed 18. ↵ Schloss PD , Westcott SL , Ryabin T , Hall JR , Hartmann M , Hollister EB , et al. Introducing mothur: Open-Source, Platform-Independent, Community-Supported Software for Describing and Comparing Microbial Communities . Applied and Environmental Microbiology . 2009 . doi: 10.1128/AEM.01541-09 . OpenUrl Abstract / FREE Full Text 19. ↵ Bolger AM , Lohse M , Usadel B. Trimmomatic: a flexible trimmer for Illumina sequence data . Bioinformatics . 2014 ; 30 : 2114 – 20 . OpenUrl CrossRef PubMed Web of Science 20. ↵ Kozich JJ , Westcott SL , Baxter NT , Highlander SK , Schloss PD . Development of a dual-index sequencing strategy and curation pipeline for analyzing amplicon sequence data on the MiSeq Illumina sequencing platform . Appl Environ Microbiol . 2013 ; 79 : 5112 – 20 . OpenUrl Abstract / FREE Full Text 21. ↵ Uritskiy GV , DiRuggiero J , Taylor J. MetaWRAP-a flexible pipeline for genome-resolved metagenomic data analysis . Microbiome . 2018 ; 6 : 158 . OpenUrl CrossRef PubMed 22. ↵ Parks DH , Imelfort M , Skennerton CT , Hugenholtz P , Tyson GW . CheckM: assessing the quality of microbial genomes recovered from isolates, single cells, and metagenomes . Genome Res . 2015 ; 25 : 1043 – 55 . OpenUrl Abstract / FREE Full Text 23. ↵ Sterzi L , Panelli S , Bonaiti C , Papaleo S , Bettoni G , D’Auria E , et al. RecA is a reliable marker for bacterial taxonomy, even in the Candidate Phyla Radiation . bioRxiv . 2024 ;:2024.06.21.600076. 24. ↵ Parks D , Hugenholtz P. Genome Taxonomy Database r214.1 . 2021 . 25. ↵ Emms DM , Kelly S. OrthoFinder: phylogenetic orthology inference for comparative genomics . Genome Biol . 2019 ; 20 : 238 . OpenUrl CrossRef PubMed 26. ↵ Tatusov RL , Koonin EV , Lipman DJ . A genomic perspective on protein families . Science . 1997 ; 278 : 631 – 7 . OpenUrl Abstract / FREE Full Text 27. ↵ Han Y , Wang B , Gao H , He C , Hua R , Liang C , et al. Insight into the Relationship between Oral Microbiota and the Inflammatory Bowel Disease . Microorganisms . 2022 ; 10 . View the discussion thread. Back to top Previous Next Posted July 17, 2025. Download PDF Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following A Simple and Cost-Effective Protocol for Enriching ’Ca. Saccharimonadia’ from Human Saliva to Enable Efficient Genome Sequencing Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share A Simple and Cost-Effective Protocol for Enriching ’ Ca . Saccharimonadia’ from Human Saliva to Enable Efficient Genome Sequencing Clara Bonaiti , Simona Panelli , Giorgia Bettoni , Lodovico Sterzi , Diego Marco Minore , Stella Papaleo , Enza D’Auria , Gianvincenzo Zuccotti , Francesco Comandatore bioRxiv 2025.07.17.665291; doi: https://doi.org/10.1101/2025.07.17.665291 Share This Article: Copy Citation Tools A Simple and Cost-Effective Protocol for Enriching ’ Ca . Saccharimonadia’ from Human Saliva to Enable Efficient Genome Sequencing Clara Bonaiti , Simona Panelli , Giorgia Bettoni , Lodovico Sterzi , Diego Marco Minore , Stella Papaleo , Enza D’Auria , Gianvincenzo Zuccotti , Francesco Comandatore bioRxiv 2025.07.17.665291; doi: https://doi.org/10.1101/2025.07.17.665291 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Microbiology Subject Areas All Articles Animal Behavior and Cognition (7640) Biochemistry (17707) Bioengineering (13903) Bioinformatics (41980) Biophysics (21465) Cancer Biology (18613) Cell Biology (25528) Clinical Trials (138) Developmental Biology (13387) Ecology (19920) Epidemiology (2067) Evolutionary Biology (24332) Genetics (15615) Genomics (22519) Immunology (17747) Microbiology (40424) Molecular Biology (17194) Neuroscience (88664) Paleontology (667) Pathology (2839) Pharmacology and Toxicology (4827) Physiology (7650) Plant Biology (15160) Scientific Communication and Education (2046) Synthetic Biology (4302) Systems Biology (9826) Zoology (2271)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00