Full text
57,345 characters
· extracted from
preprint-html
· click to expand
A cross-environment comparison of nontuberculous mycobacterial diversity | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results A cross-environment comparison of nontuberculous mycobacterial diversity View ORCID Profile Matthew J. Gebert , Ettie M. Lipner , Jordan M. Galletta , Jessica B. Henley , Michael Hoffert , Melissa L. Riskin , D. Rebecca Prevots , View ORCID Profile Noah Fierer doi: https://doi.org/10.1101/2025.08.04.668438 Matthew J. Gebert 1 Department of Ecology and Evolutionary Biology, University of Colorado , Boulder, CO, USA 2 Cooperative Institute for Research in Environmental Sciences, University of Colorado , Boulder, CO, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Matthew J. Gebert For correspondence: matthew.gebert{at}colorado.edu Noah.fierer{at}colorado.edu Ettie M. Lipner 3 Epidemiology and Population Studies Section, Division of Intramural Research, National Institute of Allergy and Infectious Diseases, National Institutes of Health , Rockville, MD, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jordan M. Galletta 2 Cooperative Institute for Research in Environmental Sciences, University of Colorado , Boulder, CO, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jessica B. Henley 2 Cooperative Institute for Research in Environmental Sciences, University of Colorado , Boulder, CO, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Michael Hoffert 1 Department of Ecology and Evolutionary Biology, University of Colorado , Boulder, CO, USA 2 Cooperative Institute for Research in Environmental Sciences, University of Colorado , Boulder, CO, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Melissa L. Riskin 4 U.S. Geological Survey, Hydrologic Networks Branch , Lawrenceville, NJ, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site D. Rebecca Prevots 3 Epidemiology and Population Studies Section, Division of Intramural Research, National Institute of Allergy and Infectious Diseases, National Institutes of Health , Rockville, MD, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Noah Fierer 1 Department of Ecology and Evolutionary Biology, University of Colorado , Boulder, CO, USA 2 Cooperative Institute for Research in Environmental Sciences, University of Colorado , Boulder, CO, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Noah Fierer For correspondence: matthew.gebert{at}colorado.edu Noah.fierer{at}colorado.edu Abstract Full Text Info/History Metrics Preview PDF Abstract Nontuberculous mycobacteria (NTM) are a group of environmental bacteria that encompass nearly 200 described species, some of which can cause chronic pulmonary infection in humans. What makes these infections unique is that they are environmentally acquired, yet there remains a limited understanding of how different environments contribute to potential pathogen exposure. Here, we use new and existing marker gene datasets to compare the amounts and types of NTM across three environments known to harbor mycobacteria, surface waters, soil, and household plumbing biofilms, to better understand potential pathogen occurrence in each environment. We used 16S rRNA gene sequencing, in tandem with mycobacterial-specific marker gene sequencing to characterize variation in the relative abundances of the genus Mycobacterium and specific mycobacterial taxa across the three environments, with a focus on a clinically significant NTM. We found that household plumbing biofilms contained both the highest relative abundance of the genus Mycobacterium (on average, 13.7% of bacteria were members of the genus), as well as the highest occurrence of clinically relevant species detected ( Mycobacterium avium , Mycobacterium abscessus ), compared to surface waters and soil. Although mycobacteria are ubiquitous across many different environments, mycobacterial diversity is highly variable between environments with clinically relevant species largely restricted to household plumbing biofilms, information that is critical for understanding the ecology and epidemiology of NTM disease. Importance Nontuberculous mycobacteria, or NTM, are a diverse group of bacteria within the genus Mycobacterium that are common in many environments. While most members of the genus pose little threat to human health, a handful of species, namely the Mycobacterium avium complex, M. abscessus , and M. mucogenicum , can cause severe and prolonged lung infections. These environmentally acquired infections are on the rise in the United States and around the world, yet we still don’t have a good understanding of which environment types pose the greatest risk of infection to susceptible populations. Our study used cultivation independent approaches to identify the specific NTM taxa found in over 1,000 samples from three potentially important environmental reservoirs - surface waters, soils, and household plumbing systems, to determine which of these environments are most likely to harbor NTM of clinical significance. Our results highlight the high degree of variability in the types of NTM taxa detected in different environments (including extensive novel diversity within the genus) and show that household plumbing biofilms are likely the most important reservoir and subsequent route of transmission for clinically significant NTM. Introduction Nontuberculous mycobacteria (NTM) are a group of bacteria commonly found in a wide range of environments. They are defined by their unique cell wall structure, consisting of long-chain fatty acids known as mycolic acids, that allow for their prolonged survival during periods of desiccation and nutrient limitation, as well as resistance to common disinfectants and antibiotics ( Brennan and Nikaido 1995 ). Although most members of the genus are of limited clinical significance, some species (e.g. Mycobacterium avium complex, Mycobacterium abscessus , Mycobacterium kansasii ) can cause pulmonary infection in humans, especially in individuals with underlying structural lung damage ( Lake et al. 2016 ). NTM disease is of growing concern worldwide, with case numbers increasing annually across the United States and around the world ( Winthrop et al. 2020 ; Dahl et al. 2022 ; Bents et al. 2024 ). NTM disease is widely considered to be environmentally acquired, with many environments implicated in the exposure and transmission of pathogenic NTM ( Falkinham 2016 ; Gebert et al. 2018 ; Gross et al. 2021 ). While NTM have been detected in a wide range of environments, including soil, household plumbing, hot tubs and pools, and natural water bodies ( Centers for Disease Control and Prevention, Atlanta, GA, United States 2024 ), few studies have comprehensively characterized NTM communities across a range of environments or quantified the occurrence of clinically relevant NTM taxa within different types of environments. This knowledge gap persists, in part, because of the widespread reliance on cultivation-dependent approaches for assessing NTM diversity in environmental samples, and the biases and limitations associated with such approaches ( Modra et al. 2023 ; Ulmann, Kracalikova, and Dziedzinska 2015 ; von Reyn et al. 1993 ; Bland et al. 2005 ; Mercaldo et al. 2023 ). Many environmental NTM remain undescribed or poorly characterized ( Walsh et al. 2019 ), and differentiating clinically relevant NTM from those that are not clinically relevant requires time-consuming genotyping of isolates ( Baldwin et al. 2019 ; Sarro et al. 2018 ). Likewise, previous work characterizing the presence of clinically relevant NTM in different environments has often focused on relatively small numbers of representative samples ( Jacobs et al. 2009 ; Kopecky et al. 2011 ; Roguet et al. 2016 ), making it challenging to reach broader conclusions about the potential importance of different environments as sources of NTM infections. In short, much of our knowledge on which environments most likely harbor clinically relevant NTM is derived from limited or anecdotal evidence. Previous studies have used cultivation-independent approaches to survey NTM diversity in two environments often implicated as reservoirs of clinically relevant NTM: premise plumbing and surface soils. More specifically, Gebert et al. analyzed showerhead biofilms collected from 638 homes across the US ( Gebert et al. 2018 ) and Walsh et al. analyzed 143 soils from across the globe ( Walsh et al. 2019 ), using a combination of 16S rRNA and hsp65 gene sequencing of DNA extracted directly from the environmental samples to characterize NTM diversity and composition. Both survey efforts found that the NTM communities found in these environments are diverse and highly variable in composition with clinically relevant NTM frequently detected in building premise plumbing. Surface waters, including lakes, streams, and reservoirs, are also implicated as sources of NTM exposures, and are known to harbor a broad diversity of NTM, including clinically relevant taxa. ( Delghandi et al. 2020 ; Roguet et al. 2016 ; George et al. 1980 ; Makovcova et al. 2014 ). However, it remains unclear how NTM communities vary across surface waters and, whether surface waters represent an important source of exposures to clinically relevant NTM. More generally, it remains unclear how NTM diversity differs across these environments and which environments represent the most important potential sources of NTM exposures. For this study, we used high throughput marker gene sequencing, targeting both the 16S rRNA gene and the mycobacterial-specific 65-kD heat shock protein ( hsp65 ) gene to characterize the ubiquity and types of NTM detected across 373 surface water samples collected from 102 sites across the US. We then integrated the surface water datasets with previously published datasets from 143 soils ( Walsh et al. 2019 ) and 638 household plumbing biofilm samples ( Gebert et al. 2018 ) to directly compare the diversity and ubiquity of NTM found across these three major environment types. The comprehensive survey of NTM diversity in surface waters conducted here, when coupled with the soil and premise plumbing datasets, made it possible to quantitatively compare NTM communities across environments and identify which environments are most likely to harbor clinically relevant NTM. Methods Surface water samples A total of 373 surface water samples were collected from surface water sites across the United States that are monitored by the US Geological Survey (USGS) as part of the National Water Quality Network (NWQN) ( Riskin and Lee 2021 ). These samples were collected from 102 unique surface water collection sites across 28 states (for site map, see Figure 1 ). At 73 of the sites, multiple samples were collected over time starting in July 2022 and concluding in November 2022. The collection sites spanned 8 different surface water types, with the majority coming from streams, but also including large inland and coastal rivers, lakes and reservoirs, and urban and agricultural sites (Supplementary Table 1). For the 16S rRNA gene sequencing analysis, all samples (N = 373) were included in downstream analysis. Download figure Open in new tab Figure 1: Map showing the distribution of surface water sample collection sites, colored in purple, across the United States (N = 102), as part of the National Water Quality Network (USGS). For information on collection locations for the soil and household plumbing biofilm samples, see Walsh et al. (2019) and Gebert et al. (2018) . Methods of sample collection used by the NWQN conform to the USGS National Field Manual for the Collection of Water-Quality Data ( US Geological Survey 2006 ). To the greatest extent possible, isokinetic, depth-integrated sampling techniques that provide samples representative of stream conditions are used. The collection of isokinetic, depth-integrated samples is done using either an equal-width-increment (EWI) or equal-discharge-increment (EDI) sampling method that yields a composite sample that represents the streamflow-weighted concentrations of the stream cross section being sampled. For each sample collection, a total of 0.2L - 10L of water was filtered immediately through 0.45 µm GWV high-capacity groundwater sampling capsule filters (Cytiva Life Sciences) by USGS personnel. Collection filters were then stored at -20°C at individual sites until the final date of collection (November 2022). All capsule filters were shipped overnight on ice to the University of Colorado Boulder, where they were stored at -20°C until DNA extraction. Metadata associated with all samples were downloaded from the Water Quality Portal ( https://www.waterqualitydata.us/ ) and included information on water temperature (°C), water pH, dissolved oxygen (% saturation), total carbon (mg/L), total nitrogen (mg/L), sodium adsorption ratio (SAR), and turbidity at the time of sampling (Supplementary Table 3). Household plumbing biofilm samples We re-analyzed a previously published dataset from a large-scale survey of showerhead biofilms, treating the showerhead biofilms as a proxy for household plumbing biofilms ( Gebert et al. 2018 ). For this analysis, we focused only on those biofilm swab samples collected from households in the United States (N = 638, 49 of 50 states in the US represented). For specific site information and sampling details, see Gebert et al. (2018) . Global soil samples We also re-analyzed a previously published soil dataset from Walsh et al. (2019) , which focused on a subset of 143 soils from collection sites across 6 continents, originally collected for the study described in Delgado-Baquerizo et al. (2018) . Composite samples were collected from each site to 7.5 cm depth with all samples stored at -20°C immediately after collection. For additional soil and site information, see Delgado-Baquerizo et al. (2018) and Walsh et al. (2019) . DNA extraction DNA was extracted from the showerhead biofilm and soil samples using the DNEasy PowerSoil kit (Qiagen, Germantown, MD, USA), see Gebert et al. (2018) and Walsh et al. (2019) for further details. To extract DNA from the surface water samples, filters were first thawed at room temperature for ∼1 hour prior to downstream processing. Autoclaved 7/16” brass caps were attached to the bottom of each filter capsule prior to thawing. Immediately before shaking, 5mL of 5% Triton was added to each filter capsule, and the filter was capped on the top end, sealing the capsule. Capsule filters were shaken at 20 Hz for 7.5 min, then inverted and shaken for another 7.5 min. We then used an air-filled 50mL syringe to force liquid out of each capsule in the direction of flow, collecting 2-5 mL of eluent per capsule into a DNA-free 15 mL conical tube, with the eluents frozen at -20°C immediately after collection. After thawing the eluents at room temperature, we extracted DNA using the DNeasy PowerWater kit (Qiagen, Germantown, MD, USA), following the manufacturer’s recommended protocol. In each round of extraction, we included an extraction blank to check for contamination. 16S rRNA Gene Sequencing We amplified and sequenced a portion of the 16S rRNA gene using bacterial and archaeal primers to determine the relative abundance of the genus Mycobacterium in each sample. For a detailed description of library preparation and sequencing for the soil and household plumbing biofilm samples, see Walsh et al. (2019) , and Gebert et al. (2018) . To characterize the bacterial community of the extracted surface water, we used the same barcoded 515fBC/806rB primers (Caporaso et al., 2012) as aforementioned, which target the V4 region of the 16S rRNA gene. Duplicate PCR reactions were performed as follows: 12.5μl of Colorless Platinum II Hot Start Master Mix (ThermoFisher, Waltham, MA, USA), 10μl of Sigma water (Sigma-Aldrich, Burlington, MA, USA), 1μl of primers and 1μl of gDNA. Thermocycler conditions were 94°C for 2 minutes, 35 cycles at 94°C for 15 seconds, 60°C for 15 seconds, 68°C for 1 minute, then 72°C for 10 minutes. Amplicon normalization and clean-up was done using the Invitrogen SequalPrep Normalization Plate kit (ThermoFisher, Waltham, MA, USA) with 5μl of amplicons from each sample pooled. The composited library was then quantified using the Invitrogen Qubit dsDNA HS Assay kit (ThermoFisher, Waltham, MA, USA) and ABsolute qPCR Mix, SYBR Green, no ROX (ThermoFisher, Waltham, MA, USA). The library was run on the Illumina MiSeq using a v2-300 cycle kit (Illumina, San Diego, CA, USA) at the Center for Microbial Exploration at the University of Colorado Boulder. Hsp65 gene sequencing As 16S rRNA gene sequence data are not generally useful for identifying particular mycobacterial taxa ( Kim and Shin 2018 ), we also sequenced the 65-kD heat shock protein ( hsp65 ) gene using mycobacterial-specific primers Tb11-Tb12 primers ( Telenti et al. 1993 ). For a detailed description of library preparation and sequencing for soil and household plumbing biofilm samples, see Walsh et al. (2019) , and Gebert et al. (2018) . For the surface water DNA extracts, the same protocol described in Gebert et al. (2018) was followed except we used Platinum II Hot Start Master Mix (ThermoFisher, Waltham, MA, USA) for PCRs and amplicons were cleaned by adding 8.85 μL DNA-free water and 0.251 μL of ExoSAP (New England Biolabs, Ipswich, MA) to a 20 μL aliquot of each amplicon followed by incubation at 37°C for 30 minutes followed by 95°C for 5 minutes. A second PCR was done to attach 12-bp universal reverse barcodes for sample multiplexing. Each reaction consisted of 12.5 μl of Platinum Hot Start Master Mix (ThermoFisher, Waltham, MA, USA), 8.5 μL of Sigma water (Sigma-Aldrich, Burlington, MA, USA), 2 μl of combined Illumina universal barcoded primers stock at 10μM each (Illumina, San Diego, CA, USA), and 2 μL of cleaned amplicon from the first reaction, with thermocycler conditions as follows: 95°C for 3 minutes, then 8 cycles of 95°C for 30 seconds, 55°C for 30 seconds, 72°C for 30 seconds, then 72°C for 2 minutes and held at 4°C. We followed the same protocol as above for normalization and quantification of the library. Sequencing was done using a v3-600 cycle kit (Illumina, San Diego, CA, USA) on the Illumina MiSeq at the Center for Microbial Exploration at the University of Colorado Boulder. 16S rRNA Gene Sequence Analyses Raw reads from the surface water samples were demultiplexed using idemp ( https://github.com/yhwu/idemp ) and primers were trimmed from reads using cutadapt (version 1.8.1)( Martin 2011 ). Data was processed using the DADA2 pipeline (version 1.22.0)( Callahan et al. 2016 ). Reads were filtered based on the quality metrics (trunclen = (150, 140), maxEE = (2,2), truncQ=2, maxN=0). After the removal of chimeras, taxonomy was assigned against the SILVA nr v.138.1 database ( Quast et al. 2013 ). This resulted in 376 samples being used for downstream analysis. The 16S rRNA marker gene datasets from the two previously published studies (household plumbing biofilms and soil) were generated using an identical procedure ( Gebert et al, 2018 , Walsh et al, 2019 ). After processing and quality filtering, a total of 638 household plumbing biofilm samples and 143 soil samples were included in this study. Combined with the 373 surface water samples that met our threshold for inclusion (minimum 2,000 archaeal and bacterial 16S rRNA gene reads per sample), the combined 16S rRNA gene dataset used for downstream analyses included a total of 1,154 samples. Hsp65 Sequence Analyses The hsp65 marker gene sequence data from each of the three datasets were combined and processed together using a single pipeline to maintain consistency and permit direct comparison of results across the three unique environments. First, each hsp65 dataset was demultiplexed independently using idemp ( https://github.com/yhwu/idemp ). Primers were trimmed from reads using cutadapt (version 1.8.1) ( Martin 2011 ). Data was then processed using the DADA2 pipeline (version 1.22.0) ( Callahan et al. 2016 ). Each dataset was filtered independently based on the quality metrics for each respective MiSeq run. Error rates were then determined, and sequence variants were inferred (pool = TRUE), resulting in three amplicon sequence variant (ASV) tables, one for each environment. Sequence tables from each of the three independently processed datasets (household plumbing biofilms, global soils, surface waters) were then merged into a single table spanning the three distinct environments. Since the primer pair used to PCR amplify a portion of the hsp65 gene (Tb11-Tb12) is not specific to members of the genus Mycobacterium , it was necessary to remove all non-mycobacterial reads. The combined ASV representative sequence file (repset) generated above was then filtered using the updated NTM database as the reference database using blastn (Altshul et al, 1990)(command: makeblastdb -in )(see below for details) at a minimum match percent identity of 90% or greater. The combined ASV repset file was then filtered using seqtk ( https://github.com/lh3/seqtk ) to retain only ASVs that met the 90% or greater match threshold to the reference database. Samples with fewer than 100 mycobacterial hsp65 reads were removed from the dataset, resulting in a total of 822 samples total across the three environments (household plumbing biofilm N= 507, soil N= 140, surface waters N= 175). This table was used in all downstream NTM analyses. Across these 822 samples, we detected a total of 7,854 mycobacterial ASVs. Updated hsp65 marker gene database and phylogenetic tree The NTM phylogenetic tree was built using an updated version of the Dai et al. 65-kD heat shock protein marker gene database ( Dai et al. 2011 ). Briefly, the database was aligned and trimmed using MAFFT (version v7.505 (2022/Apr/10)( Katoh et al. 2002 ) and trimal (v1.4.rev15 build[2013-12-17])( Capella-Gutiérrez, Silla-Martínez, and Gabaldón 2009 ), respectively. The aligned database was then used to train a Hidden Markov Model using HMMR (HMMER 3.3.2 (Nov 2020))(( Wheeler and Eddy 2013 )). The HMM was then used to search (hmmsearch) a curated file of mycobacterial whole genome sequences extracted from the Genome Taxonomy Database (GTDB)( Parks et al. 2022 ). To remove any sequence noise and mismatches from the output file, a phylogenetic tree was built using RAxML (version 8.2.12), and divergent sequences were removed from the database. The final database resulted in 189 mycobacterial heat shock protein sequences, adding an additional 32 NTM species or strains to the 2011 Dai et al database. The updated reference database can be found at https://github.com/gebertm/hsp65_Tb11-Tb12_db . ASV Clustering All 7,854 mycobacterial ASVs were clustered to combine ASVs that were closely related based on phylogenetic analyses. This was done as we observed a high diversity of individual ASVs and because most ASVs were only found in a relatively small number of samples across all three datasets (mean of 6.4 samples per ASV). To conduct the phylogenetic clustering, we built a phylogenetic tree, including both the representative sequence file and updated hsp65 marker gene database, to assign taxonomy based on proximity to a known reference database sequence, using Nocardia farcinica (DSM43665) as the outgroup. Briefly, sequences were aligned using MAFFT ( Katoh et al. 2002 ) (v7.505 (2022/Apr/10)), and aligned sequences were then trimmed using trimAl (v1.4.rev15 build[2013-12-17]). The maximum likelihood tree was built using RAxML (version 8.2.12, 2018) with the following command raxmlhpc -f a -m GTRGAMMA -p 12345 -x 12345 -# 100 -T 30 --print-identical-sequences. To cluster ASVs, we used the TreeCluster package ( Balaban et al. 2019 ) (version 1.0.4) with the distance threshold t = 0.20, meaning 0.20 is the maximum pairwise distance between leaves in a given cluster. The optimal threshold was set based on the clustering of the Mycobacterium tuberculosis complex reference sequences into one unique cluster, without including additional NTM taxa. TreeCluster resulted in 404 unique clusters, encompassing the 7,854 ASVs. For a cluster to be present in a sample, it was required to have a total of >10 reads across the combined dataset. 62 ASVs did not fall within a defined cluster (62/7854, or 0.79%), designated as -1 in the final cluster table (Supplementary Table 2), and were excluded from the downstream analysis. Taxonomic names were assigned at the cluster level, when possible (i.e., clusters that included named reference strains were assigned the name of that reference strain). Only 74/404 clusters (18%) contained one or more reference sequences, meaning most clusters (82%) could not be confidently assigned to the species level based on their phylogenetic similarity to a named species. The top 50 clusters found in each environment, which encompassed >99%, 66%, and 95% of the total reads in household plumbing biofilms, soil, and surface waters, respectively were selected for downstream analyses. Since the NTM diversity in the soil samples was considerably higher compared with the other two environments, a smaller percentage of the total NTM reads from the soil samples were captured in the top 50 clusters. Statistical Analysis To visualize the variation in community structure of all NTM species, we ran a principal components analysis (PCoA) on the cleaned cluster table using the Phyloseq package in R ( McMurdie and Holmes 2013 ). Briefly, we converted the cluster table from read counts to a presence/absence matrix, requiring a minimum of 10 reads per cluster for it to be considered ‘present’ in the data. The dissimilarity matrix was calculated using pairwise Jaccard distances. To test whether any of the measured environmental variables collected at each USGS site predicted the NTM community composition in the surface water samples, we ran a Mantel test on samples using the R vegan package (version 2.6-8) ( Oksanen et al. 2013 ). Briefly, for the measured environmental variables, an additional dissimilarity matrix was calculated using vegdist in the R vegan package (version 2.6-8) ( Oksanen et al. 2013 ) using pairwise Euclidean distance. A Mantel test was then run between the taxa dissimilarity matrix and the metadata dissimilarity matrix to determine if any of the measured environmental variables predicted variation in NTM community composition across samples. Results Relative abundance of genus Mycobacterium across the three environments We used the 16S rRNA gene sequence data to determine the relative abundance of the genus Mycobacterium across the 1,154 samples from the three environments ( Figure 2 ). Members of the genus Mycobacterium were nearly ubiquitous across the three environments, detected in 100% of the 146 soils, 76% of the 373 surface water samples, and 94% of the 638 household plumbing biofilms. However, the relative abundances of mycobacteria varied depending on the environment. In household plumbing biofilms, mycobacterial abundances ranged from no mycobacteria detected (40 samples) to mycobacteria representing >95% of the bacterial communities (4 samples). The median relative abundance of the genus Mycobacterium in the plumbing biofilms (3.7%) was appreciably higher than that observed in soil (median relative abundance = 0.37%) and surface waters (median relative abundance = 0.015%). Only 1.3% of surface water samples (5/373) and 11% of soil samples (16/143) had mycobacterial abundances over 1%, while 60% of household plumbing biofilm samples had mycobacterial abundances greater than 1% (384/638) ( Figure 2 ). Download figure Open in new tab Figure 2: Relative abundances of the genus Mycobacterium across three environments (household plumbing biofilm (n=638), soil (n=143), and surface water (n=373)). Relative abundances represent the proportional abundances of taxa assigned to the genus Mycobacterium compared to all other bacteria and archaea detected in each sample from 16S rRNA gene sequencing effort. Median relative abundances of the genus in each environment are noted above each scatterplot. Mycobacterial species-level survey across the three environments While 16S rRNA marker gene sequencing allowed us to compare the relative abundance of the genus Mycobacterium across environment types, species-level information obtained through mycobacterial-specific marker gene sequencing of the hsp65 gene, is crucial for understanding the diversity of mycobacterial taxa in each environment, especially those of clinical significance. To better summarize the broad-scale diversity of the NTM in these environments, we phylogenetically grouped mycobacterial ASVs into “clusters” based on phylogenetic relatedness. Most NTM clusters found in the household plumbing biofilms clustered with known reference sequences (>80% sequence similarity to an isolate found in the reference database), including many of known clinical significance (for example Mycobacterium avium and Mycobacterium chelonae ). In contrast, many NTM clusters identified in soil and surface waters could not be identified below the genus level of taxonomic resolution as they did not include any named species in our phylogenetic analyses. When we focused on the top 50 NTM clusters detected in each of the three environments (150 in total), we found that in household plumbing biofilms, 24 clusters were found to contain a reference sequence (48%), but only 24% of clusters in soil and 16% of clusters in surface waters shared similarity with a reference sequence. All three environments harbored a broad diversity of NTM, spanning the mycobacterial phylogenetic tree ( Figure 3 ), however, the amount of novel taxonomic diversity observed in natural environments was higher than what was observed in household plumbing biofilms. Download figure Open in new tab Figure 3: Maximum likelihood tree, using the mycobacterial hsp65 gene, showing 189 reference strains, plus one representative ASV from each of the top 50 NTM clusters detected in each environment (135 unique ASVs total). Colors of outside ring represent the environment in which the NTM cluster was detected (household plumbing biofilm = green, soil = brown, surface waters = blue). Phylogenetic tree was rooted using the hsp65 sequence from Nocardia farcinica DSM43665. NTM Cluster Occupancy Although NTM were detected in nearly every sample, regardless of the environment in question, the composition of the mycobacterial communities varied across environment types ( Figure 4 ). The most abundant NTM taxa found in the household plumbing biofilm samples were M. gordonae , followed closely by M. mucogenicum/phocaicum , while the most abundant taxa found in soil were M. madagascariense and M. holsaticum . The most abundant NTMs in the surface water dataset could not be classified to species as they were not closely related to any named NTM species in our reference database ( Figure 4C ). The variation in NTM community composition across the household plumbing biofilm samples was far greater than the variation detected across either the soil or surface water samples ( Figure 4 ). Additionally, the composition of the NTM communities found in surface waters and soils were generally more similar to each other than to those found in the household plumbing biofilm samples ( Figure 4 ), highlighting that each of the three broad environment types harbor distinct NTM communities. Download figure Open in new tab Download figure Open in new tab Figure 4: Bar plots showing the percent of samples (percent occupancy, i.e. percent of samples from each environment in which a given taxon was detected). Panel A: household plumbing, Panel B: global soils, Panel C: surface waters. Bars shaded in red are NTM taxa inferred to have high clinical significance, while bars shaded in yellow have low, or limited, clinical significance. Bars outlined in gray have no reported clinical significance. Taxa indicated by 8 M. ssp. 9 represent lineages that do not include any named mycobacterial isolates. On the right of each bar plot are shown principal coordinate analysis (PCoA) colored by environment type (household plumbing biofilms in green, soils in brown, surface waters in blue), showing variation in overall NTM community composition across the three environments. We note that that three plots are identical except for the highlighting of specific sample types. Relative abundance and ubiquity of clinically relevant NTM in the environment The number of samples that contained clinically relevant NTM varied between environment types, with most clinically relevant taxa detected in the household plumbing biofilm samples ( M. avium complex, M. mucogenicum , M. abscessus ), while the top 50 taxa detected in soils only contained a handful of named strains, two of which have limited clinical significance ( M. florentinum and M. riyadhense , detected in 17% and 14% of samples, respectively). The surface water samples contained only two named clinically relevant NTM, M. chelonae complex and the M. scrofulaceum complex, which were detected in 2.9% and 2.3% of samples, respectively. We chose to focus on six clinically relevant nontuberculous mycobacterial taxa that are frequently detected in clinical samples from human patients ( M. mucogenicum / M. phocaicum , M. avium complex, M. chelonae complex, M. abscessus complex, and M. fortuitum complex, ( Daley et al. 2020 )) and how their relative abundances and occurrence patterns varied across the three environments ( Figure 4 ). All six clinically relevant NTM clusters were detected in household plumbing biofilms. Four of the 6 taxa ( M. mucogenicum/phocaicum , M. avium complex 1, M. chelonae complex, and M. abscessus complex) were the most ubiquitous in household plumbing biofilms ( Figure 5 ). For example, M. mucogenicum/phocaicum was found in ∼39% of samples from household plumbing biofilms, with a mean relative abundance of 16% of mycobacterial hsp65 reads, compared to less than 1% in the natural environments. The M. avium complex 1 was not detected in either soil or surface water samples but was found in nearly 7% of the household plumbing biofilm samples, with a mean relative abundance of 1.7% ( Figure 5 ). The M. avium complex 2 and the M. fortuitum complex, although not detected in surface waters, were detected in a greater number of soil samples compared to household plumbing biofilms (10% vs. 6.9% and 12.1% vs. 2%, respectively). Although the M. avium complex 2 was detected across more soil samples, it had a higher mean relative abundance in household plumbing biofilms (1.4%), compared with soil (0.29%). Download figure Open in new tab Figure 5: Scatterplots showing the relative abundance of six clinically relevant NTM groups across the three environments: A) M. mucogenicum complex, B) M. avium complex 1, C) M. avium complex 2, D) M. chelonae complex, E) M. abscessus complex, F) M. fortuitum complex. Mean relative abundances and 95% confidence intervals are shown in red. Relative abundances were calculated by dividing the number of hsp65 reads assigned to each group in a sample by the total number of mycobacterial hsp65 reads from that sample. Discussion and Conclusions Nontuberculous mycobacteria pulmonary disease is on the rise in the United States and around the world ( Dahl et al. 2022 ; Bents et al. 2024 ). Although many environments have been implicated in the direct transmission of disease, the ecology of NTM across environments remains poorly understood, and studies showing how NTM taxa, including known pulmonary pathogens, vary between environment types remain limited. Here we characterized the variation in the amounts and types of NTM, including those of clinical significance, across a broad range of environments frequently implicated as sources of NTM exposure, including both natural environments (soils, surface waters) and a built environment (household premise plumbing). While we detected members of the genus Mycobacterium in nearly all samples from all three environments, the relative abundance and types of NTM differed appreciably across environments. The median relative abundance of the genus Mycobacterium in both natural environments was low compared to that of household plumbing. We also found that the three environments harbored diverse and distinct NTM communities ( Figure 3 ), but most of the NTM taxa identified, particularly in the natural environments, were of limited to no clinical significance. Of note, clinically significant NTM (including M. mucogenicum and M. abscessus ) were more frequently detected and more abundant in household plumbing biofilms compared to the natural environments surveyed ( Figure 4 ). These results suggest that household plumbing biofilms, not soils or surface waters, likely pose a higher risk of NTM pathogen exposure, and subsequent infection. Although clinically relevant NTM were more frequently detected in household plumbing samples, we note that detection of pathogens does not necessarily equate to a higher risk of infection from household water sources as association between the number of pathogenic NTM cells and disease risk remains uncertain ( Falkinham 2016 ). Likewise, differences in exposure routes, duration, and frequencies likely influence infection risk. However, our results do suggest that patients at risk of NTM infections are more likely to acquire infections from premise plumbing sources than from soils or surface waters, emphasizing the potential risks associated with exposures to certain environments. Of note, the M. scrofulaceum complex, which encompasses the clinically relevant species M. scrofulaceum , M. interjectum , and M. malmoense , appears rarely in the household plumbing biofilm samples (occupancy = 0.39%) but appears more frequently in both natural environments (occupancy = 10% in soil, and 2.3% in surface waters), reflecting the known susceptibility of this NTM group to the chlorination practices commonly used to treat household water supplies in the US, practices that may be associated with a decrease in M. scrofulaceum cases in the US ( Falkinham 2003 ). Together our study highlights that, while many environments harbor NTM, they do not all harbor the same amounts and types of NTM, including clinically relevant taxa which are particularly ubiquitous and abundant in premise plumbing biofilms compared to soils and surface waters. Overall, a better understanding of the ecology of NTM in source environments, including the distributions of clinically relevant NTM taxa, should help inform epidemiological investigations of NTM disease outbreaks and guide recommendations provided to disease susceptible individuals to minimize NTM exposures. Future research should focus on the factors that contribute to NTM selection in the built environment – a likely important route of exposure for human disease. Understanding where certain NTM, especially potential pulmonary pathogens, are coming from, will play a key role in potentially preventing their accumulation in premise plumbing biofilms. Funding sources This work was supported in part by the Division of Intramural Research, National Institute for Allergy and Infectious Diseases, National Institutes of Health. This work was also funded by intramural grants provided to N.F. and M.J.G. from the Cooperative Institute for Research in Environmental Sciences (CIRES) at the University of Colorado Boulder. The authors of this study declare no competing interests or conflicts of interests. Acknowledgements We thank Caihong Vanderburgh for her assistance in the laboratory with sample processing, Holly Roth for help with remote access to the USGS databases, Dr. Andrew Blakney for providing feedback on the manuscript, as well as everyone at USGS collection sites across the United States who contributed filters to this study. Additionally, we thank Dr. Conor Meehan for his assistance and guidance with the updated hsp65 database. References ↵ Balaban , Metin , Niema Moshiri , Uyen Mai , Xingfan Jia , and Siavash Mirarab . 2019 . “ TreeCluster: Clustering Biological Sequences Using Phylogenetic Trees .” PloS One 14 ( 8 ): e0221068 . OpenUrl CrossRef PubMed ↵ Baldwin , Susan L. , Sasha E. Larsen , Diane Ordway , Gail Cassell , and Rhea N. Coler . 2019 . “ The Complexities and Challenges of Preventing and Treating Nontuberculous Mycobacterial Diseases .” PLoS Neglected Tropical Diseases 13 ( 2 ): e0007083 . OpenUrl ↵ Bents , Samantha J. , Rachel A. Mercaldo , Collin Powell , Emily Henkle , Theodore K. Marras , and D. Rebecca Prevots . 2024 . “ Nontuberculous Mycobacterial Pulmonary Disease (NTM PD) Incidence Trends in the United States, 2010-2019 .” BMC Infectious Diseases 24 ( 1 ): 1094 . OpenUrl CrossRef PubMed ↵ Bland , Christopher S. , Jamie M. Ireland , Eduardo Lozano , Maria E. Alvarez , and Todd P. Primm . 2005 . “ Mycobacterial Ecology of the Rio Grande .” Applied and Environmental Microbiology 71 ( 10 ): 5719 – 27 . OpenUrl Abstract / FREE Full Text ↵ Brennan , P. J. , and H. Nikaido . 1995 . “ The Envelope of Mycobacteria .” Annual Review of Biochemistry 64 ( 1 ): 29 – 63 . OpenUrl CrossRef PubMed Web of Science ↵ Callahan , Benjamin J. , Paul J. McMurdie , Michael J. Rosen , Andrew W. Han , Amy Jo A . Johnson , and Susan P. Holmes . 2016 . “ DADA2: High-Resolution Sample Inference from Illumina Amplicon Data .” Nature Methods 13 ( 7 ): 581 – 83 . OpenUrl PubMed ↵ Capella-Gutiérrez , Salvador , José M. Silla-Martínez , and Toni Gabaldón . 2009 . “TrimAl: A Tool for Automated Alignment Trimming in Large-Scale Phylogenetic Analyses.” Bioinformatics (Oxford , England ) 25 ( 15 ): 1972 – 73 . OpenUrl ↵ Centers for Disease Control and Prevention, Atlanta, GA, United States . 2024 . “ About Nontuberculous Mycobacteria (NTM) Infections .” Nontuberculous Mycobacteria (NTM) . April 15, 2024. https://www.cdc.gov/nontuberculous-mycobacteria/about/index.html . ↵ Dahl , Victor Naestholt , Martin Mølhave , Andreas Fløe , Jakko van Ingen , Thomas Schön , Troels Lillebaek , Aase Bengaard Andersen , and Christian Wejse . 2022 . “ Global Trends of Pulmonary Infections with Nontuberculous Mycobacteria: A Systematic Review .” International Journal of Infectious Diseases: IJID: Official Publication of the International Society for Infectious Diseases 125 ( December ): 120 – 31 . OpenUrl PubMed ↵ Dai , Jianli , Yuansha Chen , and Michael Lauzardo . 2011 . “ Web-Accessible Database of Hsp65 Sequences from Mycobacterium Reference Strains .” Journal of Clinical Microbiology 49 ( 6 ): 2296 – 2303 . OpenUrl Abstract / FREE Full Text ↵ Daley , Charles L. , Jonathan M. Iaccarino , Christoph Lange , Emmanuelle Cambau , Richard J. Wallace Jr . , Claire Andrejak , Erik C. Böttger , et al. 2020 . “ Treatment of Nontuberculous Mycobacterial Pulmonary Disease: An Official ATS/ERS/ESCMID/IDSA Clinical Practice Guideline .” The European Respiratory Journal: Official Journal of the European Society for Clinical Respiratory Physiology 56 ( 1 ). doi: 10.1183/13993003.00535-2020 . OpenUrl CrossRef ↵ Delgado-Baquerizo , Manuel , Angela M. Oliverio , Tess E. Brewer , Alberto Benavent-González , David J. Eldridge , Richard D. Bardgett , Fernando T. Maestre , Brajesh K. Singh , and Noah Fierer . 2018 . “A Global Atlas of the Dominant Bacteria Found in Soil.” Science (New York , N.Y .) 359 ( 6373 ): 320 – 25 . OpenUrl ↵ Delghandi , Mohammad Reza , K. Waldner , M. El-Matbouli , and S. Menanteau-Ledouble . 2020 . “ Identification Mycobacterium Spp. in the Natural Water of Two Austrian Rivers .” Microorganisms 8 ( August ). doi: 10.3390/microorganisms8091305 . OpenUrl CrossRef ↵ Falkinham , Joseph O. , 3rd . . 2003 . “ Factors Influencing the Chlorine Susceptibility of Mycobacterium Avium, Mycobacterium Intracellulare, and Mycobacterium Scrofulaceum .” Applied and Environmental Microbiology 69 ( 9 ): 5685 – 89 . OpenUrl Abstract / FREE Full Text ↵ Falkinham , Joseph O . 2016 . “ Current Epidemiologic Trends of the Nontuberculous Mycobacteria (NTM) .” Current Environmental Health Reports 3 ( 2 ): 161 – 67 . OpenUrl PubMed ↵ Gebert , Matthew J. , Manuel Delgado-Baquerizo , Angela M. Oliverio , Tara M. Webster , Lauren M. Nichols , Jennifer R. Honda , Edward D. Chan , Jennifer Adjemian , Robert R. Dunn , and Noah Fierer . 2018 . “ Ecological Analyses of Mycobacteria in Showerhead Biofilms and Their Relevance to Human Health .” MBio 9 ( 5 ). doi: 10.1128/mBio.01614-18 . OpenUrl CrossRef ↵ George , K. L. , B. C. Parker , H. Gruft , and J. O. Falkinham 3rd . . 1980 . “ Epidemiology of Infection by Nontuberculous Mycobacteria. II. Growth and Survival in Natural Waters .” The American Review of Respiratory Disease 122 ( 1 ): 89 – 94 . OpenUrl PubMed Web of Science ↵ Gross , Jane E. , Silvia Caceres , Katie Poch , Nabeeh A. Hasan , Rebecca M. Davidson , L. Elaine Epperson , Ettie Lipner , et al. 2021 . “ Healthcare-Associated Links in Transmission of Nontuberculous Mycobacteria among People with Cystic Fibrosis (HALT NTM) Study: Rationale and Study Design .” PloS One 16 ( 12 ): e0261628 . OpenUrl PubMed ↵ Jacobs , John , Matt Rhodes , Brian Sturgis , and Bob Wood . 2009 . “ Influence of Environmental Gradients on the Abundance and Distribution of Mycobacterium Spp. in a Coastal Lagoon Estuary .” Applied and Environmental Microbiology 75 ( 23 ): 7378 – 84 . OpenUrl Abstract / FREE Full Text ↵ Katoh , K. , K. Misawa , K. Kuma , and T. Miyata . 2002 . “ MAFFT: A Novel Method for Rapid Multiple Sequence Alignment Based on Fast Fourier Transform .” Nucleic Acids Research 30 ( 14 ): 3059 – 66 . OpenUrl CrossRef PubMed Web of Science ↵ Kim , Si Hyun , and Jeong Hwan Shin . 2018 . “ Identification of Nontuberculous Mycobacteria Using Multilocous Sequence Analysis of 16S RRNA, Hsp65, and RpoB .” Journal of Clinical Laboratory Analysis 32 ( 1 ). doi: 10.1002/jcla.22184 . OpenUrl CrossRef ↵ Kopecky , Jan , Martina Kyselkova , Marek Omelka , Ladislav Cermak , Jitka Novotna , Geneviève Grundmann , Yvan Moënne-Loccoz , and Marketa Sagova-Mareckova . 2011 . “ Environmental Mycobacteria Closely Related to the Pathogenic Species Evidenced in an Acidic Forest Wetland .” Soil Biology & Biochemistry 43 ( 3 ): 697 – 700 . OpenUrl ↵ Lake , M. Alexandra , Lyn R. Ambrose , Marc C. I. Lipman , and David M. Lowe . 2016 . “ ’ ‘Why Me, Why Now?’ Using Clinical Immunology and Epidemiology to Explain Who Gets Nontuberculous Mycobacterial Infection .” BMC Medicine 14 ( 1 ): 54 . OpenUrl PubMed ↵ Makovcova , J. , M. Slany , V. Babak , I. Slana , and P. Kralik . 2014 . “ The Water Environment as a Source of Potentially Pathogenic Mycobacteria .” Journal of Water and Health 12 ( 2 ): 254 – 63 . OpenUrl Abstract ↵ Martin , Marcel . 2011 . “ Cutadapt Removes Adapter Sequences from High-Throughput Sequencing Reads .” EMBnet.Journal 17 ( 1 ): 10 – 12 . OpenUrl ↵ McMurdie , Paul J. , and Susan Holmes . 2013 . “ Phyloseq: An R Package for Reproducible Interactive Analysis and Graphics of Microbiome Census Data .” PloS One 8 ( 4 ): e61217 . OpenUrl CrossRef PubMed ↵ Mercaldo , Rachel A. , Julia E. Marshall , Gerard A. Cangelosi , Maura Donohue , Joseph O. Falkinham 3rd . , Noah Fierer , Joshua P. French , et al. 2023 . “ Environmental Risk of Nontuberculous Mycobacterial Infection: Strategies for Advancing Methodology .” Tuberculosis 139 (March): 102305 . OpenUrl CrossRef PubMed ↵ Modra , Helena , Vit Ulmann , Milan Gersl , Vladimir Babak , Ondrej Konecny , Dana Hubelova , Jan Caha , Jan Kudelka , Joseph Oliver Falkinham 3rd . , and Ivo Pavlik . 2023 . “ River Sediments Downstream of Villages in a Karstic Watershed Exhibited Increased Numbers and Higher Diversity of Nontuberculous Mycobacteria .” Microbial Ecology 87 ( 1 ): 15 . OpenUrl PubMed ↵ Oksanen , J. , F. G. Blanchet , R. Kindt , P. Legendre , P. R. Minchin , R. B. O’hara , and Oksanen M . 2013 . “Package ‘Vegan.’” Community Ecology Package , Version 2 ( 9 ): 1 – 295 . OpenUrl ↵ Parks , Donovan H. , Maria Chuvochina , Christian Rinke , Aaron J. Mussig , Pierre-Alain Chaumeil , and Philip Hugenholtz . 2022 . “ GTDB: An Ongoing Census of Bacterial and Archaeal Diversity through a Phylogenetically Consistent, Rank Normalized and Complete Genome-Based Taxonomy .” Nucleic Acids Research 50 ( D1 ): D785 – 94 . OpenUrl CrossRef PubMed ↵ Quast , Christian , Elmar Pruesse , Pelin Yilmaz , Jan Gerken , Timmy Schweer , Pablo Yarza , Jörg Peplies , and Frank Oliver Glöckner . 2013 . “ The SILVA Ribosomal RNA Gene Database Project: Improved Data Processing and Web-Based Tools .” Nucleic Acids Research 41 (Database issue): D590 – 6 . OpenUrl CrossRef PubMed Web of Science ↵ Reyn , C. F. von , R. D. Waddell , T. Eaton , R. D. Arbeit , J. N. Maslow , T. W. Barber , R. J. Brindle , C. F. Gilks , J. Lumio , and J. Lähdevirta . 1993 . “ Isolation of Mycobacterium Avium Complex from Water in the United States, Finland, Zaire, and Kenya .” Journal of Clinical Microbiology 31 ( 12 ): 3227 – 30 . OpenUrl Abstract / FREE Full Text ↵ Riskin , M. L. , and C. J. Lee . 2021 . “ USGS National Water Quality Monitoring Network .” https://pubs.usgs.gov/publication/fs20213019 . ↵ Roguet , A. , C. Therial , M. Saad , L. Boudahmane , L. Moulin , and F. S. Lucas . 2016 . “ High Mycobacterial Diversity in Recreational Lakes .” Antonie van Leeuwenhoek 109 ( 5 ): 619 – 31 . OpenUrl CrossRef PubMed ↵ Sarro , Yeya Ds , Bourahima Kone , Bassirou Diarra , Alisha Kumar , Ousmane Kodio , Djeneba B. Fofana , Chad J. Achenbach , et al. 2018 . “ Simultaneous Diagnosis of Tuberculous and Non-Tuberculous Mycobacterial Diseases: Time for a Better Patient Management .” Clinical Microbiology and Infectious Diseases 3 ( 3 ). doi: 10.15761/CMID.1000144 . OpenUrl CrossRef ↵ Telenti , A. , F. Marchesi , M. Balz , F. Bally , E. C. Böttger , and T. Bodmer . 1993 . “ Rapid Identification of Mycobacteria to the Species Level by Polymerase Chain Reaction and Restriction Enzyme Analysis .” Journal of Clinical Microbiology 31 ( 2 ): 175 – 78 . OpenUrl Abstract / FREE Full Text ↵ Ulmann , Vit , Anna Kracalikova , and Radka Dziedzinska . 2015 . “ Mycobacteria in Water Used for Personal Hygiene in Heavy Industry and Collieries: A Potential Risk for Employees .” International Journal of Environmental Research and Public Health 12 ( 3 ): 2870 – 77 . OpenUrl ↵ US Geological Survey . 2006 . >“ Chapter A4. Collection of Water Samples .” 09-A4. Version 2.0, Revised September 2006 (original version published September 1999). Techniques of Water-Resources Investigations . Reston, VA : US Geological Survey . doi: 10.3133/twri09a4 . OpenUrl CrossRef ↵ Walsh , Corinne M. , Matthew J. Gebert , Manuel Delgado-Baquerizo , Fernando T. Maestre , and Noah Fierer . 2019 . “ A Global Survey of Mycobacterial Diversity in Soil .” Applied and Environmental Microbiology 85 ( 17 ). doi: 10.1128/AEM.01180-19 . OpenUrl Abstract / FREE Full Text ↵ Wheeler , Travis J. , and Sean R. Eddy . 2013 . “ Nhmmer: DNA Homology Search with Profile HMMs .” Bioinformatics 29 ( July ): 2487 – 89 . OpenUrl CrossRef PubMed Web of Science ↵ Winthrop , Kevin L. , Theodore K. Marras , Jennifer Adjemian , Haixin Zhang , Ping Wang , and Quanwu Zhang . 2020 . “ Incidence and Prevalence of Nontuberculous Mycobacterial Lung Disease in a Large U.s. Managed Care Health Plan, 2008-2015 .” Annals of the American Thoracic Society 17 ( 2 ): 178 – 85 . OpenUrl PubMed View the discussion thread. Back to top Previous Next Posted August 04, 2025. Download PDF Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following A cross-environment comparison of nontuberculous mycobacterial diversity Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share A cross-environment comparison of nontuberculous mycobacterial diversity Matthew J. Gebert , Ettie M. Lipner , Jordan M. Galletta , Jessica B. Henley , Michael Hoffert , Melissa L. Riskin , D. Rebecca Prevots , Noah Fierer bioRxiv 2025.08.04.668438; doi: https://doi.org/10.1101/2025.08.04.668438 Share This Article: Copy Citation Tools A cross-environment comparison of nontuberculous mycobacterial diversity Matthew J. Gebert , Ettie M. Lipner , Jordan M. Galletta , Jessica B. Henley , Michael Hoffert , Melissa L. Riskin , D. Rebecca Prevots , Noah Fierer bioRxiv 2025.08.04.668438; doi: https://doi.org/10.1101/2025.08.04.668438 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Microbiology Subject Areas All Articles Animal Behavior and Cognition (7635) Biochemistry (17697) Bioengineering (13894) Bioinformatics (41951) Biophysics (21455) Cancer Biology (18592) Cell Biology (25507) Clinical Trials (138) Developmental Biology (13380) Ecology (19903) Epidemiology (2067) Evolutionary Biology (24321) Genetics (15610) Genomics (22509) Immunology (17737) Microbiology (40398) Molecular Biology (17182) Neuroscience (88618) Paleontology (667) Pathology (2833) Pharmacology and Toxicology (4825) Physiology (7641) Plant Biology (15158) Scientific Communication and Education (2046) Synthetic Biology (4296) Systems Biology (9825) Zoology (2271)
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.