Global patterns of taxonomic and functional diversity in hot springs microbiomes

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 43,367 characters · extracted from preprint-html · click to expand
Global patterns of taxonomic and functional diversity in hot springs microbiomes | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Global patterns of taxonomic and functional diversity in hot springs microbiomes José Ignacio Arroyo , Beatriz Díez , Pablo A. Marquet doi: https://doi.org/10.1101/2025.08.04.668570 José Ignacio Arroyo 1 Facultad de Ciencias Biológicas, Pontificia Universidad Católica de Chile Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: jiarroyo{at}uc.cl pmarquet{at}bio.puc.cl Beatriz Díez 2 Departamento de Genética Molecular y Microbiología, Facultad de Ciencias Biológicas, Pontificia Universidad Católica de Chile Find this author on Google Scholar Find this author on PubMed Search for this author on this site Pablo A. Marquet 1 Facultad de Ciencias Biológicas, Pontificia Universidad Católica de Chile 3 Instituto de Ecología y Biodiversidad (IEB), Las Palmeras 3425, Santiago , Chile 4 Laboratorio Internacional de Cambio Global (LINCGlobal) and Centro de Cambio Global UC, Facultad de Ciencias Biológicas, Pontificia Universidad Católica de Chile , CP 8331150, Santiago, Chile 5 Santa Fe Institute, 1399 Hyde Park Road , Santa Fe, NM 87501, USA 6 Instituto de Sistemas Complejos de Valparaíso (ISCV), Subida Artillería 470 , Valparaíso, Chile Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: jiarroyo{at}uc.cl pmarquet{at}bio.puc.cl Abstract Full Text Info/History Metrics Supplementary material Preview PDF Abstract A reformulation of the metabolic theory of ecology has been proposed based on a derivation of the Eyring-Polanyi equation, leading to a reduced model with the form of a power-law with exponential cut-off (PLECO). Moreover, the recent integration of this new model and metagenomic DNA sequencing theory has led to the hypothesis that, given that temperature affects cell size and assemblage abundance, it should also affect the number of genes, metabolisms, and populations in a microbial community. In particular, for microbial communities, the model predicts that the diversity of taxa, their genes, and metabolisms should respond to temperature according to the PLECO model, and after scaling the data using the estimated parameters, all data should collapse into a single curve. To test these predictions, we use global hot springs microbial communities; geothermally heated environments that include aquatic and terrestrial habitats with large temperature gradients. We analyzed a global database (five continents) of 19 hot springs metagenomes covering a wide gradient of temperature (32-90°C). We found that the alpha diversity of taxa, genes, and their metabolisms decreases with temperature, in agreement with the predictions of the PLECO model. Further, after non-dimensionalization of the model, we derive a single nondimensional curve for taxa and functions. Finally, using general linear models, we analyzed the effects of pH, latitude, and substrate (soil, water, or both), in addition to temperature, to explain the observed diversity pattern. We find that they explain a lower proportion of the variance, but pH can explain up to half of the variance in global diversity in these ecosystems, indicating the need to include pH in the theory. Our study supports the hypothesis that temperature regulates the structure of community genomes. Introduction The metabolic theory of ecology (MTE) integrates the universal constraints imposed by size and temperature on biological rates across levels of biological organization, from organisms to ecosystems ( Brown et al. 2004 , West et al. 2005, Sibly et al. 2012). This framework emerged from the integration of Kleiber’s law, relating body size and metabolic rate, and the empirical Arrhenius equation, relating temperature and the rate of (bio)chemical reactions ( Brown et al. 2004 ). This model was extended to predict different ecological processes from individuals to ecosystems (e.g., Allen et al., Brown et al. 2004 ). Despite the broad scope of predictions of the MTE, there are still challenges, particularly regarding the integration with other theories and the prediction of new patterns and driving variables. For instance, at the community level, theoretical predictions for species richness ( Allen et al. 2002 ) and abundance of heterotrophs ( Allen et al. 2007 ) have been derived assuming that other aspects of ecological complexity (e.g., phylogenetic and functional; Naeem et al. 2016) are not important, which is at odds with theories and data showing that they may be critical to predicting ecological stability and ecosystem functioning ( Thébault and Loreau 2003 , Thébault and Fontaine 2011). We have recently suggested the use of the Eyring-Evans-Polanyi equation, instead of Arrhenius’equation, in predicting biodiversity patterns on the grounds that the former is grounded on solid thermodynamic arguments and is widely accepted as a descriptor of the role of temperature on chemical reactions ( Arroyo et al. 2022 ). This equation is where k is reaction rate (s -1 , for a first-order reaction), k B is the Boltzmann constant, h is the Plank constant (= 6.62 ×10-34 Js -1 ), T is temperature (K), ΔS is the entropy change (J/K), ΔH enthalpy change (J), R is the gas constant (= 8.31 JK -1 mol -1 ). Using this equation, we have proposed a general model of temperature dependence for biological rates, which yields an equation with the form of a power law with an exponential cut-off Here, k could be the number of species (taxa), genes of groups of related genes (gene families, paths or modules), , p 1 = (ΔG/R)+1, and p 2 = ΔH/R, T is temperature is in Kelvin, R is the gas constant, ΔH is free enthalpy change (J), ΔS 0 entropy at T 0 , ΔC is the heat capacity change. Negative values of ΔC gives an asymmetric concave curve that accounts for the breakpoint commonly observed in all temperature response curves. A second prediction of our models is that scaling the data using estimated parameters should give a single curve according to Where and Alternatively, scaling can be done as Where and Eq. 2.1 predicts that data should collapse into a curved pattern, whereas Eq. 2.2 predicts that data should collapse into a linear pattern. After suggesting this new model of temperature dependence, we integrated metabolic ecology and DNA shotgun sequencing theory based on the empirical relationships between temperature and cell size and the effect of mean cell size on assemblage abundance, thus implying that temperature affects assemblage abundance. Then we simplified DNA shotgun sequencing predictions for taxa and gene reads by integrating the genome size-cell size, and population abundance and cell size relationships to predict that taxa and gene reads depend uniquely on population and assemblage abundance, respectively. Finally, by assuming that the abundance and number of genes and groups of genes scale with assemblage abundance, we predicted that ultimately, temperature affects the number of genes and groups of related genes of a community. This results in specific testable predictions of temperature dependence in the richness of taxa, their genes, and metabolisms according to Eq. 1.2 The predictions were relatively well supported by genomes and metagenomes from different taxa and ecosystems, including data from human, terrestrial, and aquatic microbiomes (Chapter 2). A natural laboratory where these predictions can be further tested is hot springs, where are founds temperature gradients are found along a few meters (see for example Alcamán et al. 2015 ). These ecosystems are geothermally heated patches, with temperatures higher than the mean environmental temperature ( Pentecost et al. 2003 , Pentecost et al. 2005 , O’Gorman et al. 2014 ), and where it is often possible to find microbial mats in their surroundings. Comparatively, hot spring microbial mats are less diverse than other terrestrial (e.g., soil) and marine and freshwater ecosystems ( Lozupone and Knight 2007 , Aanniz et al. 2015 ) but contain representatives of most Archaeal and Bacterial lineages ( Sharp et al. 2014 ). These communities can be found both as components of the pelagic environment in the water column or forming mats attached to the bottom sediments and other substrates; the latter are often more diverse than pelagic ones ( Wang et al. 2014 ). Most studies examining ecological patterns in hot springs have been conducted at larger scales. As a general pattern, studies at the scales of meters have shown that abundance and diversity and composition patterns are explained by the temperature, pH and geochemistry with geography becoming important at kilometer scales ( Miller et al. 2009 , Ionescu et al. 2010 , Cuecas et al. 2011, Tobler et al. 2011 , Everroad et al. 2012 , Cole et al. 2013 , Wang et al. 2013, Inskeep et al 2013 , Headd et al. 2014 , Herbold et al. 2014 , Valverde et al. 2014 , Sharp et al. 2014 , Wang et al. 2014 ; Menzel et al 2015 ; Power et al 2018 , Arroyo et al. 2025 ). Here, we fitted four predictions of our recently developed framework of metabolic ecology and metagenomics on global hot springs metagenomes; in particular we predict a temperature dependence of i) the number of taxa, ii) the number of genes, and iii) the number of groups of related genes (e.g. metabolic pathway) and iv) scaling the data with the estimated parameters should result in a single curve according to eqs. 2.1 and 2.2 . v). In addition, we also assessed the effects of pH, latitude, and type of substrate as predictors of taxonomic and functional diversity as they have been shown to explain diversity in these and other ecosystems ( Fierer and Jackson 2006 , Fuhrman et al. 2008 , Inskeep et al. 2013 ). Results We begin by fitting the relationship between the number of species and temperature. The curve model ( eq. 1.2 ) had a significant fit ( Figure 1a ), although its low curvature was statistically different from the linear model of eq. 1.1 (ΔAIC=1.995). Then we fitted the relationship between the number of genes and groups of related genes (e.g., families) with temperature. For this, we used reads annotated according to the functional classification of the SEED database with three different levels of resolution: SEED level 1 (corresponding to biological process), SEED level 2 (corresponding to metabolic pathways, gene families), and SEED level 3 (corresponding to genes, see Methods). The number of genes (SEED level 3) ( Fig. 1 ) and groups of related genes (SEED level 2 and SEED level 1) ( Fig. 2c and Fig. 2d , respectively) decreased significantly with temperature. The number of genes and ‘subsystems’ all fit well to the PLECO model of Eq. 1.2 with an explained variance that varied between 41 to 45%. ( Table 1 ). The estimated parameters of the model ( Eq. 1.2 ) consistently decreased with the level of organization from genes to taxa ( Table 1 ). We also fitted equations. 2.1 and 2.2 to test the universality of temperature dependence regardless of the ecological variable (taxonomic or functional richness). As predicted, data collapsed into a single dimensionless curve according to Eq. 2.1 ( Figure 2 ) or line according to Eq. 2.2 ( Figure 2 , left lower corner). Download figure Open in new tab Fig. 1. Relationship between (a) ln (taxa richness), (b) ln (SEED level 1; biological roles), (c) ln (SEED level 2; families, pathways) and (d) ln(SEED level 3; genes) and 1/T. In the four cases there was a decrease with temperature (or increases with the inverse of temperature, 1/T) in the temperature range 32-90°C. Download figure Open in new tab Fig. 2. Universal temperature dependent curve for taxa and functions. Nondimensionalization based on scales rate and temperature (see Results) showing how temperature-dependence data regardless of variable data collapses into a single curve. Main panel corresponds to Eq. 2.1 and lower left panel to Eq. 2.2 . (◼) Taxa richness, (•) SEED level 1 (biological roles), (▴) SEED level 2 (metabolic pathways, gene families), (⧫) SEED level 3 (genes). View this table: View inline View popup Download powerpoint Table 1. Estimated parameters of models implemented for the effects of temperature (T) ( Fig. 1 ), pH and habitat type (with two levels: terrestrial and aquatic; H). In addition to temperature, we studied the effects on taxonomic and functional diversity of other environmental variables that were recorded in compiled data and our sampling: pH and latitude. Both the logarithm of the number of taxa, genes, or groups of genes and pH fitted significantly to a linear model ( Table 1 ), and the explained variance varied between 44 to 64 %. Latitude was related significantly only to the richness of SEED level 2 groups of genes ( Table 1 ). Finally, we also analyzed the taxonomic and functional diversity among types of habitat (or substrate) from which the sample was originally obtained (mat, water, or a miex of both). For both taxa and functions, the diversity was higher in mat, followed by water and both habitats pooled ( Table 2 ). Using ANOVA, we found that the effect of substrate (mat, water, or mixed) on the logarithm of the number of taxa, genes, or groups of genes was significant in both taxa and functions ( Table 2 ). Post-hoc comparisons showed significant differences among mat, water, and both types of substrates (Table S2). View this table: View inline View popup Download powerpoint Table 2. ANOVA results (η-squared and p-value) for comparisons of number of taxa and SEED 1, 2, and 3 categories among mat, water, and both (pooled). Discussion The importance of developing models in science lies in their objective capacity and predictive usefulness. The ideal is to generate models derived from primary principles, simple formulation (and few parameters), and that explain different variables from a single explanatory variable. The models that have these properties and wide empirical support have been called efficient theories, within which the metabolic theory of ecology is included ( Marquet et al. 2014 ). In microbial ecology, in the last decade, macroecological approaches have been used, evaluating models originally thought for macroorganisms and developing alternatives with valid assumptions for microorganisms ( Barberán et al. 2014 ). For example, in the MTE the assumption that in the temperature range 0-40°C the response is exponential (or linear on a logarithmic scale; Gillooly et al. 2001 ), an assumption that is not very well supported in microorganisms which have a curved behavior within this range or as the case of thermophiles and hyperthermophiles have a positive exponential growth outside this range (e.g. Sharp et al. 2014 ). Therefore, we derived a general model ( Eq. 1.2 , Chapter 1) applicable to plants, animals, and microorganisms and within the entire temperature range of life, but which was derived from primary principles and is simple (i.e., it only has three parameters and on a logarithmic scale can be adjusted using multiple linear regression). We used this general model to develop a theoretical framework for the structure of microbial metagenomes (Arroyo 2020, Chapter 2), which includes some of the predictions tested here. We evaluated this microbial metagenomic framework in microbial communities from hot springs because these ecosystems are a good model to study temperature responses due to the wide temperature ranges at spatial scales of a few centimeters, e.g. 30-60°C; Mackenzie 2014, or meters (30-90°C, Sharp et al. 2014 , Wang et al. 2014 ). Our results showed that, for both taxa, their metabolisms and genes, in the studied temperature range, there was a decline in diversity with temperature, with the tipping point being found before or slightly above 30°C. The value of the parameters varied from genes to metabolisms and species, as is expected in our metabolic ecological metagenomics framework (see Arroyo 2020, Chapter 2), the parameter values depend on the total number of reads sequenced, which increases when recruiting from genes to species. Our approach differs from traditional studies in metagenomic and particularly in hot springs, which have often used comparative approaches to show that temperature is a variable that explains variation in both taxa and functions (in the mesophile-thermophile-hyperthermophile range; ∼30-90 ºC; Sharp et al. 2014 ). However, a few studies have tested predictions of ecological theories, such as Glazier et al. (2012) , who showed that both the number of species and food chain length do not respond well to Arrhenius. Moreover, recent models have been developed in order to explain richness in these ecosystems ( Klales et al. 2012 ). The mechanisms behind these relationships depend on the spatio-temporal scale. At short spatiotemporal scales, they are mostly influenced by the number of individuals ( MacArthur and Wilson 1967 , Hubbell 2001 ) and genes ( Vellend 2003 ), and their maintenance depends on different mechanisms ( Chesson 2000 , Chesson 2018 ), such as resource partitioning. Briefly, many populations with similar metabolisms can coexist in the same community if populations use different resources in space and/or time. Consequently, more productive patches can sustain more individuals, reducing the probability of extinction and concomitantly leading to more species, metabolisms, and genes (see Allen et al. 2007 ). At a large spatiotemporal scale, the effect of temperature on diversification rates ( Allen et al. 2007 ) would also contribute to affecting the richness of taxa, and subsequently genes and metabolisms (Arroyo et al. 2019, Chapter 2). Our results show that the general principles that explain diversity in other ecosystems also apply to extreme temperature environments, and subsequently, the same models or theory can be used universally, irrespective of taxa. The fact that the pattern of temperature dependence for genes that we found in global hot springs is similar to that found in the global ocean ( Sunagawa et al. 2015 ) and opposite to that found in soil may be due to the lower temperature range in soil ecosystems ( Ding et al. 2015 ). Temperature is not the only variable determining diversity in these ecosystems as we also showed that type of substrate, pH, and latitude can explain significant amounts of the variance, as also showed in previous studies ( Miller et al. 2009 , Ionescu et al. 2010 , Cuecas et al. 2011, Tobler et al. 2011 , Everroad et al. 2012 , Cole et al. 2013 , Wang et al. 2013, Inskeep et al 2013 , Headd et al. 2014 , Herbold et y. 2014, Valverde et al. 2014 , Sharp et al. 2014 , Wang et al. 2014 ; Menzel et al 2015 ; Power et al 2018 ). The significant effect of pH emphasizes the need to extend the metabolic theory of ecology to include effects of pH, as this chemical variable also influences enzymatic rate ( Michaelis 1922 , Alberty and Massey 1954 ; Alberty, 2006 ) and subsequently metabolism ( Rektorschek et al. 1998 ), and other properties of ecological systems above the individual-level, such as microbial species richness ( Fierer and Jackson 2006 ). The effects of pH are especially important in organisms that live embedded in substrates, such as those inhabiting soil and aquatic environments, including the ocean and freshwater habitats. Developing a mechanistic but simple model for the effects of pH is of applied importance to predict ecological responses to freshwater acidification, a task that often has been done using empirical approaches (e.g., Ou et al. 2015 , Beaune et al. 2018 ). Further analysis distinguishing Bacteria and Archaea, including functions defined by other databases (e.g. InterPro2GO; Hunter et al. 2014 , eggNOG; Powell et al. 2012 ) and with an increased number of subsamples and/or samples to achieve a higher statistical power, need to be carried out in other hotsprings in order to test the generality of the patterns herein reported. In summary, our analyses showed that genes, metabolisms, and taxa can be well predicted by temperature, supporting the hypothesis that, given that temperature affects assemblage abundance, ultimately it should also affect the number of genes and metabolisms in a community. Moreover, our analysis also showed that pH explains a large amount of variance, indicating the need to extend ecological theory to include variables other than temperature. Methods Data and statistical analysis Data of hot springs metagenomes consisted of metagenomes obtained from previous studies and metagenomes sampled and sequenced by us. We obtained and sequenced eight hot springs mat samples as described in ( Guajardo-Leiva et al. 2018 ) for which the temperature and geographic coordinates were recorded. Additional metagenomic data were obtained from public databases from 18 other hot springs metagenomes spanning latitudinal (from Iceland to Antarctica) and longitudinal (from Yellowstone National Park in North America to Malaysia) geographic gradients, including six continents. Each of these samples was obtained from public databases and was obtained from either mat or water or a mix (of both mat and water; e.g., Menzel et al. 2015 ) and has a record of temperature and geographic coordinates. Our integrated database from our sampling and compiled metagenomic data encompasses a wide range of temperature (from 32 to 98°C), pH (from 2.5 to 9.25), and geographic distance (1 cm-19000 km). Metagenomic data includes different technologies of next-generation sequencing (NGS), including Illumina HiSeq, Ion Torrent, and Illumina MiSeq (Sanger and 454 were not included because of low depth of data; see Table S1). (However, to make these different technologies comparable, we apply a set of procedures, see below). Raw metagenomic data were preprocessed with cutadapt version 1.8.1 ( Martin 2011 ) to remove 5’ adapter and 3’ low-quality sequences. The metagenomic data that we have used were derived from three different technologies, which differ in read length and sequencing depth. It has been shown that different sequencing technologies can be comparable (Luo et al. 2012), however, in order to avoid errors, we made some corrections. To correct for differences in read length, we have established a minimum length of 30 bp, which is a plausible length for annotation ( Carr and Borenstein 2014 , Sims et al. 2014 ). All sequences with quality <30 were removed. To avoid biases in the estimation of diversity because of variable depths, after preprocessing, sequences were rarefied. To do this, it was randomly subsampled five million reads (the minimum depth among the 23 samples) in each sample using fastq-tools ( https://homes.cs.washington.edu/~dcjones/fastq-tools/ ). Direct alignment of the preprocessed and subsampled nucleotide sequences against protein non-redundant NCBI database (NCBI-nr) was performed using DIAMOND ( Buchfink et al. 2015 ) with an e-value of 1e-10. To overcome differences in sequencing deep not effect because we have randomly subsampled the same amount of reads among samples. The taxonomic and functional assignments based on the alignments were interpreted using MEGAN6 ( Huson et al. 2016 ). Here we based on functions assigned by the SEED database (Overbeck et al. 2005, Overbeck et al. 2014). Briefly, this database of genome annotation employs the subsystem approach. A subsystem is a set of functional role that constitutes a biological process or structure. Then a subsystem includes metabolic pathways (glycolysis) and other protein interactions such as ribosomes. The classification of genes within subsystem is hierarchically nested, where in the lowest level (SEED level 1) includes the more general functions with 44 categories (e.g. membrane transport, motility and chemotaxis, stress response, among others), the intermediate level of resolution includes nested functions (SEED level 2, 1136 categories; e.g. glutamate dehydrogenases, glycine biosynthesis, etc.), and the highest level correspond to genes (SEED level 1, 5738 categories; e.g. arginase, cysteine synthase A, etc.). Relationships between the number of taxa, genes, and groups of genes and temperature were performed using (simple or multiple) linear regression, according to the Eyring-Polanyi eq. of two parameters ( eq. 1.1 ) or eq. 1.2 . Regressions were performed using the lm function as implemented in the R programming environment. Empirical relationships between the logarithm of the number of taxa, genes, and metabolisms and pH, and latitude were assessed using simple linear regression. Also, using the lm function. To test the effect of the type of substrate (mat, water or both) we performed ANOVA using the aov and lm functions as implemented in R. Acknowledgments JIA acknowledges support from a CONICYT National Doctoral Scholarship N° 21130515 References ↵ Aanniz T , Ouadghiri M , Melloul M , et al. ( 2015 ) Thermophilic bacteria in Moroccan hot springs, salt marshes and desert soils . Braz J Microbiol 46 ( 2 ): 443 – 453 . OpenUrl CrossRef PubMed ↵ Alcamán ME , Fernandez C , Delgado A , Bergman B , Díez B ( 2015 ) The cyanobacterium Mastigocladus fulfills the nitrogen demand of a terrestrial hot spring microbial mat . ISME J 9 ( 10 ): 2290 – 303 . OpenUrl CrossRef PubMed ↵ Alberty R , and Massey V ( 1954 ) On the interpretation of the pH variation of the maximum initial velocity of an enzymecatalyzed reaction . Biochim Biophys Acta 13 : 347 – 353 . OpenUrl PubMed ↵ Alberty R ( 2006 ) Relations between biochemical thermodynamics and biochemical kinetics . Biophys Chem 124 : 11 – 17 . OpenUrl CrossRef PubMed Web of Science ↵ Storch D , Marquet P and Brown J Allen A , Gillooly J & Brown J ( 2007 ) Recasting the species–energy hypothesis: the different roles of kinetic and potential energy in regulating biodiversity . Scaling biodiversity (ed. by Storch D , Marquet P and Brown J ), pp. 1 – 29 . Cambridge University Press , Cambridge . ↵ Allen AP , Brown JH , Gillooly JF ( 2002 ) Global biodiversity, biochemical kinetics, and the energetic-equivalence rule . Science 297 ( 5586 ): 1545 – 8 . OpenUrl Abstract / FREE Full Text ↵ Arroyo , J. I. , Díez , B. , Kempes , C. P. , West , G. B. , & Marquet , P. A. ( 2022 ). A general theory for temperature dependence in biology . Proceedings of the National Academy of Sciences , 119 ( 30 ), e2119872119 . OpenUrl CrossRef PubMed ↵ Arroyo , J. I. , Pedrós-Alió , C. , Polz , M. F. , Mackenzie , R. , Marquet , P. A. , & Díez , B. ( 2025 ). Fine-scale spatial patterns in hot springs mat bacterial communities . bioRxiv , 2025 – 03 . ↵ Barberán A , Casamayor , EO , & Fierer , N ( 2014 ) The microbial contribution to macroecology . Front Microbiol 5 : 203 . OpenUrl CrossRef PubMed ↵ Beaune D , Sellier Y , Luquet G , Grandjean F ( 2018 ) Freshwater acidification: an example of an endangered crayfish species sensitive to pH . Hydrobiologia 813 ( 1 ) 41 – 50 . OpenUrl CrossRef ↵ Brown JH , Gillooly JF , Allen AP , Savage VM , West GB ( 2004 ) Toward a metabolic theory of ecology . Ecology 85 ( 7 ): 1771 – 1789 . OpenUrl CrossRef Web of Science ↵ Buchfink B , Xie C , Huson DH ( 2015 ) Fast and sensitive protein alignment using DIAMOND . Nat Methods 12 ( 1 ): 59 – 60 . OpenUrl CrossRef PubMed ↵ Carr R , Borenstein E ( 2014 ) Comparative analysis of functional metagenomic annotation and the mappability of short reads . PLoS One 9 ( 8 ): e105776 . OpenUrl CrossRef PubMed ↵ Chesson P ( 2000 ) Mechanisms of maintenance of species diversity . Annu Rev Ecol Syst 31 : 343 – 66 OpenUrl CrossRef Web of Science ↵ Chesson P ( 2018 ) Updates on mechanisms of maintenance of species diversity . J Ecol 106 ( 5 ): 1773 – 1794 . OpenUrl ↵ Cole JK , Peacock JP , Dodsworth JA , Williams AJ , Thompson DB , Dong H , Wu G , Hedlund BP ( 2013 ) Sediment microbial communities in Great Boiling Spring are controlled by temperature and distinct from water communities . ISME J 7 ( 4 ): 718 – 29 . OpenUrl CrossRef PubMed Cuecas A , Portillo MC , Kanoksilapatham W , Gonzalez JM ( 2014 ) Bacterial distribution along a 50°C temperature gradient reveals a parceled out hot spring environment . Microb Ecol 68 ( 4 ): 729 – 39 . OpenUrl CrossRef PubMed ↵ Ding J , Zhang Y , Deng Y , Cong J , Lu H , Sun X ( 2015 ) Integrated metagenomics and network analysis of soil microbial community of the forest timberline . Sci Rep 5 : 7994 . OpenUrl CrossRef PubMed ↵ Everroad RC , Otaki H , Matsuura K , Haruta S ( 2012 ) Diversification of bacterial community composition along a temperature gradient at a thermal spring . Microbes Environ 27 ( 4 ): 374 – 81 . OpenUrl CrossRef PubMed Web of Science ↵ Fierer N , Jackson RB ( 2006 ) The diversity and biogeography of soil bacterial communities . Proc Natl Acad Sci U S A 103 ( 3 ): 626 – 31 . OpenUrl Abstract / FREE Full Text ↵ Fuhrman JA , Steele JA , Hewson I , Schwalbach MS , Brown MV , Green JL , Brown JH ( 2008 ) A latitudinal diversity gradient in planktonic marine bacteria . Proc Natl Acad Sci U S A 105 ( 22 ): 7774 – 8 . OpenUrl Abstract / FREE Full Text ↵ Gillooly JF , Brown JH , West GB , Savage VM , Charnov EL ( 2001 ) Effects of size and temperature on metabolic rate . Science 293 ( 5538 ): 2248 – 51 . OpenUrl Abstract / FREE Full Text ↵ Guajardo-Leiva S , Pedrós-Alió C , Salgado O , Pinto F , Díez B ( 2018 ) Active Crossfire Between Cyanobacteria and Cyanophages in Phototrophic Mat Communities Within Hot Springs . Front Microbiol 9 : 2039 . OpenUrl PubMed ↵ Glazier DS ( 2012 ) Temperature affects food-chain length and macroinvertebrate species richness in spring ecosystems . Fresh Sci 31 ( 2 ): 575 – 585 . OpenUrl Hasler CT , Jeffrey JD , Schneider EVC , Hannan KD , Tix JA , Suski CD ( 2018 ) Biological consequences of weak acidification caused by elevated carbon dioxide in freshwater ecosystems . Hydrobiologia 806 : 1 – 12 . OpenUrl CrossRef ↵ Headd B , Engel AS ( 2014 ) Biogeographic congruency among bacterial communities from terrestrial sulfidic springs . Front Microbiol 5 : 473 . OpenUrl PubMed ↵ Herbold CW , Lee CK , McDonald IR , Cary SC ( 2014 ) Evidence of global-scale aeolian dispersal and endemism in isolated geothermal microbial communities of Antarctica . Nat Commun 5 : 3875 . OpenUrl CrossRef PubMed ↵ Hubbell SP ( 2001 ) The Unified Neutral Theory of Biodiversity and Biogeography . Princeton University Press . ↵ Hunter S , Corbett M , Denise H , Fraser M , Gonzalez-Beltran A , Hunter C , et al. ( 2014 ) EBI metagenomics--a new resource for the analysis and archiving of metagenomic data . Nucleic Acids Res 42 ( Database issue ): D600 – 6 . OpenUrl CrossRef PubMed Web of Science ↵ Huson DH , Beier S , Flade I , Górska A , El-Hadidi M , Mitra S , et al. ( 2016 ) MEGAN Community Edition - Interactive Exploration and Analysis of Large-Scale Microbiome Sequencing Data . PLoS Comput Biol 12 ( 6 ): e1004957 . OpenUrl CrossRef PubMed ↵ Inskeep WP , Jay ZJ , Tringe SG , Herrgård MJ , Rusch DB ( 2013 ) YNP Metagenome Project Steering Committee and Working Group Members . The YNP Metagenome Project: Environmental Parameters Responsible for Microbial Distribution in the Yellowstone Geothermal Ecosystem. Front Microbiol 4 : 67 . OpenUrl PubMed ↵ Ionescu D , Hindiyeh M , Malkawi H , Oren A ( 2010 ) Biogeography of thermophilic cyanobacteria: insights from the Zerka Ma’in hot springs (Jordan) . FEMS Microbiol Ecol 72 ( 1 ): 103 – 13 . OpenUrl CrossRef PubMed Web of Science ↵ Klales A , Duncan J , Nett EJ , Kane SA ( 2012 ) Biophysical model of prokaryotic diversity in geothermal hot springs . Phys Rev E Stat Nonlin Soft Matter Phys 85 ( 2 Pt 1 ): 021911 . OpenUrl PubMed Locey KJ and Lennon JT ( 2016 ) Scaling laws predicts global microbial diversity . Proc Natl Acad Sci U S A 113 ( 21 ): 5970 – 5 . OpenUrl Abstract / FREE Full Text ↵ Lozupone CA , Knight R ( 2007 ) Global patterns in bacterial diversity . Proc Natl Acad Sci U S A 104 ( 27 ): 11436 – 11440 . OpenUrl Abstract / FREE Full Text ↵ MacArthur RH , Wilson EO ( 1967 ) The Theory of Island Biogeography . Princeton, New Jersey : Princeton University Press . ↵ Marquet PA , Allen AP , Brown JH , Dunne JA , Enquist BJ , Gillooly JF , et al. ( 2014 ) On theory in ecology . BioScience 64 : 701 – 710 . OpenUrl CrossRef Web of Science ↵ Martin M ( 2011 ) Cutadapt removes adapter sequences from high-throughput sequencing reads . EMBnet J 17 ( 1 ): 10 – 12 . OpenUrl CrossRef ↵ Menzel P , Gudbergsdóttir SR , Rike AG , Lin L , Zhang Q , Contursi P , Moracci M , Kristjansson JK , Bolduc B , Gavrilov S , Ravin N , Mardanov A , Bonch-Osmolovskaya E , Young M , Krogh A , Peng X ( 2015 ) Comparative metagenomics of eight geographically remote terrestrial hot springs . Microb Ecol 70 ( 2 ): 411 – 24 . OpenUrl CrossRef PubMed ↵ Michaelis L ( 1922 ) Die wasserstoffionenkonzentration . Berlin, Germany : Springer . ↵ Miller SR , Strong AL , Jones KL , Ungerer MC ( 2009 ) Bar-coded pyrosequencing reveals shared bacterial community properties along the temperature gradients of two alkaline hot springs in Yellowstone National Park . Appl Environ Microbiol 75 ( 13 ): 4565 – 72 . OpenUrl Abstract / FREE Full Text Mouillot D , Villéger S , Parravicini V , Kulbicki M , Arias-González JE , Bender M et al. 2014 . Functional over-redundancy and high functional vulnerability in global fish faunas on tropical reefs . Proc Natl Acad Sci U S A 111 ( 38 ): 13757 – 62 . OpenUrl Abstract / FREE Full Text Levin SA Naeem S ( 2001 ) Complexity versus diversity . Encyclopedia of Biodiversity: San Diego, California , eds Levin SA ( Academic Press ), pp 831 – 843 . ↵ O’Gorman EJ , Benstead JP , Cross WF , Friberg N , Hood JM , Johnson PW , Sigurdsson BD , Woodward G ( 2014 ) Climate change and geothermal ecosystems: natural laboratories, sentinel systems, and future refugia . Glob Chang Biol 20 ( 11 ): 3291 – 9 . OpenUrl PubMed Okie JG , Van Horn DJ , Storch D , Barrett JE , Gooseff MN , Kopsova L ( 2015 ) Niche and metabolic principles explain patterns of diversity and distribution: theory and a case study with soil bacterial communities . Proc Biol Sci 282 ( 1809 ): 20142630 . OpenUrl CrossRef PubMed ↵ Ou M , Hamilton TJ , Eom J , Lyall EM , Gallup J , Jiang A , Lee J , Close DA , Yun SS & Brauner CJ ( 2015 ) Responses of pink salmon to CO2-induced aquatic acidification . Nat Clim Change 5 : 950 – 955 . OpenUrl Overbeek R , Begley T , Butler RM , Choudhuri JV , Chuang HY , Cohoon M , de Crecy-Lagard V , Diaz N , Disz T , Edwards R , et al. ( 2005 ) The subsystems approach to genome annotation and its use in the project to annotate 1000 genomes . Nucleic Acids Res 33 : 5691 – 5702 . OpenUrl CrossRef PubMed Web of Science Overbeek R , Olson R , Pusch GD , Olsen GJ , Davis JJ , Disz T , et al. ( 2014 ) The SEED and the Rapid Annotation of microbial genomes using Subsystems Technology (RAST) . Nucleic Acids Res D206 – D214 . ↵ Pentecost A ( 2005 ) Hot springs, thermal springs and warm springs . What’s the difference? Geology Today 21 : 222 – 224 . OpenUrl ↵ Pentecost A , Jones B , Renaut RW ( 2003 ) What is a hot spring? Can. J. Earth Sci 40 ( 11 ): 1443 – 6 . OpenUrl Abstract / FREE Full Text ↵ Powell S , Szklarczyk D , Trachana K , Roth A , Kuhn M , Muller J , et al. ( 2012 ) eggNOG v3.0: orthologous groups covering 1133 organisms at 41 different taxonomic ranges . Nucleic Acids Res . 40 ( Database issue ): D284 – 9 . OpenUrl CrossRef PubMed Web of Science ↵ Power JF , Carere CR , Lee CK , Wakerley GLJ , Evans DW , Button M et al. ( 2018 ) Microbial biogeography of 925 geothermal springs in New Zealanda . Nat. Commun . 9 : 2876 . OpenUrl CrossRef PubMed ↵ Rektorschek M , Weeks D , Sachs G , Melchers K ( 1998 ) Influence of pH on metabolism and urease activity of Helicobacter pylori . Gastroenterology 115 ( 3 ): 628 – 41 . OpenUrl CrossRef PubMed Web of Science R Core Team ( 2012 ). R: A language and environment for statistical computing . R Foundation for Statistical Computing , Vienna, Austria . ISBN 3-900051-07-0 , URL http://www.R-project.org/ ↵ Sharp CE , Brady AL , Sharp GH , Grasby SE , Stott MB , Dunfield PF ( 2014 ) Humboldt’s spa: microbial diversity is controlled by temperature in geothermal environments . ISME J 8 ( 6 ): 1166 – 74 . OpenUrl CrossRef GeoRef PubMed ↵ Sims D , Sudbery I , Ilott NE , Heger A , Ponting CP ( 2014 ) Sequencing depth and coverage: key considerations in genomic analyses . Nat Rev Genet 15 ( 2 ): 121 – 32 . OpenUrl CrossRef PubMed ↵ Sunagawa S , Coelho LP , Chaffron S , Kultima JR , Labadie K , Salazar G ( 2015 ) Structure and function of the global ocean microbiome . Science 348 ( 6237 ): 1261359 . OpenUrl Abstract / FREE Full Text Thébault E , Fontaine C ( 2010 ) Stability of ecological communities and the architecture of mutualistic and trophic networks . Science 329 ( 5993 ): 853 – 6 . OpenUrl Abstract / FREE Full Text ↵ Thébault E , Loreau M ( 2003 ) Food-web constraints on biodiversity–ecosystem functioning relationships Proc Natl Acad Sci U S A 100 ( 25 ): 14949 – 54 . OpenUrl Abstract / FREE Full Text Tilman D ( 1999 ) The ecological consequences of changes in biodiversity: a search for general principles . Ecology 80 ( 5 ): 1455 – 1474 . OpenUrl CrossRef Web of Science ↵ Tobler DJ , Benning LG ( 2011 ) Bacterial diversity in five Icelandic geothermal waters: temperature and sinter growth rate effects . Extremophiles 15 ( 4 ): 473 – 85 . OpenUrl CrossRef PubMed ↵ Valverde A , Tuffin M , Cowan DA ( 2014 ) Biogeography of bacterial communities in hot springs: A focus on the actinobacteria . Extremophiles 16 : 669 – 679 . OpenUrl ↵ Vellend M ( 2003 ) Island biogeography of genes and species . Am Nat 162 ( 3 ): 358 – 65 . OpenUrl CrossRef PubMed Web of Science ↵ Wang S , Dong H , Hou W , Jiang H , Huang Q , Briggs BR , Huang L ( 2014 ) Greater temporal changes of sediment microbial community than its waterborne counterpart in Tengchong hot springs, Yunnan Province, China . Sci Rep 4 : 7479 . OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted August 05, 2025. Download PDF Supplementary Material Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Global patterns of taxonomic and functional diversity in hot springs microbiomes Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Global patterns of taxonomic and functional diversity in hot springs microbiomes José Ignacio Arroyo , Beatriz Díez , Pablo A. Marquet bioRxiv 2025.08.04.668570; doi: https://doi.org/10.1101/2025.08.04.668570 Share This Article: Copy Citation Tools Global patterns of taxonomic and functional diversity in hot springs microbiomes José Ignacio Arroyo , Beatriz Díez , Pablo A. Marquet bioRxiv 2025.08.04.668570; doi: https://doi.org/10.1101/2025.08.04.668570 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Ecology Subject Areas All Articles Animal Behavior and Cognition (7641) Biochemistry (17707) Bioengineering (13904) Bioinformatics (41988) Biophysics (21466) Cancer Biology (18615) Cell Biology (25530) Clinical Trials (138) Developmental Biology (13387) Ecology (19921) Epidemiology (2067) Evolutionary Biology (24335) Genetics (15615) Genomics (22521) Immunology (17748) Microbiology (40424) Molecular Biology (17194) Neuroscience (88665) Paleontology (667) Pathology (2839) Pharmacology and Toxicology (4827) Physiology (7650) Plant Biology (15160) Scientific Communication and Education (2046) Synthetic Biology (4302) Systems Biology (9826) Zoology (2271)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00