Caliditerrarchaeota, a new sister to Nanohaloarchaeota, provides insights into the evolution of DPANN halophily

doi:10.1101/2025.08.05.668663

Caliditerrarchaeota, a new sister to Nanohaloarchaeota, provides insights into the evolution of DPANN halophily

2025 · doi:10.1101/2025.08.05.668663

preprint OA: closed

📄 Open PDF Full text JSON View at publisher

Full text 73,249 characters · extracted from preprint-html · click to expand

Caliditerrarchaeota, a new sister to Nanohaloarchaeota, provides insights into the evolution of DPANN halophily | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var 
i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Caliditerrarchaeota, a new sister to Nanohaloarchaeota, provides insights into the evolution of DPANN halophily View ORCID Profile Joshua N. Hamm , View ORCID Profile Nina Dombrowski , Luis E. Valentin-Alvarado , View ORCID Profile Chris Greening , Tom A. Williams , View ORCID Profile Anja Spang doi: https://doi.org/10.1101/2025.08.05.668663 Joshua N. Hamm 1 Royal Netherlands Institute for Sea Research, Department of Marine Microbiology and Biogeochemistry , P.O. 
Box 59, NL-1790 AB Den Burg, The Netherlands Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Joshua N. Hamm For correspondence: anja.spang{at}nioz.nl josh.n.hamm{at}gmail.com Nina Dombrowski 2 Institute for Biodiversity and Ecosystem Dynamics (IBED), University of Amsterdam , Amsterdam, The Netherlands Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Nina Dombrowski Luis E. Valentin-Alvarado 3 Department of Biochemistry and Molecular Biology, Biomedicine Discovery Institute, Monash University , Clayton 3800, Australia Find this author on Google Scholar Find this author on PubMed Search for this author on this site Chris Greening 4 Department of Microbiology, Biomedicine Discovery Institute, Monash University , Clayton, VIC, Australia 5 Securing Antarctica’s Environmental Future, Monash University , Clayton, Victoria, Australia Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Chris Greening Tom A. Williams 6 Department of Life Sciences, University of Bath , BA2 7AX, Bath, UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site Anja Spang 1 Royal Netherlands Institute for Sea Research, Department of Marine Microbiology and Biogeochemistry , P.O. Box 59, NL-1790 AB Den Burg, The Netherlands 7 Department of Evolutionary & Population Biology, Institute for Biodiversity and Ecosystem Dynamics (IBED), University of Amsterdam , Amsterdam, The Netherlands Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Anja Spang For correspondence: anja.spang{at}nioz.nl josh.n.hamm{at}gmail.com Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract The Nanohaloarchaeota are a clade of halophilic symbionts with small cells and genomes. 
Originally placed within the Euryarchaeota, they are now widely thought to belong to the DPANN archaea. However, the evolution of this clade and its phylogenetic placement within DPANN remain poorly understood. We applied phylogenetic and comparative genomic analyses to assess the evolutionary relationship and genome evolution of the Nanohaloarchaeota and related DPANN lineages. Our phylogenetic analyses resolve Nanohaloarchaeota as a sister group to a phylum-level lineage referred to as EX4484-52, together forming a clade with Aenigmatarchaeota. Representatives of EX4484-52, for which we propose the name Caliditerrarchaeota, have an anaerobic, thermophilic lifestyle but do not appear to be adapted to high salt concentrations. Using gene tree-species tree reconciliations, we investigated the origin of halophily across these archaeal lineages revealing that adaptations to high-salt appear to have evolved on the branch to Nanohaloarchaeota after their divergence from Aenigmatarchaeota and Caliditerrarchaeota. In agreement with recent work, we also identify hallmarks of halophily in another order-level lineage within the Aenigmatarchaeota (Haloaenigmatarchaeaceae) which appears to represent a second independent adaptation of a DPANN clade to halophily. The two halophilic DPANN lineages are inferred to have distinct sets of proteins that enable them to live in environments with high salt levels. Notably, phylogenetic analyses reveal a dominant signal of gene transfers between Haloaenigmatarchaeaceae and Halarchaeoplasmatales, indicating a potential host-symbiont relationship. This work provides the first detailed investigation of the enigmatic Caliditerrarchaeota, and new insights into the evolution of halophilic lifestyles within DPANN. Introduction The DPANN archaea, named after the first representatives of this group [ 1 – 5 ], comprise at least 10 phylum-level lineages (out of 21 archaeal phyla in total) [ 6 ]. 
Yet only 3 DPANN phyla have cultivated representatives, i.e. the Nanoarchaeota [ 7 – 10 ], Nanohaloarchaeota [ 11 – 13 ] and Micrarchaeota [ 14 , 15 ]. Currently, the lifestyles of most groups are poorly understood. It has recently been suggested that the DPANN form at least two distinct major groups: Cluster 1, which includes the Altiarchaeota, Iainarchaeota, and Micrarchaeota, and Cluster 2, including Nanohaloarchaeota, Nanoarchaeota, Aenigmatarchaeota, EX4484-52, SpSt-1190, and Undinarchaeota [ 4 , 6 , 16 ]. Distributed across the biosphere, Cluster 2 DPANN are generally characterised by reduced genomes and small cells, and are predicted to rely upon host organisms [ 3 ]. For instance, cultivated representatives of the Nanoarchaeota [ 7 – 10 ] and Nanohaloarchaeota [ 11 – 13 ] depend on archaeal host cells - i.e. members of the Sulfolobales and Halobacteriales , respectively - for growth and survival. Until recently, the Nanohaloarchaeota were the only known DPANN lineage adapted to extreme salt conditions [ 17 ]. However, the recently-discovered Haloaenigmatarchaeaceae (within phylum Aenigmatarchaeota) are a second DPANN lineage that seems to have independently evolved a halophilic lifestyle [ 18 ]. Similar to other halophilic archaea, the Nanohaloarchaeota and Haloaenigmatarchaeaceae appear to employ a salt-in strategy in which high intracellular salt concentrations are tolerated via greater use of acidic amino acids in proteins, leading to a shift in proteome-wide amino acid composition [ 18 – 23 ]. Of particular importance are transporters involved in uptake of K⁺ (such as the Kef-type transporter), and exporters of Na⁺ (such as the Na⁺/H⁺ antiporter), which maintain osmotic balance through selective import of K⁺ and export of Na⁺ [ 24 ]. Since its discovery, the phylogenetic placement of the Nanohaloarchaeota phylum has been a subject of debate. 
Initial data supported a sister relationship with the Halobacteriales [ 20 ] or Methanocellales [ 25 ], whereas others recovered a sisterhood with other DPANN [ 5 ]. An increasing amount of work based on concatenated single-copy marker gene phylogenies implementing more realistic models of evolution has provided growing evidence that Nanohaloarchaeota indeed belong to the DPANN archaea [ 2 , 4 , 22 , 26 – 28 ]. The monophyletic clustering of nanohaloarchaeal and haloarchaeal proteins in single protein phylogenies is likely a result of protein compositional biases as a response to high salt-adaptation and increased rates of horizontal gene transfer (HGT) between these halophilic symbionts and their hosts [ 4 , 22 , 29 ]. Despite a better understanding of the phylogenetic placement of the Nanohaloarchaeota, a major limitation in assessing the evolution of halophily in Nanohaloarchaeota was the absence of closely related sister lineages with which to compare lifestyles and genetic content. Recently, the Asbonarchaeaceae were reported to be a deep branching, halophilic sister lineage to the Nanosalinaceae within the Nanohaloarchaeota phylum found in polyextreme environments [ 22 ]. Yet, the origin and nature of adaptations to a halophilic lifestyle in the Nanohaloarchaeota and their relationship with non-halophilic DPANN cluster 2 lineages, especially the Aenigmatarchaeota [ 5 , 30 ] and EX4484-52 phylum [ 31 – 33 ], remain to be elucidated. Gene tree-species tree reconciliation methods for ancestral genome reconstruction have been applied to the Nanohaloarchaeota previously but have focused on internal nodes within the nanohaloarchaeal lineage, leaving the transition from non-halophile to halophile unexplored [ 34 , 35 ]. 
Here, we used phylogenetics, comparative genomics, and gene tree-species tree reconciliation [ 36 , 37 ] to place the Nanohaloarchaeota within DPANN cluster 2 archaea, characterise their closest sister lineage EX4484-52, for which we propose the name Caliditerrarchaeota, and reconstruct the genome evolution of DPANN cluster 2 lineages to assess genomic signatures associated with the adaptation to a halophilic lifestyle. Our work identifies the Caliditerrarchaeota as primarily non-halophilic terrestrial thermophiles, and highlights DNA repair and potassium transport as likely key to halophily in DPANN. Increased rates of horizontal gene transfer between Haloaenigmatarchaeaceae and the Halarchaeoplasmatales point to a putative symbiont-host relationship between members of these clades. Methods Generation of dataset for phylogenetic and genomic analyses To investigate the placement of halophilic lineages a previously established representative set of 607 archaeal genomes was used as a backbone [ 4 ]. To this, 44 publicly available genomes associated with the Nanohaloarchaeota-Aenigmatarchaeota clade, Hikarchaeota, and Thermoplasmatales were added (Supplementary Table 1) resulting in a final dataset of 651 genomes. Selection of phylogenetic marker genes for species tree reconstruction To generate a reliable species tree and accurately place ACN lineages for downstream analyses, we applied a phylogenetic approach similar to Dombrowski et al. 2020 [ 4 ] to identify suitable marker genes from a set of 151 possible markers (Supplementary Table 12). HMM profiles specific to the marker genes were used to identify homologs in the 651 genomes using a custom script (Selection_of_Phylogenetic_Markers/Selecting_best_markers_151set.sh [ 38 ]) that incorporates the hmmsearch [ 39 ] algorithm from the HMMER v3.1b2 package. 
To reduce the possibility of distant paralogs being extracted during this process the set of HMM profiles used as query was expanded to include the entire TIGRFAM[ 40 ] database (4,528 profiles total). Subsequently, homologs to each of the 151 marker genes were parsed from the output based on best hit evaluated by e-value and bit-score and extracted from their respective genomes. Single gene alignments were performed for all 151 marker genes using MAFFT L-INS-i v7.407 [ 41 ] (settings:reorder) and trimmed using BMGE-1.12 [ 42 ] (settings:-tAA -m BLOSUM30 -h 0.55). Phylogenies were inferred for all genes using IQ-tree v2.1.2 [ 43 ] (settings: -m LG+G -bb 1000 -wbtl -bnni). Single gene phylogenies were assessed using a custom python script to rank markers based on their capacity to resolve established monophyletic taxa as previously described [ 4 ]. Reliability of markers was scored according to the number of total splits (total number of taxa placing outside the expected taxonomic member clade) as well as the number of splits normalised to species count within a specific clade. Marker genes in which Archaea were previously found to not be monophyletic [ 4 ] were removed. Split counts were used to rank the marker genes and concatenated alignments of the 25% and 50% top and lowest ranked genes were generated (Supplementary Table 12). Species tree reconstruction Sequences on long branches were flagged and removed using a custom python script Selection_of_Phylogenetic_Markers/cut_gene_tree_v2.py [ 38 ] applied to trees generated for marker gene reliability assessment. Following long branch removal, remaining sequences were re-aligned and trimmed using MAFFT L-INS-i v7.407 [ 41 ] and BMGE-1.12 [ 42 ] as described above. Marker gene sets were concatenated using catfasta2phyml.pl ( https://github.com/nylander/catfasta2phyml ). To assess placement of halophilic lineages as well as the putative sister clade of the Nanohaloarchaeota (i.e. 
the Caliditerrarchaeota) multiple concatenated trees were generated: Phylogenies using marker gene subsets: All four subsets of marker genes (top 25 and 50% and lowest 25 and 50%). Alignments were concatenated using catfasta2phyml.pl ( https://github.com/nylander/catfasta2phyml ) and trees generated using IQ-tree [ 43 ] (v2.1.2, settings: -m LG+C60+F+R -nt AUTO -bb 1000 -alrt 1000). Removal of compositionally heterogeneous sites: Concatenated alignments of the top 25 and 50% best marker genes were aligned with MAFFT L-INS-i v7.407 [ 41 ] and trimmed with BMGE-1.12 [ 42 ] as above. Alignments were then subjected to compositional site filtering using a custom perl script ( https://github.com/novigit/davinciCode/blob/master/perl/alignment_pruner.pl ) [ 44 ] in a stepwise manner to remove the 10, 30, and 50% most compositionally heterogeneous sites. Trees were reconstructed for all three conditions of the two marker subsets using IQ-tree [ 43 ] (v2.1.2, settings: -m LG+C60+F+R -nt AUTO -bb 1000 -alrt 1000). Removal of fast-evolving sites: SlowFaster v1 [ 45 ] was used to remove fast evolving sites from the top 25 and 50% best marker gene alignments. Sites were filtered in a stepwise manner to remove the 10, 30, and 50% fastest evolving sites. Trees were reconstructed for all three conditions of the two marker subsets using IQ-tree [ 43 ] (v2.1.2, settings: -m LG+C60+F+R -nt AUTO -bb 1000 -alrt 1000). Annotation of genomes All genomes included in the reference dataset (651) were annotated using our annotation pipeline to ensure consistency of annotations Annotation_Tables/1_Input/Annotations.txt [ 38 ]. Coding sequences were predicted using Prokka v1.14 [ 46 ] (settings: --kingdom Archaea --addgenes --force --increment 10 --compliant --centre UU --cpus 20 --norrna --notrna). 
For functional annotation of proteins several additional databases were used including COGs [ 47 ] (downloaded October 2020), arCOGs [ 48 ] (2014 version), KO profiles from the KEGG Automated Annotation Server [ 49 ] (downloaded April 2021), the Pfam database [ 50 ] (release 34.0), the TIGRFAM database [ 40 ] (release 15.0), the Carbohydrate-Active enZymes (CAZy) database [ 51 ] (v7, downloaded August 2020), the Transporter Classification Database [ 52 ] (downloaded April 2021), the Hydrogenase database [ 53 ] (HydDB, downloaded July 2020), and NCBI_nr (downloaded Aug 2021). In addition to this, protein domain predictions were carried out using InterProScan [ 54 ] (v5.62-94.0, setting: --iprlookup --goterms). Annotations for the respective databases were carried out as follows. COGs, arCOGs, KOs, PFAMs, TIGRFAMs, and CAZymes were all identified using hmmsearch v3.1b2 [ 39 ] (settings: -E 1e-5). The Transporter Classification Database and Hydrogenase Database were queried using BLASTp v2.7.1 [ 55 ] (settings: -evalue 1e-20). For database searches the best hit was selected based on the lowest e-value and highest bit-score and summarised for Caliditerrarchaeota in Supplementary Table 3 and for the full set in Annotation_Tables/1_Input/Annotations.txt [ 38 ]. Multiple hits were allowed for InterProScan domain annotations using a custom script for parsing results Annotation_Tables/parse_IPRdomains_vs2_GO_2.py [ 38 ]. Best blast hits against the NCBI_nr database were identified using DIAMOND v0.9.22.123 [ 56 ] (settings: blastp --more-sensitive --evalue 1e-5 --no-self-hits). CRISPR systems were identified in Caliditerrarchaeota genomes using the CRISPRCasTyper v1.8.0 tool [ 57 ]. Caliditerrarchaeota genomes were taxonomically classified using GTDB-Tk (setting: --skip_ani_screen)[ 58 ]. 
Analysis of NADH- [NiFe]- and [FeFe]-hydrogenases To confirm annotation of putative hydrogenase subunits predicted catalytic subunits from Caliditerrarchaeota genomes were identified and aligned to reference sets of previously published NiFe and FeFe hydrogenase catalytic subunits [ 59 , 60 ] using MAFFT-LINSI v7.407 (settings: reorder). Alignments were trimmed using BMGE-1.12 (settings:-tAA -m BLOSUM30 -h 0.55) and manually screened for presence of conserved active sites in putative Caliditerrarchaeota hydrogenases. Caliditerrarchaeota sequences missing conserved active site residues were removed from the dataset and remaining sequences were realigned with MAFFT-LINSI v7.407 (settings: reorder) and trimmed with BMGE-1.12 (settings:-tAA -m BLOSUM30 -h 0.55). Phylogenetic trees were inferred using IQTree v2.1.2 (settings: -m LG+C20+F+R -nt AUTO -ntmax 25 -bb 1000 -alrt 1000). Comparative genomics Output from the annotation pipeline was used for comparative genomics. Most genomes were clustered into class-level lineages, whilst DPANN and most uncultivated taxa were defined at the level of phylum. Presence/absence patterns of proteins encoded by these clades were determined using a custom R script Annotation_Tables/Count_Tables.r [ 38 ]. Briefly, the number of occurrences of each gene in every genome in the dataset was tallied and used to generate summary tables using the ddply function within the plyr (v1.8.8) package. Heatmaps were then plotted by converting the summary tables into presence/absence matrices followed by application of the ddply function to summarize counts across the different phylogenetic clusters. Data was then visualized as a heatmap using ggplot2 (v3.4.2). Genome reconstruction for Supplementary Figure 21 was carried out manually using KEGG annotations. 
Genes were classified as present (found in more than 50% of genomes, indicated with filled in circle), partially present (found in 0 - 50% of genomes, indicated with half-filled circle), or absent (missing from all genomes) for Supplementary Figure 21. Amino acid frequency analysis To investigate signatures of halophily across our reference set of genomes, amino acid frequencies were calculated using a custom R script Amino_Acid_Analysis/AA_Freq_analysis.R [ 38 ]. Briefly, predicted protein sequences from each genome were concatenated and the frequency of each amino acid (i.e. number of its occurrence) was calculated and divided by the total length of the concatenated sequence. Principal components analysis was carried out using prcomp from the stats package (v4.4.0) on a matrix of calculated amino acid frequencies per individual genome across the entire dataset. Statistical significance of amino acid frequency variation between lineages within the reduced dataset was calculated using one-way ANOVA tests from the stats package (v4.4.0) with a Games-Howell Post-hoc evaluation of significance from the rstatix (v0.7.2) package. P-values were used to generate groups with letter designations to simplify representation with multcompview (v0.1-9). Acidity of predicted protein sequences was calculated using the peptides package (v2.4.5) isoelectric point command applied on a protein-by-protein basis to each genome. Calculated pI values were then plotted in density plots on a genome-by-genome basis. Gene tree-species tree reconciliation Gene tree-species tree reconciliation analyses were performed using ALE v1.0 [ 36 , 37 ], ALE/ALE_arCOGs_final.md [ 38 ]. Protein clusters were generated using arCOG annotations produced using hmmsearch as described above (section Genome Annotation). 
To account for gene fusion of arCOGs in some taxa, proteins with more than 50 aa remaining after removal of the sequence part assigned to an arCOG were screened for secondary arCOG annotations and split up, with this procedure being repeated up to four times. Clusters were then cleaned by removing sequences containing Xs prior to alignment. Clusters with 1000 sequences or less were aligned using MAFFT L-INS-I v7.407 (settings: reorder) whilst those with more than 1000 sequences were aligned with MAFFT E-INS-I v7.407 (settings: reorder). All alignments were trimmed using BMGE-1.12 (settings:-tAA -m BLOSUM30 -h 0.55). Clusters with three or fewer sequences were removed from further analysis. To evaluate gene clusters, initial trees were inferred from trimmed alignments using FastTree v2.1.11 (settings: -lg -gamma) and KEGG annotations mapped to sequences in the tree. A custom script ALE/Split_Count_v2.py [ 38 ] was used to screen these phylogenies for long branches and the monophyly of KEGG annotations within trees. Long branches were defined as branches that have lengths greater than 5 times the interquartile range for the tree in which they were found, and corresponding sequences were flagged for removal. Instances where multiple KEGG annotations were assigned to one arCOG cluster were flagged for splitting if more than 10% of sequences in the tree were annotated with the relevant KEGG number and all of these were monophyletic. A total of 424/9481 (4.5%) of clusters were identified as potential candidates for splitting which were then manually reviewed resulting in 74 clusters (0.8%) being split for a total of 9555 individual clusters. Following long branch removal and splitting of clusters, retained sequences were realigned with either MAFFT L-INS-I v7.407(less than or equal to 1000 sequences) or MAFFT E-INS-I v7.407(>1000 sequences) and trimmed with BMGE-1.12 as described above. 
Once final alignments were produced guide trees were inferred (settings: -m LG+G+F --score-diff all -nt 1 -wbtl -B 1000 -bnni) and model tests carried out (settings: -m MF -mset LG -madd LG+C10,LG+C10+G,LG+C10+R,LG+C10+F,LG+C10+R+F,LG+C10+G+F,LG+C20,LG+C20+G,LG+C20+F,LG+C20+G+F,LG+C20+R,LG+C20+R+F --score-diff all -T 1) using IQTree v2.1.2. Model test results were summarised and alignments were distributed into two categories: category one comprised alignments where the best fitting model was a C-series model. For computational feasibility, trees for category 1 alignments were inferred using the rapid PMSF method, which approximates full profile mixture models [ 61 ]. Non-mixture models were chosen as best model in category 2 alignments, for which trees could be inferred without PMSF. Trees were inferred for all alignments using IQTree v2.1.2 (settings: -T 1 -wbtl -B 1000 -pers 0.2 -nstop 500) and for category 1 alignments the additional command to run using a PMSF model (-ft Phylogenies/single/iqtree_lg_guide/{1}.treefile). Following inference of single gene trees, ALE reconciliation was performed for all 9555 arCOG clusters against the species tree inferred using the 50% best marker genes described above. The species tree was rooted between the DPANN and all other archaea for reconciliations, based on previous analyses [ 4 , 62 ]. A first round of reconciliations was performed using ALEml_undated v1.0 15 for each gene family including CheckM2 v0.1.3 estimates of genome completeness to correct for incomplete genomes using the fraction_missing flag. In order to carry out ancestral genome reconstructions, the probability that gene families originate at the root of the species tree was optimised for each arCOG category by maximum likelihood using a python script ALE/setup_OR_estimation.py [ 38 ] and summary statistics extracted using another python script ALE/parse_or.py [ 38 ] for each arCOG. 
This origination model implies that the prior probability of gene family origination is the optimised value, OR, at the root, and (1-OR) divided by the number of non-root nodes elsewhere. Following optimisation of root origination rate, a second run of ALE was performed with ALEml_undated v1.0 including the maximum likelihood origination rate as a correcting factor with the flag O_R and completeness scores with the flag fraction_missing as above. Inferred gene statistics were parsed using a custom python script (ale_parser.py). Data was filtered for nodes of interest using another custom python script (Ale_summary.py) and genome reconstruction carried out manually. arCOGs were classified as likely present (PP >= 0.8, filled in circle), possibly present (0.8 > PP >= 0.5, half-filled circle), or likely absent (PP < 0.5, empty circle) for genome reconstructions. Sisterhood Analysis To investigate occurrences of sisterhood relationships between archaeal taxa, single gene trees produced for ALE analyses were processed using a custom python script HGT_Analysis/Tree_Analyser.py [ 38 ]. Briefly, GTDB taxonomy was mapped to leaves in the trees and for all Order and Family level lineages the relative frequency of sisterhood was calculated per tree. To calculate relative frequency of sisterhood each instance of the target lineage in the tree was identified and progressive searches conducted of nodes upstream until a member of a different lineage was found. Maximum branch length (3) and minimum branch support (0.7) cutoffs were applied and sisterhood frequencies were not calculated for trees in which length or support values fell outside these cutoffs. Once a sister clade was identified the relative frequency of different lineages within the sister clade was calculated per tree. Following this the relative frequencies across all trees for each lineage were summed together. Plots were then produced using a custom R script HGT_Analysis/Sisterhood_Analyses.R [ 38 ]. 
Results and discussion Caliditerrarchaeota form a thermophilic, non-halophilic sister phylum of the Nanohaloarchaeota To assess the phylogenetic relationships among DPANN cluster 2 lineages, we built upon a previously established approach [ 4 ] to identify a set of universal single copy marker genes least affected by HGT (25% and 50% top ranked markers). All concatenated phylogenies resolved a monophyletic clade within the DPANN consisting of Nanohaloarchaeota, Aenigmatarchaeota, and Caliditerrarchaeota (see Classification of Caliditerrarchaeota) ( Figure 1 , Supplementary Figures 1 - 4). Caliditerrarchaeota were recovered as the sister lineage of the Nanohaloarchaeota in phylogenies inferred using the 25 and 50% top marker genes (100/100 and 99.8/100 SH-like aLRT/ultrafast bootstrap support, respectively) ( Figure 1 , Supplementary Figures 1 and 2). Their placement sister to both Nanohaloarchaeota and the Aenigmatarchaeota lineage PWEA01 (recently proposed as Haloaenigmatarchaeaceae [ 18 ]) (26/69 and 89.2/95 SH-like aLRT/ultrafast bootstrap support respectively) in phylogenies using the 25 and 50% worst markers (Supplementary Figures 3 and 4) is likely an artifact of incongruent markers. Together, this suggests that the Nanohaloarchaeota and Caliditerrarchaeota branch with the Aenigmatarchaeota, consistent with previous analyses [ 18 ], and form a clade which we here refer to as ACN (for Aenigmatarchaeota, Caliditerrarchaeota and Nanohaloarchaeota). Download figure Open in new tab Figure 1 Phylogenetic tree showing placement of Caliditerrarchaeota based on a concatenated alignment of 50% top ranked marker genes and the 651 species set. The alignment was trimmed with BMGE (Alignment length = 12,397 aa). A Maximum Likelihood (ML) phylogenetic tree was inferred using IQ-Tree with the LG+C60+F+R model and ultrafast bootstrap approximation (left) and SH-like approximate likelihood tests (right), each run with 1000 replicates. 
The tree has been artificially rooted between DPANN and other Archaea. The full uncollapsed version of the tree is provided as Supplementary Figure 1. Scale bar: Average number of substitutions per site. Removal of the 10, 30, or 50% fastest evolving [ 63 ] (Supplementary Figures 5 - 10) or compositionally biased [ 64 ] (Supplementary Figures 11 - 16) sites had little to no impact on the placement of the Caliditerrarchaeota in either of the top 25 or 50% marker gene phylogenies. Likewise, addition of genomes from the recently described Asbonarchaeaceae lineage [ 22 ] (a sister lineage to the Nanosalinaceae within the Nanohaloarchaeota) further supported the sister relationship of Caliditerrarchaeota and Nanohaloarchaeota (Supplementary Figs 17 - 20). Caliditerrarchaeota are putative non-halophilic symbionts To provide insights into the metabolism and salt adaptation of Caliditerrarchaeota, we analysed 11 publicly available MAGs (genome completeness and contamination ranging from 64 – 91% and 0 – 2.19%, respectively) (Supplementary Tables 1 and 2) derived from hydrothermal vent [ 32 ] and deposit [ 63 ], methane seep, and radioactive site metagenomes [ 64 ]. Only one previous study investigated Caliditerrarchaeota metabolism, concluding that they are fermentative symbionts with a higher than typical number of transporters compared to other DPANN based on a single MAG (GCA_902384675.1) [ 64 ]. Metabolic predictions revealed that the 11 representatives of the Caliditerrarchaeota have limited catabolic and anabolic potential similar to other DPANN archaea (Supplementary Table 5, Supplementary Figures 21 - 25, Supplementary Information). Specifically, while encoding a glycolytic pathway and enzymes for the degradation of complex carbohydrates, most representatives lack TCA cycle genes and genes for any of the known carbon fixation pathways of archaea [ 65 ]. 
Many biosynthetic pathways such as for amino acids, vitamins, purine and pyrimidine, and archaeal lipids are incomplete. However, similar to other DPANN, representatives encode the capacity for interconversion of nucleotides as well as ribose 1,5-bisphosphate isomerase (K18237, 8 MAGs) and ribulose bisphosphate carboxylase (RbcL; RuBisCo, K01601, 7 MAGs), which are hypothesized to function in the salvage of nucleosides [ 4 ]. However, all Caliditerrarchaeota do encode a complete A/V-type ATP synthase, and some representatives encode Group A [FeFe]-hydrogenases (2 MAGs), a group 3 [NiFe]-hydrogenase (2 MAGs), putative Group 4 [NiFe]-hydrogenase (3 MAGs) and a putative NADH-dehydrogenase (Supplementary Text, Supplementary Tables 3 and 6, Supplementary Figures 26 - 28). The presence of reverse gyrase homologs in all but one Caliditerrarchaeota MAG (GCA_902384675.1) is consistent with their distribution in high-temperature marine sediments. PCA analyses of amino acid frequencies, isoelectric point (pI) profiles and individual amino acid frequencies inferred for all representatives in our taxon set revealed that Caliditerrarchaeota are not extreme halophiles. Specifically, their proteomes clustered with non-halophilic Aenigmatarchaeota ( Figure 2a ) and isoelectric point (pI) profiles showed no signs of increased proteome acidity characteristic for halophilic Archaea ( Figure 2b ). Further, we did not observe statistically significant variation in individual amino acid frequencies for Caliditerrarchaeota except for tryptophan and proline ( Figure 2c , Supplementary Table 7). However, these analyses revealed a subclade within the Aenigmatarchaeota with hallmarks of adaptations to higher salt conditions ( Figure 2a ).
Isoelectric profiles of PWEA01 protein coding sequences also showed signs of a shift towards higher acidity in the proteome, and statistically significant variation in amino acid frequencies was observed for nine amino acids, including aspartate and glutamate, which are typically elevated in halophiles [ 19 , 66 ]. Other amino acids that significantly vary in frequency amongst Nanohaloarchaeota, such as cysteine and serine, do not differ in PWEA01. Overall, the amino acid profiles of the PWEA01 clade appear to occupy an intermediate position between Nanohaloarchaeota and other archaea in PCA plots. This indicates that members of this group are halophiles, which is in agreement with the recent discovery of PWEA01 representatives, now also referred to as Haloaenigmatarchaeaceae, in hypersaline brines from the Danakil Depression [ 18 ]. Download figure Open in new tab Figure 2 Amino acid composition of both ACN and known halophilic lineages. a) PCA showing distribution of genomes in the 651 genome dataset based on amino acid profile. b) Protein isoelectric point frequency plot of genomes in the 651 genome dataset. Plots show isoelectric points per genome with genomes colour-coded according to which lineage they are assigned to. Genomes assigned to lineages outside the ACN (Aenigmatarchaeota, Caliditerrarchaeota, and Nanohaloarchaeota) cluster or known halophiles are grouped into a single line for readability. c) Boxplot showing individual amino acid frequencies with statistical significance tests across the 651 genome dataset. For all plots ACN lineages and known halophiles are highlighted with colour whilst all other lineages are shown in grey. Letters above plots indicate statistically significant differences determined using one-way ANOVA test and a Games Howell Post-hoc evaluation of significance and then simplified with letter codes using multcompview.
The evolution of metabolic gene repertoires and halophilic lifestyles in the ACN clade To elucidate the evolutionary history of gene repertoires in the ACN clade and the adaptation to halophilic lifestyles in some member lineages, we next performed gene tree-species tree reconciliations using amalgamated likelihood estimation (ALE) [ 36 , 37 , 67 ]. We rooted our species tree between DPANN and the rest of the archaea in agreement with several recent publications [ 4 , 62 , 68 ]. Alternative root positions, such as within the former ‘Euryarchaeota’ [ 69 ] or between ‘Euryarchaeota and TACK/Asgard Archaea’ [ 27 , 70 ], are unlikely to significantly impact our results because the ACN lineage represents a derived clade relative to any of the proposed root positions. Ancestral genome content was inferred based on posterior probabilities (PP) of arCOG family presence in any node of interest (Supplementary Table 8). We considered gene families with PP values between 0.5-0.8 to have low support and greater than 0.8 to be of moderate support for having been present at the nodes examined. Reconstructed metabolic processes support an ancestral fermentative lifestyle for all last common ancestors examined; i.e. Aenigmatarchaeota (LCA-A), Caliditerrarchaeota (LCA-C), Nanohaloarchaeota (LCA-N), Caliditerrarchaeota-Nanohaloarchaeota (LCA-CN), Aenigmatarchaeota-Caliditerrarchaeota-Nanohaloarchaeota (LCA-ACN) with acetate as the likely end-product for all ancestors except for the Nanohaloarchaeota and Haloaenigmatarchaeaceae. Specifically, all ancestors were predicted to encode the majority of proteins for glycolysis but to lack respiratory complexes and various genes for TCA cycle enzymes ( Figure 3 , Supplementary Table 8).
Citrate synthase, either encoded by two (K22224 and K01905) or a single gene (K01647), is the only TCA cycle protein inferred to be potentially present in most ACN ancestors (LCA-A: PP=0.97/1/0.04; LCA-C: PP=0.85/1/0.07; LCA-N: PP=0.39/0.28/0.93; LCA-CN: PP=0.84/0.9/0.56; LCA-ACN: PP=0.95/1/0.45) and citrate may therefore represent an important intermediary in the central carbon metabolism in these archaea. Nanohaloarchaeota appear to have had an ancestral citrate synthase (K22224, K01905), replaced by an alternative version (K01647), with both types potentially present in the common ancestor of Nanohaloarchaeota and Caliditerrarchaeota. Given the absence of other TCA cycle genes and the potential reversibility of the reaction carried out by these enzymes it is possible that these DPANN are instead converting citrate into pyruvate enabling either ATP production via fermentation to acetate or carbon storage via gluconeogenesis as previously suggested for Nanohaloarchaeota [ 11 ]. The predicted presence of a putative tri-carboxylic acid importer capable of citrate import in all ancestors examined (arCOG04469: LCA-A: PP=1; LCA-C: PP=1; LCA-N: PP=0.98, LCA-CN: PP=1, LCA-ACN: PP=1, LCA-P: PP=1; LCA-PB: PP=1) could provide the means for uptake of exogenous citrate. Download figure Open in new tab Figure 3 Ancestral genome reconstruction for ACN cluster ancestors. Figure shows predicted presence/absence of major metabolic/symbiosis associated genes in various ACN lineage ancestors as predicted from ALE gene tree/species tree reconciliation. Half circles indicate a posterior probability for gene presence of ≥0.5 <0.8 and full circles indicate a posterior probability of ≥0.8. The data used to produce this figure is provided in Supplementary Table 7. 
All ancestors examined, with the exception of LCA-N, were inferred to have complete or near-complete phospholipid biosynthesis pathways allowing production of archaeol from acetyl-coA indicating their capability of synthesising membrane lipids ( Figure 3 , Supplementary Table 8). In contrast, the majority of quinone and carotenoid biosynthesis pathways were predicted to be absent from all ancestral genomes ( Figure 3 ). Absence of quinone synthesis pathways is unsurprising considering that most Cluster 2 DPANN are generally thought to lack respiratory complexes that require quinones. The analysed ancestors were also predicted to encode pili/archaellum subunits, although individual KOs and arCOGs showed differential distributions across the various lineages ( Figure 3 , Supplementary Table 8). Typically, ancestral proteomes comprise the scaffold proteins that are also identified in genomes of extant representatives, whilst the accessory proteins, including the pilins themselves, display a variable distribution ( Figure 3 ). Pilins may be involved in symbiont-host interactions [ 71 – 73 ] with specific pilins potentially allowing interaction with specific hosts. However, the low number of cultivated DPANN and known hosts currently limits experimental validation. A minimum of two S-layer proteins were predicted to be encoded by all ancestral genomes with all lineages except Haloaenigmatarchaeaceae predicted to share the same two arCOGs (arCOG02080: LCA-A: PP=0.91; LCA-C: PP=1; LCA-N: PP=1, LCA-CN: PP=1, LCA-ACN: PP=0.98, and arCOG03418: LCA-A: PP=1; LCA-C: PP=1; LCA-N: PP=0.93, LCA-CN: PP=1, LCA-ACN: PP=1). The Haloaenigmatarchaeaceae ancestor was instead predicted to encode an alternative S-layer protein, assigned to arCOG03256 (PP=1) rather than arCOG03418 (PP=0.35). 
Subunits of the sodium-hydrogen antiporter (arCOG03076, arCOG03079, arCOG03082, arCOG03099, arCOG03121, arCOG01537, arCOG01962), which is particularly important in regulating osmotic balance in extreme halophiles, were predicted to be present in all individual ancestors of the various ACN lineages but not in LCA-ACN, with LCA-A and LCA-CN predicted to encode different KOs (Supplementary Table 8). Absence of these genes from LCA-ACN may indicate that each lineage acquired their antiporter complexes via HGT. Consistent with this scenario, single gene trees resolved Nanohaloarchaeota sequences as either sister to or branching within halobacterial clades for all antiporter subunits whilst Aenigmatarchaeota and Caliditerrarchaeota sequences typically form monophyletic clades sister to Thermoplasmatota. However, it is also possible that the amino acid biases associated with adaptation to high salt conditions have caused artificial attraction of the nanohaloarchaeal and halobacterial sequences. LCA-N was predicted to encode at least four different redox regulation proteins including two glutaredoxins (arCOG02608: PP=0.94 and arCOG01297: PP=0.98), one peroxiredoxin (arCOG00314: PP=0.88) and a thioredoxin reductase (arCOG01296: PP=0.97) but not rubrerythrin. None of these protein families have high posterior probabilities for being present in the proteomes of any of the other ancestors, though there is moderate support for rubrerythrin in some of them (K19824: LCA-A: PP=0.55; LCA-C: PP=0.54; LCA-N: PP=0.11, LCA-CN: PP=0.50, LCA-ACN: PP=0.55, Figure 3 ). The absence of rubrerythrin from LCA-N is consistent with a transition into an oxic environment alongside their haloarchaeal hosts whilst the putative presence of it in some of the other lineages may indicate their adaptation to an anoxic environment.
LCA-N is the only DPANN ancestor predicted to encode both photolyase (arCOG02840: LCA-A: PP=0.04; LCA-C: PP=0.07; LCA-N: PP=0.99, LCA-CN: PP=0.49, LCA-ACN: PP=0.28) and RecB (arCOG00802: LCA-A: PP=0.12; LCA-C: PP=0.06; LCA-N: PP=0.99, LCA-CN: PP=0.47, LCA-ACN: PP=0.27) which both may play a role in DNA repair. This is particularly relevant as many hypersaline systems cause exposure to high UV-radiation [ 74 ] necessitating adaptation to UV-induced DNA damage. Finally, we analysed the ALE output to infer copy number change along branches of interest ( Figure 4 , Supplementary Table 9). While the Nanohaloarchaeota and Haloaenigmatarchaeaceae seem to have distinct protein families with multiple copies per proteome, the Kef K + transporter (arCOG01955) has the highest copy number increase along the branches leading to both lineages. The Kef-type potassium transporters play an important role in halophiles that use a salt-in strategy by facilitating the uptake of K + ions, allowing them to maintain osmotic balance whereas Na + and Mg 2+ ions are excluded from the cytoplasm [ 66 ]. Acquisition of multiple copies of the Kef-type transporter may have allowed members of both the Nanohaloarchaeota and Haloaenigmatarchaeaceae to adjust to hypersaline systems in the absence of additional protective measures (e.g. osmoprotectants such as glycine betaine) that are generally present in Halobacteriales [ 75 ]. Download figure Open in new tab Figure 4 Predicted gene copy number changes along branches of interest within the ACN cluster. Figure shows the 10 genes with the highest copy number increase and the 10 genes with the highest copy number decrease predicted from ALE gene tree/species tree reconciliations along branches of interest within the ACN cluster. Data used to produce this figure is provided in Supplementary Table 8. Who are the hosts of uncultivated representatives of the ACN lineages?
It has previously been shown that some DPANN archaea exchange genes more frequently with their hosts than with other taxa, such as Nanohaloarchaeota with Halobacteriales, Micrarchaeota and Parvarchaeota with Thermoplasmatales, Huberarchaeales with Altiarchaeales, and Nanoarchaeales with Sulfolobales [ 4 ]. To investigate potential hosts of the Caliditerrarchaeota and Haloaenigmatarchaeaceae lineages, we calculated the relative frequency of sisterhood relationships for all trees used in the ALE analysis at the level of Order and Family from the GTDB taxonomy ( Figure 5 , Supplementary Tables 10 and 11, Supplementary Figure 29). While we could not identify a clear signal for Caliditerrarchaeota, Haloaenigmatarchaeaceae representatives displayed an increased frequency of sisterhoods with PWKY01 (Halarchaeoplasmatales), suggesting that members of the PWKY01 may interact with or serve as hosts for some representatives of the Haloaenigmatarchaeaceae clade. Download figure Open in new tab Figure 5 Rate of sisterhood for GTDB order level lineages across 9,555 gene trees used for ALE analysis. Relative sisterhood frequencies were calculated per gene and summed for each taxonomic group. Related lineages have been clustered together using colours and specific lineages that show higher rates of sisterhood with DPANN lineages highlighted with unique colours. The data used to generate this plot is available in Supplementary Table 10. It is conspicuous that all DPANN symbiont-host partnerships with observable increase in sisterhood rates (except Huberarchaeales and Altiarchaeales) occur in extreme environments (hypersaline, acidic, and/or high-temperature). It seems possible that the selective pressures involved in adapting to these environments favour the acquisition of genes related to the specific extremophily from the host at rates higher than those seen in other DPANN symbiont-host partnerships from less extreme environments.
Consistent with this, several copies of the KefB Potassium-efflux system gene (the highest increase in copy number for both Nanohaloarchaeota and Haloaenigmatarchaeaceae) from DPANN halophile genomes placed as sister to their respective/putative hosts (Halobacteriales and PWKY01) in single gene trees (ALE/Treefiles [ 38 ]). Alternatively, given that extreme environments typically support less diverse microbial communities, symbiont-host gene transfers may be more easily detected from background HGT. Additionally, amino acid composition biases, such as those displayed by extreme halophiles and thermophiles, are known to cause compositional attraction artefacts in trees, particularly when limited signal is available as is the case for single gene trees. Thus, a fraction of sisterhood relationships between extremophilic DPANN and their putative hosts may be the result of erroneous gene trees rather than genuine gene transfer [ 4 , 22 ]. Finally, we note that the trees used for this analysis were limited to archaeal taxa only. However, many DPANN lineages occupy environments dominated by Bacteria and some representatives have been proposed to associate with bacterial hosts [ 4 , 63 , 76 , 77 ]. The absence of bacterial sequences from our trees, due to computational limitations of the gene tree-species tree reconciliation workflow, limits the confidence with which sisterhood relationships can be determined. Therefore, whilst our results suggest a possible relationship between the Haloaenigmatarchaeaceae and the Halarchaeoplasmatales, which remains to be confirmed experimentally, they do not allow us to identify hosts for DPANN that do not interact with other Archaea. Classification of Caliditerrarchaeota Classification of the Caliditerrarchaeota genomes with GTDB-Tk [ 58 ] indicated that all 11 MAGs included in this analysis belong to the existing candidate phylum referred to as EX4484-52. The included genomes represent 6 families, 7 genera, and 10 species.
Consistent with the SeqCode Registry requirements for designation of type material we designate Candidatus Caliditerrarchaeum hikurangii (Assembly ID: GCA_013138765.1, Estimated completeness ∼90%, Estimated contamination: 1.6%, tRNAs: 20/20, 5S and partial 16S rRNA genes present) as type material for the phylum EX4484-52 with the new proposed name Caliditerrarchaeota, and the corresponding family (Caliditerrarchaeaceae), order (Caliditerrarchaeales), and class (Caliditerrarchaeia), following the principle of propagation from type material as outlined in SeqCode (Section 3, Rule 15). Additionally, we designate Candidatus Marinivulcanus frater (Assembly ID: GCA_015520605.1, Estimated completeness: ∼91%, Estimated contamination: 0%, tRNAs: 15/20, 5S rRNA gene present) as type material for the novel family Marinivulcanaceae. Description of ‘ Candidatus Caliditerrarchaeum’ gen. nov. ‘Caliditerrarchaeum’ (Cal.i.di.terr.ar.chae’um. L. adj. calidus warm, hot: L. fem. n. terra earth: N.L. neut. n. archaeum archaeon from Gr. adj. archaios −ê −on ancient; N.L. neut. n. An archaeon that inhabits hot earth, reflecting the preference for this lineage to inhabit hot sediments) Description of ‘ Candidatus Caliditerrarchaeum hikurangii’ sp. nov. ‘Caliditerrarchaeum hikurangii’ (hi.ku.ran.gi’i N.L. neut. n. hikurangii , of Hikurangi, due to the sample site from which the genome originates being found in the Hikurangi Margin, an active subduction zone in the deep sea located off the east coast of New Zealand) Description of ‘ Candidatus Marinivulcanus’ gen. nov. ‘Candidatus Marinivulcanus’ (mar.in.ni.vul.kan.nus. L. adj. marīnus marine: L. masc. n. vulcānus fire; N.L. masc. n. marine volcano, referring to the type genome within this genus originating from marine volcano sediments) Description of ‘ Candidatus Marinivulcanus frater’ sp. nov. Marinivulcanus frater (fra.ter. L. masc. n. 
frater brother; referring to the site this genome originates from, Brothers Volcano, a submarine volcano located in the Pacific Ocean) Concluding Remarks The Caliditerrarchaeota, which we infer to be fermentative thermophiles, occupy an evolutionarily important position as the closest sister to the extremely halophilic Nanohaloarchaeota (including both Nanosalinaceae and Asbonarchaeaceae ), but are not themselves halophiles. The inclusion of Caliditerrarchaeota in gene content analyses revealed that heightened tolerance to DNA damage and increased capacity for import and export of salt ions were key in the evolution of all currently known halophilic DPANN archaea. However, the results also indicated important differences between lineages such as the adaptation to oxic environments in the Nanohaloarchaeota and preferences for different protein families involved in the same functions e.g. S-layer proteins, Na + /H + antiporter, and citrate metabolism enzymes. Furthermore, the predicted acquisition of genes from host species via HGT highlights the potential importance of the symbiotic interactions these DPANN engage in for their adaptation to hypersalinity, although it remains possible these analyses are impacted by compositional attraction artefacts. Future work is necessary to confirm the potential partnership between Haloaenigmatarchaeaceae and Halarchaeoplasmatales and to assess the degree to which compositional biases impact the predicted rates of HGT between halophilic archaea. However, our work provides a framework for investigating the adaptation to hypersalinity in the DPANN archaea that can serve as a foundation for future work examining the evolution of halophily across the archaeal domain. Author Contributions JNH and AS conceived the study. JNH, ND, LEVA, CG, TAW, and AS performed genomic and phylogenetic analyses. JNH, TAW, LEVA, CG, and AS conducted data interpretation. JNH, ND, LEVA, CG, TAW, and AS wrote the manuscript.
All authors have read and approved the manuscript submission. Competing Interests The authors declare no competing interests. Code availability All custom scripts and workflows used to generate data can be found in our data repository at Zenodo [10.5281/zenodo.14627918] [ 38 ]. Data availability All datasets generated and/or analysed during this study are available in our data repository at Zenodo [10.5281/zenodo.14627918] [ 38 ]. Public databases used in this study are the following: the arCOG database (version from 2014) downloaded from [ ftp://ftp.ncbi.nih.gov/pub/wolf/COGs/arCOG/ ], the KO profiles downloaded from the KEGG Automatic Annotation Server in April 2019 [ https://www.genome.jp/tools/kofamkoala/ ], the Pfam database (Release 31.0) [ ftp://ftp.ebi.ac.uk/pub/databases/Pfam/releases/ ], the TIGRFAM database (Release 15.0) [ ftp://ftp.jcvi.org/pub/data/TIGRFAMs/ ], the Carbohydrate-Active enZymes (CAZy) database downloaded from dbCAN2 in September 2019 [ http://bcb.unl.edu/dbCAN2/download/ ], the MEROPs database (Release 12.0) [ https://www.ebi.ac.uk/merops/download_list.shtml ], the Transporter Classification Database (TCDB) downloaded in November 2018 [ http://www.tcdb.org/download.php ], the hydrogenase database (HydDB) downloaded in November 2018 [ https://services.birc.au.dk/hyddb/browser/ ], and NCBI_nr downloaded in November 2018 [ ftp://ftp.ncbi.nlm.nih.gov/blast/db/ ]. Acknowledgements This project has received funding from the Swedish Research Council (VR starting grant 2016-03559 to AS), the Netherlands Organization for Scientific Research Dutch Research Council (NWO) (WISE fellowship to AS and OCENW.M.22.117 to A.S.), the Moore–Simons Project on the Origin of the Eukaryotic Cell, (Simons Foundation 735929LPI to A.S. as Co-Pi; Gordon and Betty Moore Foundation, GBMF9741 to T.A.W. and A.S.), and the European Research Council (ERC) under the European Union’s Horizon 2020 research and innovation programme (grant agreement No.
947317, ASymbEL to A.S.). Our research is funded by the John Templeton Foundation (63451 to T.A.W. and A.S.); the opinions expressed in this publication are those of the authors and do not necessarily reflect the views of the John Templeton Foundation. Funder Information Declared Swedish Research Council , 2016-03559 Netherlands Organization for Scientific Research , WISE fellowship , OCENW.M.22.117 Simons Foundation , 735929LPI Gordon and Betty Moore Foundation , GBMF9741 the European Union’s Horizon 2020 research and innovation programme , grant agreement No. 947317, ASymbEL Footnotes https://zenodo.org/records/14627918 References 1. ↵ Castelle CJ , Wrighton KC , Thomas BC et al. Genomic Expansion of Domain Archaea Highlights Roles for Organisms from New Phyla in Anaerobic Carbon Cycling . Curr Biol 2015 ; 25 : 690 – 701 . OpenUrl CrossRef PubMed 2. ↵ Castelle CJ , Banfield JF . Major New Microbial Groups Expand Diversity and Alter our Understanding of the Tree of Life . Cell 2018 ; 172 : 1181 – 97 . OpenUrl CrossRef PubMed 3. ↵ Dombrowski N , Lee JH , Williams TA et al. Genomic diversity, lifestyles and evolutionary origins of DPANN archaea . FEMS Microbiol Lett 2019 ; 366 , DOI: 10.1093/femsle/fnz008 . OpenUrl CrossRef PubMed 4. ↵ Dombrowski N , Williams TA , Sun J et al. Undinarchaeota illuminate DPANN phylogeny and the impact of gene transfer on archaeal evolution . Nat Commun 2020 ; 11 : 3939 . OpenUrl CrossRef PubMed 5. ↵ Rinke C , Schwientek P , Sczyrba A et al. Insights into the phylogeny and coding potential of microbial dark matter . Nature 2013 ; 499 : 431 – 7 . OpenUrl CrossRef PubMed Web of Science 6. ↵ Rinke C , Chuvochina M , Mussig AJ et al. A standardized archaeal taxonomy for the Genome Taxonomy Database . Nat Microbiol 2021 ; 6 : 946 – 59 . OpenUrl PubMed 7. ↵ Huber H , Hohn MJ , Rachel R et al. A new phylum of Archaea represented by a nanosized hyperthermophilic symbiont . Nature 2002 ; 417 : 63 – 7 . OpenUrl CrossRef PubMed Web of Science 8.
Kato S , Ogasawara A , Itoh T et al. Nanobdella aerobiophila gen. nov., sp. nov., a thermoacidophilic, obligate ectosymbiotic archaeon, and proposal of Nanobdellaceae fam. nov ., Nanobdellales ord. nov. and Nanobdellia class. nov. Int J Syst Evol Microbiol 2022 ; 72 : 005489 . OpenUrl 9. St John E , Liu Y , Podar M et al. A new symbiotic nanoarchaeote (Candidatus Nanoclepta minutus) and its host (Zestosphaera tikiterensis gen. nov . , sp. nov.) from a New Zealand hot spring. Syst Appl Microbiol 2019 ; 42 : 94 – 106 . OpenUrl PubMed 10. ↵ Wurch L , Giannone RJ , Belisle BS et al. Genomics-informed isolation and characterization of a symbiotic Nanoarchaeota system from a terrestrial geothermal environment . Nat Commun 2016 ; 7 : 12115 . OpenUrl CrossRef PubMed 11. ↵ Hamm JN , Erdmann S , Eloe-Fadrosh EA et al. Unexpected host dependency of Antarctic Nanohaloarchaeota . Proc Natl Acad Sci U A 2019 ; 116 : 14661 – 70 . OpenUrl Abstract / FREE Full Text 12. La Cono V , Messina E , Rohde M et al. Symbiosis between nanohaloarchaeon and haloarchaeon is based on utilization of different polysaccharides . Proc Natl Acad Sci U A 2020 ; 117 : 20223 – 34 . OpenUrl Abstract / FREE Full Text 13. ↵ Reva O , Messina E , La Cono V et al. Functional diversity of nanohaloarchaea within xylan-degrading consortia . Front Microbiol 2023 ; 14 , DOI: 10.3389/fmicb.2023.1182464 . OpenUrl CrossRef PubMed 14. ↵ Golyshina OV , Toshchakov SV , Makarova KS et al. “ARMAN” archaea depend on association with euryarchaeal host in culture and in situ . Nat Commun 2017 ; 8 : 60 . OpenUrl CrossRef PubMed 15. ↵ Krause S , Bremges A , Munch PC et al. Characterisation of a stable laboratory co-culture of acidophilic nanoorganisms . Sci Rep 2017 ; 7 : 3289 . OpenUrl CrossRef PubMed 16. ↵ Zhang IH , Borer B , Zhao R et al. Uncultivated DPANN archaea are ubiquitous inhabitants of global oxygen-deficient zones with diverse metabolic potential . mBio 2024 ; 15 : e02918 – 23 . OpenUrl PubMed 17. ↵ Oren A . 
Novel insights into the diversity of halophilic microorganisms and their functioning in hypersaline ecosystems . Npj Biodivers 2024 ; 3 : 1 – 9 . OpenUrl CrossRef PubMed 18. ↵ Gutiérrez-Preciado A , Dede B , Baker BA et al. Extremely acidic proteomes and metabolic flexibility in bacteria and highly diversified archaea thriving in geothermal chaotropic brines . Nat Ecol Evol 2024 , DOI: 10.1038/s41559-024-02505-6 . OpenUrl CrossRef PubMed 19. ↵ Andrei AS , Banciu HL , Oren A . Living with salt: metabolic and phylogenetic diversity of archaea inhabiting saline ecosystems . FEMS Microbiol Lett 2012 ; 330 : 1 – 9 . OpenUrl CrossRef PubMed Web of Science 20. ↵ Narasingarao P , Podell S , Ugalde JA et al. De novo metagenomic assembly reveals abundant novel major lineage of Archaea in hypersaline microbial communities . ISME J 2012 ; 6 : 81 – 93 . OpenUrl CrossRef PubMed Web of Science 21. Sorokin DY , Makarova KS , Abbas B et al. Discovery of extremely halophilic, methyl-reducing euryarchaea provides insights into the evolutionary origin of methanogenesis . Nat Microbiol 2017 ; 2 : 17081 . OpenUrl PubMed 22. ↵ Baker BA , Gutiérrez-Preciado A , Rodríguez del Río Á et al. Expanded phylogeny of extremely halophilic archaea shows multiple independent adaptations to hypersaline environments. Nat Microbiol 2024 ; 9 : 964 – 75 . OpenUrl PubMed 23. ↵ Zhou H , Zhao D , Zhang S et al. Metagenomic insights into the environmental adaptation and metabolism of Candidatus Haloplasmatales, one archaeal order thriving in saline lakes . Environ Microbiol 2022 ; 24 : 2239 – 58 . OpenUrl 24. ↵ Bonnaud E , Oger PM , Ohayon A et al. Haloarchaea as Promising Chassis to Green Chemistry . Microorganisms 2024 ; 12 : 1738 . OpenUrl PubMed 25. ↵ Aouad M , Taib N , Oudart A et al. Extreme halophilic archaea derive from two distinct methanogen Class II lineages . Mol Phylogenet Evol 2018 ; 127 : 46 – 54 . OpenUrl CrossRef PubMed 26. ↵ Aouad M , Flandrois J-P , Jauffrit F et al. 
A divide-and-conquer phylogenomic approach based on character supermatrices resolves early steps in the evolution of the Archaea . BMC Ecol Evol 2022 ; 22 : 1 . 27. ↵ Baker BA , McCarthy CGP , López-García P et al. Phylogenomic analyses indicate the archaeal superphylum DPANN originated from free-living euryarchaeal-like ancestors . Nat Microbiol 2025 ; 10 : 1593 – 604 . OpenUrl PubMed 28. ↵ . Hug LA , Baker BJ , Anantharaman K et al. A new view of the tree of life . Nat Microbiol 2016 ; 1 : 16048 . OpenUrl PubMed 29. ↵ Mahendrarajah TA , Moody ERR , Schrempf D et al. ATP synthase evolution on a cross-braced dated tree of life . Nat Commun 2023 ; 14 : 7456 . OpenUrl CrossRef PubMed 30. ↵ . Li Yu-Xian , Rao Yang-Zhi , Qi Yan-Ling et al. Deciphering Symbiotic Interactions of “Candidatus Aenigmarchaeota” with Inferred Horizontal Gene Transfers and Co-occurrence Networks . mSystems 2021 ; 6 : doi: 10.1128/msystems.00606-21 . OpenUrl CrossRef 31. ↵ Dombrowski N , Teske AP , Baker BJ . Expansive microbial metabolic versatility and biodiversity in dynamic Guaymas Basin hydrothermal sediments . Nat Commun 2018 ; 9 : 4999 . OpenUrl CrossRef PubMed 32. ↵ Dombrowski N , Seitz KW , Teske AP et al. Genomic insights into potential interdependencies in microbial hydrocarbon and nutrient cycling in hydrothermal sediments . Microbiome 2017 ; 5 : 106 . OpenUrl CrossRef PubMed 33. ↵ Hou J , Sievert SM , Wang Y et al. Microbial succession during the transition from active to inactive stages of deep-sea hydrothermal vent sulfide chimneys . Microbiome 2020 ; 8 : 102 . OpenUrl CrossRef PubMed 34. ↵ Xie Y-G , Luo Z-H , Fang B-Z et al. Functional differentiation determines the molecular basis of the symbiotic lifestyle of Ca. Nanohaloarchaeota . Microbiome 2022 ; 10 : 1 – 13 . OpenUrl CrossRef PubMed 35. ↵ Zhao D , Zhang S , Kumar S et al. Comparative Genomic Insights into the Evolution of Halobacteria-Associated “Candidatus Nanohaloarchaeota.” mSystems 2022 ; 7 : e00669 – 22 . 
OpenUrl PubMed 36. ↵ Szöllősi GJ , Rosikiewicz W , Boussau B et al. Efficient Exploration of the Space of Reconciled Gene Trees . Syst Biol 2013 ; 62 : 901 – 12 . OpenUrl CrossRef PubMed 37. ↵ . Szöllősi GJ , Boussau B , Abby SS et al. Phylogenetic modeling of lateral gene transfer reconstructs the pattern and relative timing of speciations . Proc Natl Acad Sci 2012 ; 109 : 17513 – 8 . OpenUrl Abstract / FREE Full Text 38. ↵ Hamm JN , Dombrowski N , Valentin-Alvarado LE et al. Caliditerrarchaeota, a new sister to Nanohaloarchaeota, provides insights into the evolution of DPANN halophily . 2025 . 39. ↵ Steinegger M , Meier M , Mirdita M et al. HH-suite3 for fast remote homology detection and deep protein annotation . BMC Bioinformatics 2019 ; 20 : 473 . OpenUrl CrossRef PubMed 40. ↵ Haft DH , Selengut JD , White O . The TIGRFAMs database of protein families . Nucleic Acids Res 2003 ; 31 : 371 – 3 . OpenUrl CrossRef PubMed Web of Science 41. ↵ Katoh K , Standley DM . MAFFT multiple sequence alignment software version 7: improvements in performance and usability . Mol Biol Evol 2013 ; 30 : 772 – 80 . OpenUrl CrossRef PubMed Web of Science 42. ↵ Criscuolo A , Gribaldo S . BMGE (Block Mapping and Gathering with Entropy): a new software for selection of phylogenetic informative regions from multiple sequence alignments . BMC Evol Biol 2010 ; 10 : 210 . OpenUrl CrossRef PubMed 43. ↵ Nguyen LT , Schmidt HA , von Haeseler A et al. IQ-TREE: a fast and effective stochastic algorithm for estimating maximum-likelihood phylogenies . Mol Biol Evol 2015 ; 32 : 268 – 74 . OpenUrl CrossRef PubMed 44. ↵ Viklund J , Ettema TJG , Andersson SGE . Independent Genome Reduction and Phylogenetic Reclassification of the Oceanic SAR11 Clade . Mol Biol Evol 2012 ; 29 : 599 – 615 . OpenUrl CrossRef PubMed Web of Science 45. ↵ Kostka M , Uzlikova M , Cepicka I et al. SlowFaster, a user-friendly program for slow-fast analysis and its application on phylogeny of Blastocystis . 
BMC Bioinformatics 2008 ; 9 : 341 . OpenUrl CrossRef PubMed 46. ↵ Seemann T . Prokka: rapid prokaryotic genome annotation . Bioinformatics 2014 ; 30 : 2068 – 9 . OpenUrl CrossRef PubMed Web of Science 47. ↵ Galperin MY , Makarova KS , Wolf YI et al. Expanded microbial genome coverage and improved protein family annotation in the COG database . Nucleic Acids Res 2015 ; 43 : D261 – 9 . OpenUrl CrossRef PubMed 48. ↵ Makarova KS , Wolf YI , Koonin EV . Archaeal Clusters of Orthologous Genes (arCOGs): An Update and Application for Analysis of Shared Features between Thermococcales , Methanococcales, and Methanobacteriales. Life Basel Switz 2015 ; 5 : 818 – 40 . OpenUrl 49. ↵ Aramaki T , Blanc-Mathieu R , Endo H et al. KofamKOALA: KEGG Ortholog assignment based on profile HMM and adaptive score threshold . Bioinformatics 2020 ; 36 : 2251 – 2 . OpenUrl CrossRef PubMed 50. ↵ Bateman A , Coin L , Durbin R et al. The Pfam protein families database . Nucleic Acids Res 2004 ; 32 : D138 – 41 . OpenUrl CrossRef PubMed Web of Science 51. ↵ Yin Y , Mao X , Yang J et al. dbCAN: a web resource for automated carbohydrate-active enzyme annotation . Nucleic Acids Res 2012 ; 40 : W445 – 51 . OpenUrl CrossRef PubMed Web of Science 52. ↵ Saier MH , Tran CV , Barabote RD . TCDB: the Transporter Classification Database for membrane transport protein analyses and information . Nucleic Acids Res 2006 ; 34 : D181 – 6 . OpenUrl CrossRef PubMed Web of Science 53. ↵ Sondergaard D , Pedersen CN , Greening C . HydDB: A web tool for hydrogenase classification and analysis . Sci Rep 2016 ; 6 : 34212 . OpenUrl CrossRef PubMed 54. ↵ Jones P , Binns D , Chang HY et al. InterProScan 5: genome-scale protein function classification . Bioinformatics 2014 ; 30 : 1236 – 40 . OpenUrl CrossRef PubMed Web of Science 55. ↵ Altschul SF , Madden TL , Schaffer AA et al. Gapped BLAST and PSI-BLAST: a new generation of protein database search programs . Nucleic Acids Res 1997 ; 25 : 3389 – 402 . 
OpenUrl CrossRef PubMed Web of Science 56. ↵ Buchfink B , Reuter K , Drost HG . Sensitive protein alignments at tree-of-life scale using DIAMOND . Nat Methods 2021 ; 18 : 366 – 8 . OpenUrl CrossRef PubMed 57. ↵ Russel J , Pinilla-Redondo R , Mayo-Muñoz D et al. CRISPRCasTyper: Automated Identification, Annotation, and Classification of CRISPR-Cas Loci . CRISPR J 2020 ; 3 : 462 – 9 . OpenUrl CrossRef PubMed 58. ↵ Chaumeil PA , Mussig AJ , Hugenholtz P et al. GTDB-Tk: a toolkit to classify genomes with the Genome Taxonomy Database . Bioinformatics 2019 ; 36 : 1925 – 7 . OpenUrl CrossRef PubMed 59. ↵ Greening C , Cabotaje PR , Valentin-Alvarado LE et al. Minimal and hybrid hydrogenases are active from archaea . Cell 2024 ; 187 : 3357 – 3372 .e19. OpenUrl CrossRef PubMed 60. ↵ Spang A , Stairs CW , Dombrowski N et al. Proposal of the reverse flow model for the origin of the eukaryotic cell based on comparative analyses of Asgard archaeal metabolism . Nat Microbiol 2019 ; 4 : 1138 – 48 . OpenUrl PubMed 61. ↵ Wang H-C , Minh BQ , Susko E et al. Modeling Site Heterogeneity with Posterior Mean Site Frequency Profiles Accelerates Accurate Phylogenomic Estimation . Syst Biol 2018 ; 67 : 216 – 35 . OpenUrl CrossRef PubMed 62. ↵ Moody ERR , Mahendrarajah TA , Dombrowski N et al. An estimate of the deepest branches of the tree of life from ancient vertically evolving genes . Perry GH , Koonin EV (eds.). eLife 2022 ; 11 : e66695 . OpenUrl CrossRef PubMed 63. ↵ Reysenbach AL , St John E , Meneghin J et al. Complex subsurface hydrothermal fluid mixing at a submarine arc volcano supports distinct and highly diverse microbial communities . Proc Natl Acad Sci U S A 2020 ; 117 : 32627 – 38 . OpenUrl Abstract / FREE Full Text 64. ↵ Vázquez-Campos X , Kinsela AS , Bligh MW et al. Genomic Insights Into the Archaea Inhabiting an Australian Radioactive Legacy Site . Front Microbiol 2021 ; 12 : 732575 . 65. ↵ Berg IA , Kockelkorn D , Ramos-Vera WH et al. 
Autotrophic carbon fixation in archaea . Nat Rev Microbiol 2010 ; 8 : 447 – 60 . OpenUrl CrossRef PubMed Web of Science 66. ↵ Oren A . Diversity of halophilic microorganisms: Environments, phylogeny, physiology, and applications . J Ind Microbiol Biotechnol 2002 ; 28 : 56 – 63 . OpenUrl CrossRef PubMed Web of Science 67. ↵ Williams TA , Davin AA , Szánthó LL et al. Phylogenetic reconciliation: making the most of genomes to understand microbial ecology and evolution . ISME J 2024 ; 18 : wrae129 . OpenUrl CrossRef PubMed 68. ↵ Williams TA , Szollosi GJ , Spang A et al. Integrative modeling of gene and genome evolution roots the archaeal tree of life . Proc Natl Acad Sci U S A 2017 ; 114 : E4602 – 11 . OpenUrl Abstract / FREE Full Text 69. ↵ Raymann K , Brochier-Armanet C , Gribaldo S . The two-domain tree of life is linked to a new root for the Archaea . Proc Natl Acad Sci U S A 2015 ; 112 : 6670 – 5 . OpenUrl Abstract / FREE Full Text 70. ↵ Petitjean C , Deschamps P , Lopez-Garcia P et al. Rooting the Domain Archaea by Phylogenomic Analysis Supports the Foundation of the New Kingdom Proteoarchaeota . Genome Biol Evol 2015 ; 7 : 191 – 204 . OpenUrl CrossRef PubMed 71. ↵ Comolli LR , Banfield JF . Inter-species interconnections in acid mine drainage microbial communities . Front Microbiol 2014 ; 5 : 367 . OpenUrl CrossRef PubMed 72. Hamm JN , Liao Y , von Kügelgen A et al. The parasitic lifestyle of an archaeal symbiont . Nat Commun 2024 ; 15 : 6449 . OpenUrl PubMed 73. ↵ Xie B , Wang J , Nie Y et al. Type IV pili trigger episymbiotic association of Saccharibacteria with its bacterial host . Proc Natl Acad Sci U S A 2022 ; 119 : e2215990119 . OpenUrl CrossRef PubMed 74. ↵ Jones DL , Baxter BK . DNA Repair and Photoprotection: Mechanisms of Overcoming Environmental Ultraviolet Radiation Exposure in Halophilic Archaea . Front Microbiol 2017 ; 8 : 1882 . OpenUrl CrossRef PubMed 75. ↵ Oren A . 
Life at high salt concentrations, intracellular KCl concentrations, and acidic proteomes . Front Microbiol 2013 ; 4 . 76. ↵ Hamann E , Tegetmeyer HE , Riedel D et al. Syntrophic linkage between predatory Carpediemonas and specific prokaryotic populations . ISME J 2017 ; 11 : 1205 – 17 . OpenUrl CrossRef PubMed 77. ↵ Ortiz-Alvarez R , Casamayor EO . High occurrence of Pacearchaeota and Woesearchaeota (Archaea superphylum DPANN) in the surface waters of oligotrophic high-altitude lakes . Environ Microbiol Rep 2016 ; 8 : 210 – 7 . OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted August 07, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Caliditerrarchaeota, a new sister to Nanohaloarchaeota, provides insights into the evolution of DPANN halophily Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Caliditerrarchaeota, a new sister to Nanohaloarchaeota, provides insights into the evolution of DPANN halophily Joshua N. Hamm , Nina Dombrowski , Luis E. Valentin-Alvarado , Chris Greening , Tom A. Williams , Anja Spang bioRxiv 2025.08.05.668663; doi: https://doi.org/10.1101/2025.08.05.668663 Share This Article: Copy Citation Tools Caliditerrarchaeota, a new sister to Nanohaloarchaeota, provides insights into the evolution of DPANN halophily Joshua N. Hamm , Nina Dombrowski , Luis E. Valentin-Alvarado , Chris Greening , Tom A. 
Williams , Anja Spang bioRxiv 2025.08.05.668663; doi: https://doi.org/10.1101/2025.08.05.668663 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Evolutionary Biology Subject Areas All Articles Animal Behavior and Cognition (7640) Biochemistry (17706) Bioengineering (13902) Bioinformatics (41978) Biophysics (21465) Cancer Biology (18611) Cell Biology (25528) Clinical Trials (138) Developmental Biology (13387) Ecology (19920) Epidemiology (2067) Evolutionary Biology (24332) Genetics (15615) Genomics (22519) Immunology (17747) Microbiology (40424) Molecular Biology (17194) Neuroscience (88662) Paleontology (667) Pathology (2838) Pharmacology and Toxicology (4827) Physiology (7650) Plant Biology (15160) Scientific Communication and Education (2046) Synthetic Biology (4302) Systems Biology (9826) Zoology (2271)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper — AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00