Deconstructing the common anteroposterior organisation of adult bilaterian guts

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 190,340 characters · extracted from preprint-html · click to expand
Deconstructing the common anteroposterior organisation of adult bilaterian guts | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var 
i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Deconstructing the common anteroposterior organisation of adult bilaterian guts View ORCID Profile Stefano Davide Vianello , View ORCID Profile Ching-Yi Lin , Wahyu Cristine Pinem , Han-Ru Li , View ORCID Profile Kun-Lung Li , Grace Sonia , View ORCID Profile Shu-Hua Lee , Szu-Kai Wu , View ORCID Profile Vincent Laudet , View ORCID Profile Yi-Hsien Su , View ORCID Profile Jr-Kai Yu , View ORCID Profile Stephan Q. 
Schneider doi: https://doi.org/10.1101/2025.07.02.662275 Stefano Davide Vianello 1 Marine Research Station, Institute of Cellular and Organismic Biology, Academia Sinica , Yilan, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Stefano Davide Vianello For correspondence: stefano{at}vianello.ai vincent.laudet{at}oist.jp yhsu{at}as.edu.tw jkyu{at}gate.sinica.edu.tw sqschneider{at}gate.sinica.edu.tw Ching-Yi Lin 2 Institute of Cellular and Organismic Biology, Academia Sinica , Taipei 11529, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Ching-Yi Lin Wahyu Cristine Pinem 3 Department of Bioscience and Biotechnology, National Taiwan Ocean University 2 Institute of Cellular and Organismic Biology, Academia Sinica , Taipei 11529, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site Han-Ru Li 2 Institute of Cellular and Organismic Biology, Academia Sinica , Taipei 11529, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site Kun-Lung Li 2 Institute of Cellular and Organismic Biology, Academia Sinica , Taipei 11529, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Kun-Lung Li Grace Sonia 2 Institute of Cellular and Organismic Biology, Academia Sinica , Taipei 11529, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site Shu-Hua Lee 1 Marine Research Station, Institute of Cellular and Organismic Biology, Academia Sinica , Yilan, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Shu-Hua Lee Szu-Kai Wu 1 Marine Research Station, Institute of Cellular and Organismic Biology, Academia Sinica , Yilan, Taiwan Find this author on Google Scholar 
Find this author on PubMed Search for this author on this site Vincent Laudet 1 Marine Research Station, Institute of Cellular and Organismic Biology, Academia Sinica , Yilan, Taiwan 4 Marine Eco-Evo-Devo Unit, Okinawa Institute of Science and Technology Graduate University , Onna son, Okinawa, Japan 5 CNRS IRL 2028 “Eco-Evo-Devo of Coral Reef Fish Life Cycle” (EARLY) Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Vincent Laudet For correspondence: stefano{at}vianello.ai vincent.laudet{at}oist.jp yhsu{at}as.edu.tw jkyu{at}gate.sinica.edu.tw sqschneider{at}gate.sinica.edu.tw Yi-Hsien Su 2 Institute of Cellular and Organismic Biology, Academia Sinica , Taipei 11529, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Yi-Hsien Su For correspondence: stefano{at}vianello.ai vincent.laudet{at}oist.jp yhsu{at}as.edu.tw jkyu{at}gate.sinica.edu.tw sqschneider{at}gate.sinica.edu.tw Jr-Kai Yu 2 Institute of Cellular and Organismic Biology, Academia Sinica , Taipei 11529, Taiwan 1 Marine Research Station, Institute of Cellular and Organismic Biology, Academia Sinica , Yilan, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Jr-Kai Yu For correspondence: stefano{at}vianello.ai vincent.laudet{at}oist.jp yhsu{at}as.edu.tw jkyu{at}gate.sinica.edu.tw sqschneider{at}gate.sinica.edu.tw Stephan Q. Schneider 2 Institute of Cellular and Organismic Biology, Academia Sinica , Taipei 11529, Taiwan 3 Department of Bioscience and Biotechnology, National Taiwan Ocean University Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Stephan Q. 
Schneider For correspondence: stefano{at}vianello.ai vincent.laudet{at}oist.jp yhsu{at}as.edu.tw jkyu{at}gate.sinica.edu.tw sqschneider{at}gate.sinica.edu.tw Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract A through-gut is one of the major features of bilaterians. Comparative work among bilaterians has identified common molecular mechanisms during early gut patterning, but the primordial gut later often undergoes different degrees of reorganization in each lineage to form a fully differentiated adult gut with specializations along its anteroposterior (AP) axis. Yet, how the conserved embryonic gut AP pattern relates to the adult guts in diverse bilaterians after metamorphosis is still poorly understood. To unravel the molecular subdivisions of adult guts, we investigated the gut through transcriptomic analyses of five phylogenetically informative species, an annelid, a sea urchin, a hemichordate, a cephalochordate, and a vertebrate. We identified bipartite transcriptional programs defining the AP functional subdivisions. Patterning systems composed of Hox, Parahox, and, surprisingly, other transcription factors (TFs) known to be involved in gut formation in sea urchin larvae are maintained in these adult tissues. Using unbiased analyses, we identified five conserved TF modules corresponding to the AP compartments of the guts that are elaborated or shifted in different species. Our study inferred conserved and modified adult AP patterning modules along bilaterian guts enabling the reconstruction of ancestral bilaterian features with profound implications for the evolution of the bilaterian body plan. Introduction The through-gut: an evolutionary old invention in bilaterians A through-gut, a “one-way” digestive organ with a mouth and anus, is one of the major features of animals with bilateral symmetry, the bilaterians. Vertebrates, including humans, share this feature with e.g. 
sea urchins, acorn worms, flies, tardigrades, molluscs, and worms, suggesting that an inner digestive tube was already established in the last common ancestor. Through-guts have however also been identified within non-bilaterian clades and phyla which are not currently believed to have had a through-gut ancestor ( Dunn et al., 2022 ; Han et al., 2018 ; Zhang et al., 2022 ; Zhao et al., 2019 ). Within the Cnidaria, which classically harbour instead a blind-gut configuration in which food enters and exits from a single, shared external opening ( Ruppert et al., 2004 ), some species do indeed display veritable “one-way” through-guts ( Avian et al., 2022 ), or guts that are not completely blind due to mixed anatomical solutions ( Aria & Chan, 1989 ). Another non-bilaterian phylum, Ctenophora (comb jellies), has also long been known to possess through-guts ( Presnell et al., 2016 ; Miyake et al., 2019 ; Tamm, 2019 ). The actual homology between these non-bilaterians and bilaterian through-guts remains uncertain. Such an assessment is mostly complicated by the outstanding phylogenetic and paleontological uncertainty on the order of emergence of metazoan phyla ( Kapli et al., 2021 ; Laumer et al., 2018 ; Nanglu et al., 2023 ; Peterson & Eernisse, 2016 ; Silva et al., 2025 ), and the consequent debated phylogenetic position of key non-bilaterian and bilaterian phyla with divergent gut architectures ( Gavilán et al., 2019 ; Hejnol & Martindale, 2008 ; Mayorova et al., 2025 ; Smith & Mayorova, 2019 ). Even within extant species, assessments of homology between through-guts are still restricted by a relative limitedness of histological/molecular/genetic characterisations of bilaterian and non-bilaterian key model species. 
Though efforts to find a shared comparative basis between animal guts are making significant progress in this area (on a developmental biology basis, see below), there remains a fundamental uncertainty about which regions of the gut should be used as terms of comparison between adult guts with different architectures, or even between through-guts of different species. Accordingly, even though some bilaterians do not have a through-gut (most notably, many Platyzoa; ( Hejnol & Martín-Durán, 2015 )), the prevalence of through-guts across bilaterians ( Hejnol & Martín-Durán, 2015 ; Maderspacher, 2009 ), the current rooting of both Cnidarians and Ctenophores to blind-gut ancestors ( Dunn et al., 2022 ; Han et al., 2018 ; Zhang et al., 2022 ; Zhao et al., 2019 ), and the recent identification of through-gutted Ediacaran fossils with bilaterian affinity ( Martynov & Korshunova, 2022 ; Schiffbauer et al., 2020 ) currently do support the interpretation of through-gut evolution as a milestone developmental transition at the base of the bilaterian clade rather than a repeatedly lost earlier metazoan innovation. Functional and anatomical divergence of a common bilaterian through-gut Today, bilaterian adult through-guts display a remarkable variety of forms and functions across phyla, species and diets ( Yonge, 1937 ; Engel & Moran, 2013 ; Lobo-da-Cunha, 2019 ; Nakayama et al., 2019 ). Beyond the widespread variation in gut length and/or gut cell type proportions familiarly associated with dietary specialisations ( Duque-Correa et al., 2021 ; Fages et al., 2024 ), examples include veritable anatomical oddities such as the “fractal” gut anatomy of branched annelids ( M’Intosh, 1879 ; Aguado et al., 2022 ), and highly divergent anatomical adaptations such as the “armored” stomach of scorpion-eating mice ( Horner et al., 1964 ). 
Similarly, some bilaterian through-guts are capable of functions that have generally found few or no equivalents in other species: the through-gut of many holothurians can be everted as a defense mechanism ( Wilkie, 2001 ), and the gut of two recently extinct frog species was uniquely able to temporarily dedifferentiate into a non-digestive brooding chamber ( Fanning et al., 1982 ). Examples of through-gut anatomical and functional variation abound, and add to the parallel remarkable variety in presence, number and form of buds/diverticula/glands/organs of unclear homology that connect to- or branch off from varying points of the gut tube across many bilaterian species, or seem to be completely missing instead in others ( Cornelius, 1985 ). Yet, even in the face of such diversity, a picture starts to emerge whereby the remarkable variety of bilaterian through-gut forms and functions may be understood as the result of (divergent or convergent) evolutionary, ontogenetic or ecological modification of an underlying common structure. That is, the placement of the through-gut at the base of the bilaterian tree predicts that an underlying set of core anatomical and/or functional modules would exist and be homologous across all bilaterian through-guts. Current investigative efforts in this direction are mostly searching for such homologies in terms of conserved gene expression patterns and conserved gene regulatory networks: molecular data assessed at phylotypic stages, at early embryonic/larval stages where the through-gut shows the first signs of patterning, and at gastrulation ( Annunziata et al., 2019 ; Annunziata & Arnone, 2014 ; Boyle et al., 2014 ; He et al., 2020 ; Nowotschin et al., 2019 ; Sherwood et al., 2009 ). The formation of the embryonic basis that will act as a substrate for the elaboration of postembryonic identities (e.g. 
in vertebrates, the embryonic gut tube) is itself highly divergent and non-equivalent across species: bilaterian through-guts are formed through a wide variety of embryonic processes, germ layer contributions, and non-equivalent topological transformations ( Grapin-Botton & Melton, 2000 ; Nakazawa et al., 2013 ; Nowotschin et al., 2019 ; Nowotschin & Hadjantonakis, 2020 ; Wallace & Pack, 2003 ). Yet, investigations of cross-species correspondences in developing guts show strong conservation of anteroposterior (AP) patterns of gene expression and of the underlying gene-regulatory networks during the patterning process itself, even across distant phyla ( Annunziata et al., 2019 ; Annunziata & Arnone, 2014 ; Boyle et al., 2014 ; Cole et al., 2009 ; Magri et al., 2024 ; Voronov et al., 2024 ). Such deep conservation of molecular signatures, developmental mechanisms, and patterning systems makes the independent repeated evolution of bilaterian through-guts unlikely, and has allowed broad homologies between embryonic gut territories to be sketched out ( Annunziata et al., 2019 ; He et al., 2020 ). The diversity of bilaterian guts would have, at least in these terms, a common, comparable basis, further elaborated upon by gains, losses, and rearrangements throughout the bilaterian tree. Critically, investigations based on gene expression signatures have also allowed new, non-intuitive connections to be drawn even between highly divergent gut structures, further allowing the discrimination between ancestral and derived functions. Most recently, a link between the vertebrate pancreas and specific cell types and cell functions was found within the gut tube of the sea urchin ( Paganos et al., 2022 ; Perillo et al., 2016 ). 
Similar considerations apply to the vertebrate liver organ, though the evolutionary rooting of this organ has up to now focused on the chordate branch ( Wu et al., 2024 ) and the homology with protostome liver-like organs/cells is still to be assessed ( Cornelius, 1985 ; Dai et al., 2024 ; Li & Zhang, 2010 ; Subbotin, 2017 ). In general, much remains to be done before we can distinguish between true through-gut innovations and highly divergent deeply homologous structures. It also fundamentally remains unclear whether correspondences between through-gut regions may extend beyond the tripartite “foregut”, “midgut”, “hindgut” framework that has been defined from embryonic and larval gene expression patterns. Critically, identifying a shared signature across extant bilaterian guts, conserved across millions of years of evolution, may provide a possible identikit of the likely features of its ancestral counterpart. Conversely, the modes through which the original through-gut might have been used to interact with, process, and exploit a wide variety of nutrients, and their effective distribution across its AP length, may have left a deep homologous signature to be recovered across extant bilaterian through-guts, regardless of their current digestive solutions and highly divergent gastrointestinal variations. Justification of current study In this study, we analyse anteroposteriorly-resolved transcriptomic data collected along the adult gut of five bilaterian species, to compare AP gene expression patterns and identify regional equivalences. We seek to define an interpretative lens, based on molecular data, through which the adult bilaterian gut may best be understood. We find such an interpretative lens in an AP scaffold that is overall organised in two compartments, and along which are arranged a specific set of five conserved expression modules which otherwise underlie highly divergent AP organisation of shared functions. 
Our investigation has implications beyond comparative studies of adult gut function and evolution, potentially informing equivalent frameworks through which to understand their embryonic/ontogenetic basis, historical and evolutionary reconstructions on the likely adult configuration of the through-gut ancestor, and offers a potential avenue to assess the homology of the alternative adult through-guts found in non-bilateria. Results Section 1: Adult guts in annelids, hemichordates, echinoderms, cephalochordates, and vertebrates We considered five marine organisms across main branches of the bilaterian evolutionary tree. As a representative of the protostomes, the annelid worm Platynereis dumerilii (Audouin & Milne Edwards, 1833; Dumeril’s clam worm, “Pd”; ( Özpolat et al., 2021 )). Among deuterostomes, within the Ambulacraria, the echinoderm Strongylocentrotus purpuratus (Stimpson, 1857; purple sea urchin, “Sp”) and the hemichordate Ptychodera flava (Eschscholtz, 1825; acorn worm, “Pf”). For the chordate branch, the cephalochordate Branchiostoma floridae (Hubbs, 1922; Florida lancelet, “Bf”), and the vertebrate Amphiprion ocellaris (Cuvier and Valenciennes, 1830; common clownfish, “Ao”; ( Roux et al., 2020 )). We then dissected out the entire adult gastrointestinal tract (with associated digestive organs if applicable) from each of the five species under consideration (with the exception of Pf, see Methods), and further subdivided each gastrointestinal tube into subsegments taken to span the entire length of each tract, from anterior to posterior ( Figure 1A ). All segments from each species were processed for RNA sequencing. Detailed documentation about the dissection criteria, the dissection process, transcriptome extraction and sequencing are provided in Materials and Methods , Supplementary Figure 1×1 , and Supplementary Figure 1×2 . Download figure Open in new tab Figure 1: Adult guts in annelids, hemichordates, echinoderms, cephalochordates, and vertebrates. 
A ) Schematic phylogeny of the 5 bilaterian species compared in this study, and of their gastrointestinal anatomy. In red, schematic illustration of the gut segments collected, arranged along the gut AP axis. A, anterior; P, posterior; Or, oral; Ab, aboral. B ) For each species, heatmap of the Spearman’s Rank Correlation coefficients between all pairs of gut segments (white, low; purple, high). Segments are numbered sequentially, and color-coded, according to AP position (where applicable). Grey line: segments of the first compartment. Light blue line: segments of the second compartment. C ) For each species, distribution of gut segments (all replicates) across the two main Principal Components (PCs; PC1, PC2). Segments are color-coded and numbered by increasing AP position, as in B. The clownfish liver segment is omitted because it dominated the variance of the combined dataset. D ) For each species, heatmap showing the expression pattern (z-scores) of the top 2000 most-variant genes, along the gut (columns: AP-ordered gut segments). Genes (rows) are ordered according to Rank-2 Elliptical seriation (R2E). Dark rectangle: segments classified as “block compartment”; Graded rectangle: segments classified as “gradient compartment” (see main text). Here again the expression data for the clownfish liver segment is not included as the organ is not part of the adult AP structure. Having thus obtained anteroposteriorly-resolved transcriptomic data of the gastrointestinal tract of five bilaterian species, we then proceeded to investigate the broadscale structure of gene expression across each, aiming to identify conserved principles of bilaterian gut organisation. We first aimed to investigate whether gene expression similarities, within each species, would allow us to summarise segments into a smaller set of equivalent “domains”, whether such domains would reflect the AP position of the segments themselves (i.e. 
would group contiguous segments or not), and whether such broader domains would reveal a conserved higher-order AP compartmentalisation of gene expression across bilaterian guts (e.g. a tripartite one). We alternatively hypothesise that we could recover instead a continuous, gradual shift in transcriptomic similarity scores traversing the entire AP length of the gastrointestinal tract, a configuration that may or may not then further reveal itself to be conserved across through-guts. By analysing the Spearman’s Rank Correlation coefficients between gut segments, calculated on the top 2000 most variant genes expressed in each gut, we do identify a conserved organisation of gene expression along all five guts, and one with a mixed profile between the two scenarios mentioned above ( Figure 1B ). Specifically we note that i ) anteriormost gut segments can consistently be summarised as a single well-defined molecular compartment (which excludes expected highly-dissimilar pre-oral segments, see the case in Pf), and ii ) segments posterior to this first domain, up to the terminal-most end of the gut, define a second compartment of graded AP similarity where transcriptional similarity decays with distance. In species such as Pd and Sp, the terminal-most segments further appear to be distinct enough from the preceding segments of the same domain to define what could be identified as a third (sub)domain. In other words, we consistently identify two main gut compartments in all five through-guts, which we describe here as an anterior “block” compartment and a posterior “gradient” compartment. In contrast to the perhaps more conventional tripartite understanding of bilaterian guts, often also applied to the adult configuration, we only see such an organisation in a few of the species considered (Pd, Sp; whose grouping would be polyphyletic), and as a subregion at the posterior of the gradient compartment. 
Principal Component Analysis ( Figure 1C ) does not resolve clearer-cut groupings (except for Sp). Across the top principal components, segments distribute instead into distinctive arch-shaped arrangements, which resolve the actual AP anatomical position of the segment across the gut tube. Critically, AP position would seem to be the explanatory factor underlying the main transcriptional variability within bilaterian guts, supporting AP ordination of gene expression as a shared feature of bilaterian guts. In all species considered, the first axis of transcriptional variation (PC1) would correspond to differences between anterior segments and segments just posterior to them (i.e. anterior segments of the gradient compartment), while the second axis of variation (PC2) would seem to reflect gene-expression patterns characteristic of terminal segments. Interestingly, the most dissimilar regions of the through-gut would not be the most distant ones (mouth+oesophagus vs the hindgut/anus), but rather the anterior vs middle regions. We stress however that arch/horseshoe-shaped patterns in PCA can result from well-known properties of auto-correlated data ( Podani & Miklós, 2002 ), and can lead to erroneous interpretations of sample similarity and of the effective drivers of sample differences ( Camiz, 2005 ; Morton et al., 2017 ; Novembre & Stephens, 2008 ; Shah et al., 2024 ; Shinn, 2023 ). We note that we could not rule out nor confirm that the above segment (dis)similarity inferences are artefactual. For this reason, and because the degree of similarity between bilaterian through-gut termini has particular importance in gut EvoDevo, we preferred to root our assessment of segment affinities on approaches that do not rely on dimensionality reduction throughout the rest of this work. We therefore proceeded to visualise the actual patterns of the genes expressed across through-gut segments ( Figure 1D ). 
We use heatmaps and combine them with a seriation criterion able to highlight long-range gradients in expression pattern (Rank-2 Elliptical seriation, “R2E”; ( Chen, 2002 )). We expect such long-range gradients in expression patterns from our sample-correlation analysis, PCA, and the increasing literature on gene expression organisation across adult guts ( Buchon et al., 2013 ; Fang et al., 2006 ; Zwick et al., 2024 ). We observed that the main organisation of gene expression along all guts indeed consistently highlights a first set of genes marking anterior segments and a second group of genes with a much more pronounced graded distribution spanning the segments of the second compartment. Since our transcriptomic data can be directly linked to the actual anatomical location of the segments, we clearly notice that the boundary defining the separation between these two conserved through-gut domains invariably corresponds to an actual anatomical boundary in the form of a sphincter. This sphincter — which we would suggest to be a key reference transition point between two potentially comparable regions of bilaterian through-gut architecture — is not considered to be an equivalent structure across bilaterians (“pyloric sphincter” in vertebrates, and the transition between esophagus and stomach in sea urchin/invertebrates). In this new interpretative key, we would like to refer to it as the “transition sphincter”. We also note that species that show a clearer third subcompartment, in transcriptomic terms, are also species with further sphincters downstream of the “transition sphincter” (for example, the boundary between stomach and intestine of sea urchins). These downstream sphincters however do not lead to such a clear-cut transition between gene expression profiles and are still traversed by extensive AP gradients of gene expression that do not stop at them. 
Studies of the Drosophila through-gut, where meticulous characterisation of the correspondences between anatomical sphincters and gene expression boundaries is available ( Buchon et al., 2013 ), similarly identify the anterior “cardiac” sphincter as the anatomical site of the majority of gene expression boundaries, i.e. the site of highest gene expression discontinuity. In conclusion, we find bilaterian adult guts to be best summarised as “anterior-block, posterior gradient” systems, with the transition sphincter in between. Section 2: Hox and Parahox patterning systems in adult guts in bilaterian lineages Hox genes are the most likely candidate for an AP reference system along the bilaterian gut. Though the investigation of their axial expression patterns has extensively focused on neuroectodermal and mesodermal tissues, it has long been put forward that the expression pattern in these tissues may have been just a later recruitment of an original patterning system of the gut tube ( van der Hoeven et al., 1996 ). Moreover, Hox genes are notably amongst the few embryonic gut patterning genes whose expression is well known to persist in the adult gut ( Morgan, 2006 ; Yahagi et al., 2004 ) to the point that detailed maps of their expression patterns for key vertebrate models are widely available ( Yahagi et al., 2004 ). Based on the most recent genomic annotations, we first determined a conservative reconstruction of the full Hox complement of the common clownfish (see Materials and Methods ; 47 Hox genes, 38 of which expressed in the gut). We further verified previously-published reconstructions of the Hox complement in the other four species under consideration ( Cameron et al., 2006 ; Freeman et al., 2012 ; Hejnol et al., 2021 ; Takatori et al., 2008 ) ( Figure 2A ). We are then able to describe the complete map of antero-posterior expression of Hox genes across the entire adult gut of the five bilaterian species considered ( Figure 2B ). 
Due to the presence of 7 different Hox clusters in clownfish, we order Hox genes in a way that reconstructs their AP sequence of expression (R2E seriation, which indeed overall matches paralogue numbers), but we also provide cluster-specific maps (ordered by paralogue number), and paralogue-specific maps (ordered by cluster) in Supplementary Figure 2×1 for more convenient reference. Download figure Open in new tab Figure 2: Hox and Parahox patterning systems in adult guts in bilaterian lineages A ) Reconstruction of the Hox complement of the 5 species under study, in reference to the fruit fly model ( Drosophila melanogaster ). Hox genes are color coded by general AP position from blue to yellow/orange, to pink/purple. Hollow rectangles indicate absence of expression of the corresponding Hox gene in the gut dataset. PG, paralogous group. B ) For each species, heatmap showing the expression pattern (z-scores) of all expressed Hox genes, along the gut AP axis. Genes (rows) are ordered according to Hox paralogue number, except in clownfish where they are ordered according to R2E. C ) For each species, heatmap showing the expression pattern (z-scores) of all expressed ParaHox genes, along the gut AP axis. Solid and graded rectangles indicate segments previously assigned to block and gradient gut compartments, as defined in previous sections. Download figure Open in new tab Supp. Figure 2×1: Alternative visualisations of Hox expression across the clownfish gut Heatmaps showing the expression pattern (z-scores) of all expressed Hox genes, along the AP axis of the clownfish gut (including the liver segment). In A) genes (rows) are grouped by genomic cluster and ordered according to Hox paralogue number within each. In B) genes (rows) are grouped by paralogue group (PG) and ordered according to Hox cluster within each. Color codes are as in Figure 2 . 
Solid and graded rectangles under the heatmaps indicate segments previously assigned to block and gradient gut compartments, as defined in previous sections. We find that Hox genes are expressed along the gut of all bilaterian species considered, and we recover an overall collinear AP pattern of gene expression in all species, even in species whose Hox genes are not genomically collinear such as Sp ( Figure 2B ; ( Cameron et al., 2006 )). Anteriormost Hox genes are mostly overlappingly expressed as a single block within anterior segments; central and posterior Hox genes are predominantly expressed in segments posterior to those, in a nested, graded fashion that defines increasingly posterior segments and coincides with the graded compartment discussed in Section 1 ( Figure 2B ). Critically, we therefore find a correspondence between the block-gradient expression pattern of Hox genes and the overall block-gradient organisation of gene expression along the gut ( Section 1 ). We are able to identify other recurring features of the Hox patterning system across bilaterian guts: i ) segments that are not part of the actual linear AP sequence of the gut tube (bifurcations and separated organs) tend to be excluded from the Hox patterning system (see Bf hepatic caecum, Ao liver), and ii ) the anteriormost segments of the gradient compartment consistently show lowest expression of Hox genes, and lowest number of Hox genes expressed (see Pd t2 and stomach, Sp stomach1/2/3, Pf hepatic1, Bf midgut, Ao pyloric caeca and Anterior intestine). In this sense, the expression of middle Hox genes is often shifted away from the posteriormost boundary of expression of anterior Hox genes, leaving intervening segments Hox-poor (one exception is Pf, likely due to the inclusion of the ectodermal layers that obscure the analysis result). 
We finally note that Hox genes also allow us to define an anteriormost terminus of the gut AP system, with pre-oral and oral structures generally not showing anterior Hox gene expression (see Pd mouth and stomodeum, Sp pharynx, and Pf pre-oral segments). This same pattern (anteriormost Hox genes overlapping in the anterior gut, posteriormost genes grading the posterior, and relative paucity of Hox genes expressed in the intervening segments) is indeed the pattern recovered for the embryonic gut of the mouse ( Beck et al., 2000 ; Kawazoe et al., 2002 ; Sekimoto et al., 1998 ). We here recover it as a conserved signature of adult bilaterian through-guts, therefore locating the gut Hox code as a likely feature of the bilaterian ancestor, specifically in the deployment pattern highlighted above. We then investigated the pattern of expression of ParaHox genes Gsx, Pdx, Cdx ( Figure 2C ). We confirm the general exclusion of Gsx as part of the bilaterian gut patterning system, though we note that we do detect its expression not only in Pd (matching larval reports, ( Hui et al., 2009 )), but also in some segments of Bf. In neither case, and therefore in none of the adult guts here considered, does Gsx appear to carry anterior information. We confirm instead that the classic ParaHox gut patterning system of sequential Pdx and Cdx expression is a distinctive feature of adult bilaterian guts, and we note that these two ParaHox genes are specifically deployed to pattern the gradient compartment and not the block compartment. Critically, with Pdx, the ParaHox system fills in the Hox-poor, intermediate, segments, in fact most often allowing us to determine the anteriormost boundary of the gradient compartment. Gut tube bifurcations and separated organs are excluded from the ParaHox system, just as they are from the Hox system (see again Bf hepatic caecum, Ao liver). 
We observed that the relative position of the anterior edge of Cdx expression (relative to the Pdx domain) is quite variable across species, just as is the posterior boundary of Pdx expression, but that only in clownfish does Cdx extend all the way to the anterior of the gradient compartment ( Figure 2C ). In summary, we find that adult bilaterian guts share a common complementary Hox and ParaHox AP organisation system, deployed on a bipartite basis just like the overall gene expression patterns, and that only includes segments that are part of the actual linear AP sequence of the gut. With an anterior boundary that does not necessarily match the anteriormost segments of the gastrointestinal tube, bilaterian guts share a Hox and ParaHox AP coordinate system of i ) segments characterised by block expression of anterior Hox genes, and no ParaHox, ii ) segments characterised by Pdx expression with low levels of Hox expression, iii ) segments characterised by graded expression of posterior ParaHox (Cdx) and posterior Hox genes. The anterior Hox segments correspond to the posterior region of the anterior block compartment, while the Pdx segments and the Cdx/Hox segments coincide with the posterior gradient compartment. Section 3: Larval AP patterning genes display regionalized expression pattern along adult guts in bilaterian invertebrates Having recovered the persistent expression of Hox and ParaHox embryonic patterning genes along the adult gut of all the species considered, we investigated the extent to which this might be a conserved feature of other genes classically associated with gut tube AP patterning. Traditionally, these genes have been studied (and defined) based on embryonic or larval stages. Given the absence of established sets of conserved adult gastrointestinal AP patterning transcription factors, we resort to these classical embryonic signatures, hypothesising that they might also be recovered in adult guts just as Hox and ParaHox genes are. 
We therefore refer to the set of conserved transcription factors defined in Annunziata et al., 2014 , shown to pattern the AP axis of the developing gut tube of early sea urchin larvae and as such representing a set of evolutionary conserved gut patterning markers shared with vertebrate embryos ( Annunziata et al., 2014 ) and bilaterian embryos more generally ( Boyle et al., 2014 ). We show that the expression of all of these early patterning markers (including, here again, Hox and ParaHox genes) is conserved along the Strongylocentrotus purpuratus adult gut, virtually unchanged ( Figure 3A ). We find this conservation extraordinary, not only because it suggests the long-term permanence of a “larval” AP gut signature long into adulthood, but also because such signature is manifestly retained even across drastic ontogenic restructuring of the very physical materiality of the gut tube itself, as is the case of what happens specifically to the sea urchin gut tube during metamorphosis ( Holland, 2020 ). Download figure Open in new tab Figure 3: Larval AP patterning genes display regionalized expression pattern along adult guts in bilaterian invertebrates A ) Left : qualitative “heatmap” showing the expression pattern (red, high; blue, low) of conserved gut patterning markers along the sea urchin larval gut; as per Annunziata et al., 2014 . Redrawn from the same publication. Blue rectangle, foregut, yellow rectangle, midgut; pink rectangle, hindgut. Right : heatmap showing the expression pattern (z-scores) of the same marker genes along the adult gut AP axis (this study). Genes (rows) are ordered according to R2E seriation. Blue, yellow, pink rectangles, segments inferred to correspond to the larval foregut, midgut, hindgut, respectively. Dashed lines link genes with shifts in AP expression patterns across datasets. Truncated links indicate genes that are not expressed in the adult dataset. 
B ) For each species, heatmap showing the expression pattern (z-scores) of all expressed Hox genes, along the gut AP axis. Genes (rows) are ordered according to the adult sea urchin reference sequence (highlighted in grey). Solid and graded rectangles under the heatmaps indicate segments previously assigned to block and gradient gut compartments, as defined in previous sections. Crucially, we further show that these same markers display similar AP expression patterns in the adult gut of our other ambulacrarian species Ptychodera flava (Pf, Figure 3B ), as well as the adult gut of the two chordate species, despite an increasing loss of resolving power in this branch. We show that this transcription factor signature is extremely well conserved in the adult gut of the protostome Platynereis dumerilii , hinting at a deep conservation of this signature (and possibly in turn, of its underlying early embryonic/larval patterning basis) at least up to the bilaterian stem. At the same time, our results suggest significant elaboration in the chordate branch. In addition to such remarkable conservation, we note that where there are differences in pattern across species, these often involve anterior gut markers (in Sp) shifting to the posterior or showing expression at anterior and posterior in other species. Conversely, some posterior gut markers (in Sp) shift to the anterior, or show anterior and posterior expression in other species. In other words, a subset of anteriormost or posteriormost gut markers, which would appear as having poor AP conservation, may be best understood at a more holistic pan-bilaterian level as “terminal” markers (see e.g. foxD , foxP , foxI , Figure 3B ), and be conserved in this role across life stages and species. 
In conclusion, we show a remarkable conservation of the embryonic/larval gut plan into the adult: adult bilaterian guts maintain or redeploy “embryonic-” and “larval” markers and do so in a way that parallels known embryonic or larval AP patterns of expression. To some extent, these results expand, at least for the gut tube, the applicability of these markers and question conceptions of embryonic patterning systems as transient or impermanent. Given that the gut tube of some of the species we consider above undergoes dramatic restructuring during metamorphosis, these results also bring forward new questions about the possible mechanisms and evolutionary constraints that would bring about the maintenance or redeployment of AP expression patterns across an impermanent patterning substrate. Regardless, we show that the AP pattern of expression of these markers (with the modification we document above and with frequent terminal shifts) is strongly conserved across bilaterians, and in fact even in the annelid worm Platynereis , hinting at a possible feature of the ancestral adult gut tube. Section 4: Unbiased analyses of regionalized gene expression along the adult gut in bilaterian lineages In an attempt to identify an adult gut AP signature conserved across bilaterians, we decided to map the expression pattern of all transcription factors along the AP axis of our adult bilaterian guts and see if we could identify a shared organisation across species. This strategy uniquely allows us to approach this question in an unbiased, systematic, and comprehensive way, within the limits of our comparative approach and gene orthology attributions. We identified all transcription factors within each species’ proteome by a protein domain scan referencing the AnimalTFDB database (see Materials and Methods ). 
The proteins we retrieved (proteins with transcription factor domains, which we here take as de facto “transcription factors”) were then summarised at the orthogroup level to allow between-species comparisons. To avoid discarding orthogroups with many-to-one correspondences, a “best ancestral orthologue” representative was selected among a species’ paralogues based on sequence similarity scores, as in recent literature (( Mantica et al., 2024 ); see Materials and Methods ). Of these transcription-factor orthogroups (i.e. orthogroups containing proteins classified as transcription factors; including manually curated Hox orthogroups), 356 were shared across all five bilaterian species, in line with the minimal transcription factors content estimated for the Protostome-Deuterostome Ancestor (216; ( Larroux et al., 2008 )). 277 out of these 356 transcription factors were expressed in all five gut datasets ( Figure 4A ). Download figure Open in new tab Figure 4: Unbiased analyses of regionalized gene expression along the adult gut in bilaterian lineages A ) Summary of the steps deployed to derive the final set of conserved, gut-expressed transcription factors (TFs) used for cross-species comparison. B ) Generalised Association Plot summarising the expression data of the 85 AP-associated TFs orthogroups across bilaterian gut segments. Top : heatmap of the Spearman’s Rank Correlation coefficients between all segments, regardless of species. Segments are ordered according to R2E seriation. Bottom Left : heatmap of the Spearman’s Rank Correlation coefficients between all 85 AP-associated TF orthogroups considered, ordered according to R2E seriation-guided hierarchical clustering. Bottom Right : heatmap showing the expression pattern (z-scores) of all TFs considered based on the segment (columns) and gene (rows) order defined above. Segments are color coded by approximate equivalent AP position as in the Legend provided. 
Solid and dashed green lines indicate qualitative assignment of major and minor groupings of gut segments based on correlation patterns and known anatomical position. Magenta lines identify gene modules. C) Summary of the 5 main modules identified, in their general AP order, with representative TF markers indicated. In bold, established gut patterning markers across the literature. D) For each species, heatmap showing the expression pattern (z-scores) of all representative TFs from each of the identified modules, along the gut AP axis. Magenta highlights: modules that appear to not match the expected expression pattern in a given species. Solid and graded rectangles under the heatmaps indicate segments previously assigned to block and gradient gut compartments, as defined in previous sections. Download figure Open in new tab Supp. Figure 4×1: R2E seriation of bilaterian adult gut segments based on the expression pattern of all conserved TFs A ) Summary of the steps deployed to derive the final set of conserved, gut-expressed transcription factors (TFs) used for cross-species comparison. For each species, heatmap of the Spearman’s Rank Correlation coefficients between segments, based on the expression of these same TFs. Segments are arranged according to R2E seriation, which matches AP position. B) Partial Generalised Association Plot summarising TF expression data across bilaterian gut segments. Top : heatmap of the Spearman’s Rank Correlation coefficients between all segments, regardless of species. Segments are ordered according to R2E seriation. Bottom : heatmap showing the expression pattern (z-scores) of all TFs considered. TFs (rows) are ordered according to R2E seriation-guided hierarchical clustering. Segments are color coded by approximate equivalent AP position, as indicated in A. 
Shaded areas indicate examples of genes that appear to still define segments at equivalent (anatomical) AP positions (blue shade: anterior segments, purple shade: hindguts, yellow shade: intestinal segments). Solid green line indicates qualitative grouping of gut segments based on correlation patterns and known anatomical position Download figure Open in new tab Supp. Figure 4×2: PCA overview of conserved TF expression across bilaterian adult gut segments A ) Distribution of all gut segments (all species) across the two main Principal Components (PCs; PC1, PC2) and based on the full set of conserved, gut-expressed Transcription Factors (TFs). Segments are color coded by approximate equivalent AP position as in the legend provided on the right. Dashed vertical line indicates main separation between clusters. Left: Plot indicating the proportion of variance explained by each PC (scree plot). Blue dashed line: proportion of variance that would be explained if all components had equal contribution. B) Summary table of the top TFs associated with sample separation across PC1. Right/Left red highlight of the contribution scores indicate whether TF expression is driving samples to the right/left of the PC plot, respectively. C) Same data as in the central panel of A, but with segments color-coded by relative level of expression of each of the main PC1 drivers (as in B) and other TFs of interest (bottom row). Red, high; blue, low. Dashed vertical line indicates main separation between clusters D) For each species, heatmap showing the expression pattern (z-scores) of the main drivers of separation across PC1. TFs (rows) are clustered according to hierarchical clustering. Solid and graded rectangles under the heatmaps indicate segments previously assigned to block and gradient gut compartments, as defined in previous sections. Download figure Open in new tab Supp. 
Figure 4×3: Cross-species SAMap mapping of gut segments A ) Heatmap of SAMap Mapping Scores between gut segments across species, based on the expression of all TF genes ( upper triangle , above the diagonal) or all non-TF genes ( lower triangle , below the diagonal). In the SAMap approach, all paralogues are included for 1-to-many orthogroups. We observe that R2E seriation of gut segment TF expression within each species orders them based on their actual anatomical location ( Supplementary Figure 4×1A ), whereas R2E seriation of gut segments across species does not ( Supplementary Figure 4×1B ). The same overall non-equivalence is seen in the grouping of samples across PCA space ( Supplementary Figure 4×2A ). Specifically, it appears that when considering all conserved expressed TFs across species, Pd hindgut segments group with bilaterian foreguts, and intestinal segments (especially of the two chordate species) do not necessarily cluster close to their expected AP equivalents in other species ( Supplementary Figure 4×1B , Supplementary Figure 4×2 ). In other words, beyond a pan-bilaterian subdivision that allows segments to be classified into “block compartments” (with Pd hindgut; gli2+ , znf521+ , zeb2+, six1+ ), and “gradient compartments” ( nr2a1 / hnf4a+, srebf+, zfp36l+, pdx1+, gata4+, Hox PG09+ ), we recover an overall high divergence (non-equivalence) of the AP organisation of shared transcription factors along adult guts. At the same time, we do observe a minority subset of transcription factors that do appear to define segments at equivalent (anatomical) AP positions ( Supplementary Figure 4×1B ). Orthogonal network-based approaches able to consider all TF and TF paralogues (SAMap, ( Tarashansky et al., 2021 )) recover finer AP matches on a pair-by-pair basis, yet similarly highlight an overall fragility of pan-bilaterian AP correspondences ( Supplementary Figure 4×3 , upper triangle). 
Observing that only a minority of TFs across bilaterian guts define the coordinates of the anatomical AP axis, we decided to isolate such TFs by modelling gene expression profiles with generalised additive models and identifying genes whose expression pattern is most associated with AP position (tradeSeq; ( Van den Berge et al., 2020 )). By reclustering all segments based on this refined subset of 85 TFs, segments do cluster by relative AP position, with overall much stronger cross-species concordance between anterior, middle, and posterior segments of the gradient compartment ( Figure 4B ). Overall, we are therefore able to decompose the common bilaterian AP axis into 5 (non-exhaustive) main gene sets (“modules”; Figure 4B , Figure 4C ). An “anterior (only)” module (module 1) characterised by known Hox genes PG01 and PG02, and which includes nkx2.3 , smad3 , and camta1 . This module groups all the segments anterior to the “transition sphincter”, and matches the domain identified as the 1st compartment (“block compartment”) of the shared bilaterian bipartite organisation of gene expression. An “intestinal/digestive” module (module 2) characterised by known ParaHox gene Pdx1/Xlox , Gata4 , Hnf4 , prdm1a , but also several novel potential markers ( sox7, myrf, e2f8 ). An “intermediate” module (module 3) generally expressed in more posterior segments, and notably characterised by nr5a2 and jun2 expression, shifted to the gills in Bf. A “posterior” module (module 4) characterised by an extremely limited set of members, and which are indeed just Hox PG08/09 and Hox PG11/13, as well as MafG (which is however already not conserved in Bf). This module groups all the posteriormost segments of all species. Note that Cdx could not be considered in this unbiased analysis (see Materials and Methods “Filtering and standard counts processing” ) but would also be another marker of this module as shown in previous figures (e.g. Figure 2 ). 
We also note a fifth module that we here call module “Ex” (for “ Ex ocrine”) due to its grouping of notable gut patterning transcription factors Ptf1, Hhex, and bhlha15/Mist, associated — in vertebrates — with pancreatic tip acinar cells ( Lichtenberg et al., 2018 ). This would represent a module clearly of key interest, overall conserved AP position, but variable position with respect to bilaterian gut compartments and the modules that characterise them. In Pd and Ao, it is detected in posterior segments of the block compartment (i.e. esophageal segments, including the vertebrate stomach; i.e. overlapping module 1 segments), in the other species it is detected at the anteriormost segments of the gradient compartment, i.e. overlapping with module 2 segments. Comparing the gene expression pattern of representatives of these modules confirms their validity as conserved bilaterian AP markers, while also identifying again significant elaboration within the chordates ( Figure 4D ). We critically note that module 2 is highly fragmented in the gut tube of clownfish (Ao, magenta outline) and is in big part represented instead by the oesophagus (“anteriorisation”). Similarly, we note a cephalochordate-specific “loss” of module 3 with a shift to the gills (Bf, magenta outline). Overall, we here define a conserved set of transcription factors that mark AP positions which we would consider to be homologous in adult bilaterian guts. Remarkably, the signature we identify, and which we summarise here in 5 main modules, appears to be conserved across hundreds of millions of years of evolution and despite the divergence of overall transcription factor expression patterns, through-gut anatomies, and dietary specialisation. We stress that this list of transcription factors is a conservative list of markers, not to be interpreted as precluding the existence of additional transcription factors with a conserved AP expression in these five bilaterian species. 
Specifically, such expression patterns may be conserved in paralogues that were here discarded when resolving many-to-one correspondences. Though such a loss of potentially informative transcription factors is inherent to comparative transcriptomic approaches ( Emms & Kelly, 2019 ; Mantica et al., 2024 ; Nehrt et al., 2011 ; Tarashansky et al., 2021 ), we note that it is here additionally complicated by the underlying non-established equivalence between gut segments. Critically, this prevents more refined orthologue selection criteria that also take into account the conservation of tissue expression pattern. We also continue to recover, especially at this cross-species level, an overall high transcriptional similarity between segments at the two ends of the through-gut. This pattern echoes our previous recovery, at the species level, of a shared “terminal” pattern of gene expression, a conservation of gene expression at either terminus, and ontogenetic inter-termini shifts of gene expression at least in sea urchin. At the pan-bilaterian level, the shared expression of terminal Hox genes may well be one of the few conserved features of bilaterian through-guts. Section 5: Common functions of bilaterian through-guts We repeat the analysis on non-transcription factor genes, selecting the top 2500 most variant genes out of a total of 5562 non-TF genes expressed in the through-gut of all 5 species. Critically, the main interpretation of gut segments based on these other (functional/structural) genes, at the cross-species level, is one where anterior functions/structures are distinct from hepatic and anterior-intestine segments, but where posterior segments have highly variable affinities across species ( Figure 5A and 5B ). In this regard, the hindgut of the protostome Pd is not an entity distinct from anterior through-gut segments (if only in space). 
This is also the case for Pf hindgut segments, a deuterostome, indicating that observed terminal equivalences may not necessarily directly relate to the embryonic origin of these segments. Cross-species comparison based on SAMap highlights cross- or U-shaped alignments centered on the hepatic/anterior intestinal segments ( Supp Figure 4×3 , lower triangle) indicating an even lower AP concordance between segments of different species than that instead highlighted by TF expression. Here again, through-gut termini (anterior and posterior) would in many cases be considered equivalent matches across species. Download figure Open in new tab Figure 5: Analysis of adult bilaterian gut segments based on non-TF gene expression A) Heatmap of the Spearman’s Rank Correlation coefficients between all gut segments, regardless of species, based on the full set of conserved, gut-expressed non-Transcription Factors. Segments are ordered according to R2E seriation. B) Distribution of all gut segments (all species) across the two main Principal Components (PCs; PC1, PC2) based on the same set of genes. Segments are color coded by approximate equivalent AP position as in Legend. Download figure Open in new tab Supp. Figure 5×1: Model-based Gene Set Analysis of non-TFs expressed across adult bilaterian gut segments A ) Summary results of enriched Gene Ontology pathways across all gut-expressed non-Transcription Factor genes ( Left ) and among the top 2500 most variant subset of them ( Right ). Pathways names in bold and highlighted in yellow have their expression pattern plotted in B. “in/tot”: ratio between the number of genes of a given pathway present in the set considered, and the total number of genes belonging to that pathway; “estimate”: MGSA score. B) For each species, heatmap showing the expression pattern (z-scores) of all expressed genes belonging to the GO pathway of interest. Genes (rows) are clustered according to hierarchical clustering. 
Segments (columns) are ordered according to AP position. Solid and graded rectangles under the heatmaps indicate segments previously assigned to block and gradient gut compartments, as defined in previous sections. Not surprisingly, we find that bilaterian through-guts can be summarised as sites of protein synthesis and secretion (translation, protein transport, intracellular protein transport), lipid transport, and fatty acid, carbohydrate, and amino acid metabolism ( Supp Figure 5×1A ). We find that many of these functions are highly localised within the AP length of the gut of each species, and localised to comparable AP positions across species ( Supp Figure 5×1B ). We note for example that, in all bilaterians considered, translation functions are consistently localised to the first segments of the gradient compartment, likely reflecting an AP constraint in the site of digestive enzyme synthesis/secretion. In Ao, this function is correspondingly mainly localised to the liver, which releases its enzymes in these same segments. Fatty acid metabolism is also highlighted as a conserved function enriched in the anterior portion of the gradient compartment in all bilaterian guts considered. At the same time, significant re-elaboration (shifts) and losses of functions can be seen even just within the five species sampled, reflecting not only the overall poor conservation of AP localisation of gut functions but also the remarkable versatility in how these functions are spatially deployed. We highlight the case of proton transmembrane transport, related to the establishment of acidic or alkaline compartments across bilaterian guts ( Stumpp et al., 2015 ). Accordingly, the expression of V-type ATPases is in most species enriched in anterior segments of the gradient compartment, but in Ao is instead shifted to the posterior intestine (likely representing lysosomal functions). 
Such a loss of anterior intestinal V-type ATPase function could possibly reflect the unique gnathostome innovation of the stomach ( Castro et al., 2012 ; Koelz, 1992 ; Stumpp et al., 2015 ), the takeover of acidification functions by this more anterior compartment, and a consequent relaxation of pH regulation needs in the gradient compartment compared to stomach-less species. Section 6: Characterisation of bilaterian gut modules We turn to a more in-depth characterisation of the modules we identified based on TF expression patterns, in an attempt not only to build a more complete picture on the markers that define them, but also to identify functions that may be conserved in their association with homologous segments rather than in their relative AP position. Critically, our module-based interpretative framework allows us to impute shared segment identities across species, and therefore to apply supervised dimensionality reduction approaches such as Partial Least Squares - Discriminant Analysis (sPLS-DA, ( Rohart et al., 2017 )) to identify their discriminating markers and/or expand the signatures beyond TFs alone. Module 1/“cilia” Module 1 corresponds to segments that are consistently located at the anterior of the gut tube of all bilaterian species considered, and that in our bipartite interpretative lens represents the anterior, Hox positive, “block” compartment. We therefore impute a shared identity to all of these segments and apply sPLS-DA to find discriminating markers ( Figure 6aA ). Among the highest scoring markers we note, in addition to anterior Hox genes and more SMAD signalling components, a dominant representation of Hedgehog signalling components ( patched 2 , smoothened , but also GLI family zinc finger 2a ) and primary cilia or cilia/microtubule-related genes (gamma tubulin complex associated protein genes, centrosomal protein 83 , testis associated actin remodelling kinase ). 
Accordingly, while the functional interpretation of this anteriormost module as a ciliated, filtering module would be intuitive, our analysis highlights hedgehog signalling (and therefore primary cilia) as the most distinctive feature of this module. Given the fundamental role played by hedgehog signalling during embryonic foregut development ( Litingtung et al., 1998 ), it is remarkable that we recover once again embryonic signatures (now in the form of signalling pathways) in adult guts, and that we do so in the form of pan-bilaterian conserved, AP-conserved patterns. We also note that other lesser-known markers of this module, whose pan-bilaterian conservation would highlight as of particular relevance, such as Sin3a , have indeed been linked to profound, targeted developmental anomalies within the foregut ( Yao et al., 2017 ). Download figure Open in new tab Figure 6a: Module 1 and transition sPLS-DA A ) sPLS-DA of bilaterian gut segments marked by Module 1 TFs. Left: illustration of the segments to be discriminated (Module 1 segments). Right: separation of segments according to sPLS-DA discriminant genes. Bottom : For each species, heatmap showing the expression pattern (z-scores) of the top discriminant genes identified through sPLS-DA. Genes (rows) are clustered according to hierarchical clustering. Segments (columns) are ordered according to AP position. Solid and graded rectangles under the heatmaps indicate segments previously assigned to block and gradient gut compartments, as defined in previous sections. Gene names followed by an asterisk constitute the optimal sufficient discriminant set. Gene names in color are TFs. B ) sPLS-DA of bilaterian gut segments marked by equivalent anatomical positions (and Module 2 TFs in all species except Ao). Left: illustration of the segments to be discriminated (“transition” segments, all anteriormost segments of the gradient compartment; yellow highlight). 
Right: separation of segments according to sPLS-DA discriminant genes. Bottom : For each species, heatmap showing the expression pattern (z-scores) of the top discriminant genes identified through sPLS-DA. Genes (rows) are clustered according to hierarchical clustering. Segments (columns) are ordered according to AP position. Solid and graded rectangles under the heatmaps indicate segments previously assigned to block and gradient gut compartments, as defined in previous sections. Gene names followed by an asterisk constitute the optimal sufficient discriminant set. Gene names in color are TFs. Download figure Open in new tab Supplementary Figure 6×1: Module 2 sPLS-DA A ) sPLS-DA of bilaterian gut segments marked by Module 2 TFs. Left: illustration of the segments to be discriminated (Module 2 segments). Right: separation of segments according to sPLS-DA discriminant genes. Bottom : For each species, heatmap showing the expression pattern (z-scores) of the top discriminant genes identified through sPLS-DA. Genes (rows) are clustered according to hierarchical clustering. Segments (columns) are ordered according to AP position. Solid and graded rectangles under the heatmaps indicate segments previously assigned to block and gradient gut compartments, as defined in previous sections. Gene names followed by an asterisk constitute the optimal sufficient discriminant set. Gene names in color are TFs. Module 2/“digestive” In our reconstructed pan-bilaterian AP signature Module 2 defines a domain that is at the anterior of the gradient compartment of bilaterian guts (the invertebrate “stomach”), and which in vertebrates seems to be fragmented across the oesophagus, stomach, and anterior intestine ( Figure 4D ). 
Expanding the signature of Module 2, by performing sPLS-DA with clownfish oesophagus rather than anterior intestinal segments, identifies several factors also shared with the vertebrate stomach and the liver, mostly related to protein synthesis, but also amino acid metabolism, and ether lipid synthesis. These would represent strong candidates for true module-associated functions, yet the fragmentation of this module across multiple segments in Ao is likely confounding this analysis (which for this reason we relegate to Supplementary Figure 6×1 ). We note instead that the vertebrate (Ao) anterior intestine consistently appears more similar to more posterior invertebrate segments (Module 3; Supplementary Figure 4×3 ), and yet ends up abutting the same equivalent domain of other species’ Module 2 segments (i.e. abutting Module 1). We therefore wondered whether we could identify a molecular signature common to such an equivalent anatomical position and accordingly performed sPLS-DA by coercing vertebrate pyloric caeca into sharing an identity with invertebrate Module 2 segments. Notably, the resulting (positional) markers of such transition between equivalent AP compartments but non-equivalent modules do not include TFs. Most interestingly, we find that a notable subset of these positional markers is in fact expressed in the clownfish liver, or in both the liver and the anterior intestine ( Figure 6aB ), thus reflecting the known ontogeny of this organ in vertebrates. 
Markers of this position include many mitochondrial and non-mitochondrial genes generally consistent with a conserved role in the metabolism of sterols and amino acids ( insulin induced gene 1, sterol carrier protein 2a, ornithine aminotransferase, sarcosine dehydrogenase ), including what would be traditionally classified as stereotypical “liver” function markers ( glycine N−methyltransferase ), and consistent with the previously described enrichment of translation and fatty acid metabolism at this location. Module 3/“sensor” We analyse Module 3, which overall characterised through-gut segments of the “gradient compartment” generally more posterior than those characterised by Module 2, in all species ( Figure 4B ). Very surprisingly, the module is absent from the amphioxus gut, and localises instead to the gill. We use sPLS-DA to identify common discriminant markers of these segments, which we consider homologous (therefore, including Bf gills), and identify even more genes with likely conserved roles as metabolic integrators and regulators ( Figure 6bA ). These include the glucose sensor mlxip / MondoA , SREBF pathway regulator in golgi 1 Spring1 , a progestin and adipoQ receptor family member, but also ketohexokinase, as well as numerous other transcription factors (foxO3, ncoa2, pknox1.1). All are associated with the segments with Hox6/7 expression. Download figure Open in new tab Figure 6b: Module 3 and Module 4 sPLS-DA A ) sPLS-DA of bilaterian gut segments marked by Module 3 TFs. Left: illustration of the segments to be discriminated (Module 3 segments). Right: separation of segments according to sPLS-DA discriminant genes. Bottom : For each species, heatmap showing the expression pattern (z-scores) of the top discriminant genes identified through sPLS-DA. Genes (rows) are clustered according to hierarchical clustering. Segments (columns) are ordered according to AP position. 
Solid and graded rectangles under the heatmaps indicate segments previously assigned to block and gradient gut compartments, as defined in previous sections. Gene names followed by an asterisk constitute the optimal sufficient discriminant set. Gene names in color are TFs. B) sPLS-DA of the most posterior bilaterian gut segments (also marked by Module 4 TFs). Left: illustration of the segments to be discriminated (Module 4 segments). Right: separation of segments according to sPLS-DA discriminant genes. Bottom : For each species, heatmap showing the expression pattern (z-scores) of the top discriminant genes identified through sPLS-DA. Genes (rows) are clustered according to hierarchical clustering. Segments (columns) are ordered according to AP position. Solid and graded rectangles under the heatmaps indicate segments previously assigned to block and gradient gut compartments, as defined in previous sections. Gene names followed by an asterisk constitute the optimal sufficient discriminant set. Gene names in color are TFs. We attempted to assign a more precise function (or clear vertebrate reference) to this cluster, and yet the literature on these markers (first and foremost, Nr5a2) consistently recovers associations with both liver and pancreatic development, and adult endocrine functions ( Hale et al., 2014 ; Martin Vázquez et al., 2022 ; Nissim et al., 2016 ). We also note that the conserved localisation of this module posterior to the Pdx boundary and within the anterior of the Cdx domain, the endocrine and pancreatic association of Nr5a2 in vertebrates, the overall mixed metabolic-endocrine signature of other conserved markers we recover, and the extremely restricted expression of this module in the adult sea urchin, would suggest a most likely correspondent in a recently-described subpopulation of “endocrine pancreas” cells known to localise posteriorly to the pyloric sphincter in the larval sea urchin ( Paganos et al., 2022 ). 
We also note that Nr5a2 has been critically identified as a key regional marker along the Ciona intestinalis juvenile gut, again with localised expression in the Cdx+ region posterior to the Pdx boundary ( Iguchi, Usui, et al., 2023 ; Nakayama et al., 2016 ; Nakayama & Ogasawara, 2017 ). Remarkably, this posterior expression (but not a more anterior one) does not appear to be constitutive in the gut ( Iguchi, Usui, et al., 2023 ; Nakayama & Ogasawara, 2017 ), hinting again at a “responsive” function of the posterior regions of the gut. Overall, our results strongly support the deep conservation of this gut function, not only as one of the main evolutionary-conserved pan-bilaterian gut modules, but also as one with a generally conserved relative antero-posterior position. It puts forward a set of markers that may in fact be ancestral components of the bilaterian gastrointestinal endocrine system, and hints at the type of nutritive stimuli it may have been responsive to. We suspect that loss in Bf, and gill segment expression, may be explained by the amphioxus-specific Hatschek’s pit, involved in endocrine regulation ( Sahlin & Olsson, 1986 ). Module 4/hindgut One of the most striking observations about the modules we identify is the extreme scarcity of shared markers of hindgut segments, even as a result of -omics level investigations. Such a poor separation of hindgut segments is also noted in unsupervised PCA, indeed known to struggle to recover axes of variance driven by very small gene numbers ( Supplementary Figure 4×2 ; across all principal components investigated; ( Lenz et al., 2016 )). 
Not only do adult bilaterian hindguts only share the expression of 3 transcription factor orthogroups (when including Cdx), these are the three extremely well known markers of the embryonic hindgut ( Annunziata et al., 2019 ; Arenas-Mena et al., 2006 ; Dai et al., 2024 ; Gill et al., 2024 ; Hejnol & Martín-Durán, 2015 ; Illig et al., 2013 ; Nowotschin et al., 2019 ; Zhong et al., 2020 ). We wondered whether a supervised dimensionality reduction analysis could possibly expand such a signature. Accordingly, we performed sPLS-DA coercing all posterior-most segments to belong to shared identity, here based on their shared posteriormost anatomical position ( Figure 6bB ). Strikingly, sPLS-DA identifies the sole Hox PG011-15 as the optimal gene set sufficient to discriminate the hindgut from other segments. Within the expanded sPLS-DA signature (of genes that mark the hindgut but not necessarily exclusively, Figure 6bB ), we only recover one other classic transcription factor, foxD. FoxD is indeed another extremely well characterised regulator of hindgut function in vertebrates ( Wang et al., 2018 ), a key component of the larval hindgut gene regulatory network of sea urchin ( Voronov et al., 2024 ), is known to be expressed in the hindgut endoderm in the hemichordate Saccoglossus kowalevskii ( Fritzenwanker et al., 2014 ) and in amphioxus ( Aldea et al., 2019 ; Yu et al., 2002 ), and is generally associated with the early development of deuterostome hindguts (see ( Hejnol & Martín-Durán, 2015 ), and references within). We here also recover FoxD in the posterior segments of a protostome species (as in the larval stages of others, see e.g. ( Janssen et al., 2022 )). Yet, based on both the expression patterns we recover here (e.g. Pd, Sp), and the ontogenetic shift described for Sp in Figure 3A , we would classify this TF as a “terminal” marker rather than a specific posterior marker at the pan-bilaterian level. 
We therefore confirm that posterior Hox and posterior ParaHox genes may be the only pan-bilaterian markers of the through-gut posterior. An extended set of bilaterian hindgut markers may have to be sought in the conservation (or convergence) of non-TF expression patterns. Within the expanded sPLS-DA hindgut signature, we notably recover amnionless , cubilin , cathepsin C , glmp/Ncu-g1 , slc35f6 , vps33a , many of which may serve as broad markers of the bilaterian hindgut. We note that many of these components belong to the cubam/endocytosis system. In teleosts, posterior expression of amnionless/cubilin has been shown to correspond for the most part to a specialised class of enterocytes responsible for direct protein uptake by endocytosis (“lysosome rich enterocytes”, ( Childers et al., 2025 ; Park et al., 2019 ; Wen et al., 2021 )). This same function/cell type is also believed to be present in invertebrate chordates ( Nakayama et al., 2019 ; Yonge, 1937 ) and cubilin/amnionless has also been recently characterised as localised to the hindgut of Ciona intestinalis (Iguchi, Nakayama, et al., 2023). Our results suggest that this same cell type, or at least the posterior presence of an endocytic intestinal function, is a deeply conserved through-gut feature, and in fact may be the only conserved function of the terminal section of bilaterian guts. The conservation of hindgut regionalisation of such components across body plans that had their last common ancestor hundreds of millions of years ago suggests that the (posterior) regionalisation of endocytic activity may have been a key feature of through-gut function in the bilaterian ancestor. Still, we note that these functions are not exclusive to, nor necessarily peaking in, the posterior-most segment. We consistently fail to detect conserved bilaterian features exclusive to bilaterian posterior-most segments, beyond anatomical position and the expression of posterior Hox and ParaHox genes. 
Summary and conclusion To better understand how to interpret bilaterian through-guts, we collected anteroposteriorly-ordered transcriptome data of the adult gut tube of five phylogenetically informative species: an annelid, a sea urchin, a hemichordate, a cephalochordate, and a vertebrate. Overall, our cross-species comparison highlights that the highly divergent and heterogeneous gene expression patterns of adult guts across species appear to develop within a conserved, bipartite global gene expression structure, and still retain a number of modules with overall conserved relative AP position (summarised in Figure 7A and detailed in Supp Figure 7×1 ). Crucially, such a bipartite global organisation matches a conserved, bipartite, adult expression of Hox genes. Download figure Open in new tab Figure 7: Summary and conclusion figure A ) Summary model of the conserved elements of the adult bilaterian through-gut, and their AP distribution, as identified in this work. Modules are colour coded. Slashed rectangle pictogram (blue, topmost): boundary between “block” and “gradient” compartments (i.e. “transition sphincter”) as defined in the main body of text. B ) Larval bilaterian through-guts. A correspondence between larval and adult AP gut markers (dark arrow) was identified for sea urchin (Sp). The AP patterning of adult bilaterian guts may in turn be a conserved feature of larval through-guts (light arrow) C ) Reconstruction (dark arrow) of the possible configuration of the ancestral through-gut configuration, which gave rise to the diversification of adult guts seen in extant species (light arrow to panel A). Our interpretative lens would further provide an investigative angle to approach the relationship between the ancestral through-gut configuration and that of its larva and the larvae of extant species (light arrows to and from panel B). A: anterior, P: posterior. 
Intriguingly, the modules found to conserve relative AP information across species are largely represented by well-studied embryonic/larval markers. Hand-in-hand with this observation is our finding that the AP order of expression of classic, bilaterian-conserved, AP embryonic markers is also a feature of adult guts, to the point that such TFs may well be considered adult AP markers too. Far from the phylotypic stage, adult bilaterian through-guts thus appear to maintain an open window to early embryonic/larval patterning systems ( Figure 7B ). With the specific case of the sea urchin, this temporal continuity is clearly in contrast with the sharp discontinuity of the organism’s ontogeny, and the material impermanence of the embryonic/larval gut tube itself, precipitated by metamorphosis ( Holland, 2020 ). These markers must therefore be maintained across ontogeny or re-deployed in the adult gut: they indeed are, just as their relative AP pattern of expression. To this point, studies that have most recently directly addressed the bridge between gene expression patterns before and after metamorphosis, are indeed cementing the re-deployment of embryonic and larval molecular signatures into juvenile life as a feature of most cell types, including those of the gut (( Paganos et al., 2025 ), Paracentrotus lividus ). We show here that not only are these genes expressed across the metamorphic gap, but they are so in an analogous AP order that allows direct correspondences between the domains marked at each life stage. Furthermore, we show that this order is evolutionarily conserved, allowing us to further draw equivalent correspondences across adult guts of different species. Our results are particularly interesting in the context of the ancient discussion on the origin of larvae and the evolution of metamorphosis in bilaterians, a debate that has animated the literature for more than a century ( Gee, 1996 ). 
Already Hatschek ( Hatschek, 1888 ) had proposed that the adult form was a secondary acquisition in many groups, while Garstang ( Garstang, 1928 ) famously reversed the idea, proposing that larvae could be more recent than adults. Later, the work of Nielsen and others supported the view that a biphasic life cycle was probably ancestral but up to now, no decisive argument in favor of this view has been brought by Evo-Devo studies ( Laudet, 2011 ). Our findings add new molecular and spatial arguments in favor of this idea. The fact that embryonic patterning genes are redeployed in adult guts and maintain similar antero-posterior positioning strongly argues for a developmental continuity across metamorphosis, even when the morphology changes dramatically. It suggests that metamorphosis does not erase the early program, but rather reuses it within a new context. In that sense, metamorphosis could be seen not as a rupture, but as a reconfiguration of a conserved regulatory logic, inherited from the common bilaterian ancestor ( Laudet, 2011 ). Though the adult display of such expression patterns could intuitively be explained as a mere leftover of a deeply constrained, conserved, and ancestral embryonic gut patterning system, the conservation of their adult expression in all species considered, across hundreds of millions of years of evolution, additionally points towards a key role played by these genes in the adult . That is, and reversing more intuitive embryo-based perspectives, could embryonic gut patterning genes be genes with key adult functions as regulators of key adult endodermal functions, gut “terminal selectors”? Certainly, these genes are expressed in adult guts spanning a variety of architectures and dietary specialisations, and they are clearly redeployed even in cases of ontogenetic substrate discontinuity with their patterned embryonic correspondent. 
Much is speculative about the configuration of the gut of the bilaterian ancestor, and even more so about its relationship with that of its embryonic form. We here add an additional layer to the question by demonstrating that the gene expression patterns of adult and embryonic/larval guts have a non-trivial continuity, implicating the adult digestive physiology and ecology of bilaterian ancestors among the elements informing the AP patterning mechanisms of the bilaterian gut. To what extent does the permanence and function of these genes in adult bilaterian guts affect the selective constraints on the patterning processes of their embryonic origin? Incidentally, this continuity between adult and embryonic gene expression patterns, at least for the markers we identify here, suggests that the strong degree of conservation of this AP system across adult bilaterian through-guts (and most strongly, in the three non-chordate species we considered) may in turn mirror a conservation of the pattern at the embryonic stages of these very species. We can only show such an actual correspondence based on published sea urchin larval data ( Annunziata et al., 2014 ): dedicated characterisations of the AP pattern of expression in the larval or embryonic forms of the other species we consider will reveal whether such likely conservation ( Boyle et al., 2014 ) holds true. Though we focused on establishing a comparative basis among bilaterian guts, our cross-species comparison in fact highlights, above all, the extreme heterogeneity of gene expression in adult guts of different species, of course reflecting the remarkable variety of gut forms and functions across phyla, species and diets. At the pan-bilaterian level, gut segments at equivalent AP positions generally cluster poorly, a common theme being recurring matches and equivalences between anterior and posterior segments across species or across ontogeny. 
We reinterpret many species-level “posterior” or “anterior” gut markers as belonging to a more general “terminal” repertoire at the pan-bilaterian level. Regardless, such a remarkably flexible deployment of genes and functions invariably appears to be organised across a two-compartment scaffold that is comparable across species. We find the most resonant echo of such a property in the concept of the “eigengene” as a patterning feature, as elaborated in ( Kerstjens et al., 2024 ). That is, we see a cross-species conservation of global AP spatial expression structure , rather than relative AP localisation of most of the individual genes themselves. In the case of adult guts, this bipartite global organisation is underlaid by a bipartite deployment of Hox genes, a deployment pattern observed in the embryos of model vertebrate species ( Beck et al., 2000 ; Kawazoe et al., 2002 ; Sekimoto et al., 1998 ) but which we here extend to the adult, and generalise across bilaterians. Such a bipartite deployment of Hox genes would therefore also be the most likely condition of the adult gut of the bilaterian ancestor. Among the overall heterogeneity of individual gene expression patterns, we were able to extract conserved sets of TFs that do nonetheless appear to conserve relative AP expression across species, and which we initially group into five modules. Our analysis suggests that if cross-species correspondences are to be found at a more granular level than that offered by “block” and “gradient” compartments, these five modules could be useful anchoring points and cross-species landmarks. 
The identification of conserved AP patterns of expression across extremely divergent guts and across hundreds of millions of years of evolution further identifies such modules as key features of bilaterian guts and suggests that the relative AP sequence recovered in the three non-chordate invertebrate species may have been the most likely configuration of the ancestral through-gut ( Figure 7C ). We highlight for example Module 3 as a putative “sensory” neuro/endocrine function possibly relating to bilaterian pancreatic functions, and the overall paucity of markers (Module 4) able to support the hindgut at the pan-bilaterian level. AP shifts of these modules with respect to the fixed compartments defined by Hox genes would in turn be at the origin of evolutionary innovations. We see such shifts to be characteristic of the chordate branch. Certainly, our analysis identifies each of these modules, and their markers, as prime leads and focal points for future investigations, and identifies the sphincter marking the boundary between the two Hox compartments as a key anchoring point for cross species comparisons, and for gut Eco-Evo-Devo in general. Notably, our investigation of expression patterns of species at key phylogenetic positions allows the preliminary reconstruction of evolutionary trends that specifically highlight the vertebrate gut as a highly divergent gut architecture. Indeed, we consistently note a strong conservation of AP patterns of expression between the adult gut of Platynereis and of the two ambulacrarian species and increasing degrees of reorganisation in the chordate branch. This is even more noticeable for the vertebrate Ao, where modules that are otherwise solidly AP-localised in other species appear highly fragmented. 
By identifying the Hox compartment boundary as a key transitional point of bilaterian gut organisation, our interpretative framework allows us for the first time to put forward evolutionary hypotheses formulated in terms of shifts and rearrangements with respect to these invariant features. That is, in terms of AP shifts of modules with respect to a fixed Hox compartmentalisation or, vice versa, in terms of shift of Hox compartments and their boundary with respect to the fixed AP measure of the adult gut. Of note, in Ao we see an anteriorisation of module 2 ahead of the Hox transition boundary, matched with an anterior shift of the posterior paraHox (where Cdx expression comes to abut the anteriormost boundary of the gradient compartment). Such a coordinated anteriorisation event with respect to the Hox boundary would therefore be consistent with the known re-configuration and expansion of the anterior domain known to have marked the evolution of the vertebrate body plan ( Aldea et al., 2019 ; Onai et al., 2015 ). While of course such models would need to be verified, we here provide at least a first attempt at providing a reference system to trace such evolutionary scenarios for the vertebrate gut. Regardless of the evolutionary mechanisms, our model would put forward a fundamental non-equivalence between the vertebrate stomach and the invertebrate “stomach”, in the sense that the former is a structure originating in a different compartment and represented by a different module combination than that of the latter. It is intriguing to speculate that such a rearrangement could be at the origin of the gastric stomach as a gnathostome innovation ( Castro et al., 2012 ; Koelz, 1992 ; Weinrauch et al., 2025 ). 
We put forward this work and data not only because it provides a still rare resource of anteroposterior-resolved whole-transcriptome data of adult guts across organisms at key phylogenetic positions (joining most recent precious efforts, ( Buchon et al., 2013 ; Dai et al., 2024 ; Dutta et al., 2015 ; Fang et al., 2006 ; Gerdol et al., 2024 ; Lickwar et al., 2017 ; Lv et al., 2024 ; Marianes & Spradling, 2013 ; Matsubara et al., 2021 ; Mayeur et al., 2024 ; Pan et al., 2024 ; Sudhakaran & Peter, 2025 ; Wang et al., 2010 ; Zhang et al., 2023 ; Zhu et al., 2024 ; Zwick et al., 2024 )), but also because discriminating between derived and conserved features of such an important and heterogeneous organ as the through-gut remains central to almost all Eco, Evo, and/or Devo investigations that touch on this organ system. We here provide a hypothesis for the AP patterning system of the through-gut ancestor and its possible functions and also propose an interpretative lens we have found to best reflect the organisation of extant bilaterian guts. We believe that the application of such an interpretative lens, and the testing of this model against open questions of bilaterian and non-bilaterian through-gut biology will provide rich insight across all three fields of Eco-Evo-Devo. Download figure Open in new tab Supp. Figure 7×1: Summary organisation of each species gut tube A) Summary of the AP arrangement of compartments, modules, Hox and paraHox genes, and other common functions (red segments) in the adult through-gut of each of the five bilaterian species investigated. B) Summary model of the likely ancestral configuration of the adult bilaterian through-gut, based on the patterns observed in extant species. 
Materials and Methods Download figure Open in new tab Supp Figure 1×1: Dissection of the gastrointestinal tract in the 5 species considered, and segment collection For each species, representative pictures of the dissection process and subsectioning criteria to obtain the final gut segments as illustrated in Figure 1 . A, anterior; P, posterior. Dashed lines with scissors, dissection boundary. Segments are numbered according to AP position, matching labels in Figure 1 . First row : clownfish gut dissection. Second row : amphioxus gut dissection. Third row : acorn worm sections. Fourth row : sea urchin gut dissection. Fifth row : Platynereis gut dissection. Download figure Open in new tab Supp. Figure 1×2: Overview graphical summary of counts processing pipeline. Animal Rearing Licences/ethics approval/facility/ details of couples used Clownfish were reared under licence number 21-04-1658 issued from Academia Sinica’s Institutional Animal Care and Use Committee (IACUC) to the Marine Eco-Evo-Devo Unit at the Linhai Marine Research Station. Experiments (dissections and sample collection) were performed within the provisions of the same licence. Rearing and sample collection of invertebrate species ( Branchiostoma floridae , Strongylocentrotus purpuratus , Ptychodera flava , and Platynereis dumerilii ) is exempt from IACUC oversight, as per institutional policy. Animal Rearing methods Amphiprion ocellaris Young adult A. ocellaris anemonefish were bought from a commercial anemonefish farm (S.T Biotechnology Inc., Changhua County, Taiwan) and reared under standard conditions analogous to those described in ( Roux et al., 2021 ). Specifically, young adults were housed in a 70L tank in recirculating natural seawater under a 15h:9h day-night photoperiod, at 28°C. Fish were fed thrice daily either with dry pellets (Hikari® Premium Megabite; Kyorin Food Industries, Ltd) or with fresh seafood. 
Fish were not fed on the day of collection to minimise gut contents and possible RNA sample contamination. Branchiostoma floridae Amphioxus ( Branchiostoma floridae ) adults were originally collected from Old Tampa Bay (Florida, USA) and subsequently transported to the Institute of Cellular and Organismic Biology (ICOB), Academia Sinica, Taiwan, for laboratory rearing. Animals were maintained in plastic culture boxes supplied with natural habitat sand and aerated with air pumps. They were fed a mixed algal diet consisting of Isochrysis galbana (Pingtung, Taiwan), Tetraselmis chuii (Pingtung, Taiwan), Rhodomonas lens (USA), and Rhodomonas sp. (Japan). The rearing protocols were adapted from ( Yu & Holland, 2009 ) and ( Yong et al., 2019 ). Ptychodera flava Adult Ptychodera flava acorn worms were collected from intertidal ridge of Chito, Penghu, Taiwan, and kept in aquaria as previously described ( Lin et al., 2016 ). Strongylocentrotus purpuratus Adult Strongylocentrotus purpuratus were provided by Pete Halmay and Amro Hamdoun (Scripps Institution of Oceanography, University of California, San Diego). Animals were maintained at 15°C and fed a diet of kelp (kombu). Platynereis dumerilii Platynereis dumerilii belonged to the “Heidelberg” strain originating from the Mediterranean Sea, and were cultured at the Institute of Cellular and Organismic Biology (ICOB), Academia Sinica, as described in ( Kuehn et al., 2019 ). The animals were maintained under a light/dark photoperiod of 16:8 hours with 8 days of simulated moonlight every 28 days and were checked for death and premature maturation three times per week. Premature worms were separated into male or female maturation bowls. 
The worms were fed three times a week with a varied diet consisting of spinach (spinach florets; Sin Mei company, Changhua County), algae ( Tetraselmis chui ; Algae-Supply company, Taitung), spirulina (Omega®; Golden Prawn Enterprise Co., Ltd., Kaohsiung), and fish food (Tetra Bits Complete; Tetra GmbH, Germany). 20 mL of food were given to each box each day. Natural seawater used for culturing was filtered through 1 μm, 5 μm and 0.22 μm in the lab. Dissections and sample collection A summary illustration of the dissection process for each organism is provided in Supp.M&M Figure 1 . Amphiprion ocellaris Three A. ocellaris young adults at best health were each collected from the rearing tank and immediately euthanised by transfer to a cold bath of overdosed tricaine methanesulfonate (MS-222, ethyl 3-aminobenzoate methanesulfonate salt, tricaine mesylate; [Merck/Supelco CAT#A5040, 200 mg/L] dissolved in ice-cold seawater). To guarantee tissue freshness and to try to prevent the establishment of artefactual transcriptional responses, each new fish was collected only after full dissection of the previous one, and tissues were kept covered by ice-cold seawater throughout the dissection. For dissection, each fish was pinned left-side down to an ice-cold dissection mat, through the eye and through the vertebrae posterior to the trunk bar. After removing the operculum, a lateral window was cut-out to expose the visceral cavity. The cavity was rinsed and filled with ice-cold seawater, and the liver was collected by severing the duct connecting it to the anterior intestine (usually best accessible from the left side). The entire digestive tract was then excised by cutting around the anal opening on one end, and pulling on the gill arches at the other. The digestive tube was then unfolded by carefully tearing apart the tissue between intestinal folds and around the anterior intestine. 
After trimming away the gill arches (anterior), any carry-over anal dermis (posterior), as well as all contaminating tissues, the digestive tract was further subdivided into 6 segments defined as follows (anterior to posterior): oesophagus (up to stomach sphincter); stomach (anatomically distinct); pyloric caeca (anatomically distinct); anterior intestine (up to first noticeable constriction and change in opaqueness; the middle intestine was usually transparent); middle intestine (up to next noticeable constriction); posterior intestine. Note that the gallbladder, attaching to the anterior intestine segment, was preemptively punctured to empty it of its contents. Also note that the pancreas could not be distinguished/dissected as a separate tissue and likely remained associated with the anterior and mid intestinal segments. Each newly-obtained segment was transferred to a dedicated sterile 2 mL microcentrifuge tube filled with 750 μL ice-cold Trizol (TRI Reagent; Merck/Sigma-Aldrich CAT#T9424) containing three autoclaved stainless steel beads (EBL Biotechnology CAT#SB2006), and kept on ice until the end of the dissection (less than 15 min total for each set). After each set of dissections, samples were homogenised by mechanical agitation using a vibrating bead mill (TissueLyser II, Qiagen CAT#85300, RRID:SCR_018623; 3 min, 30 Hz, room temperature). Homogenised sample lysates were stored at −80 °C overnight until RNA extraction the following day. Branchiostoma floridae Adult amphioxus B. floridae , each of 2.5-4 cm in length, were anaesthetized using MS-222 (Merck/Supelco CAT#A5040; 160 ppm in filtered seawater, adjusted to pH 7.5-8.0) for at least 10 minutes before dissection. One animal was dissected at a time, placed on a glass petri dish, with a few milliliters of filtered seawater added to prevent organs from drying out. The atrium and ventral-lateral portion of metapleural folds were cut open to expose the digestive tract. 
Based on prominent anatomical features, we designated the digestive tract into five ‘organs’: the gill, endostyle, midgut, liver (hepatic caecum), and hindgut. These names are used for practical purposes and do not imply their evolutionary homology with organs of other animals. Ptychodera flava Acorn worms were anaesthetised in 0.08% of MS-222 in filtered sea water for 20 minutes ( Applegate et al., 2016 ). Due to strong adhesion of the acorn worm’s digestive tract to the body wall, complete isolation of the gut was not possible to the best of our efforts. Accordingly, the whole cross section of the worm (including enveloping body wall tissues) was amputated according to the internal endodermal features and including the proboscis region with stomochord, the collar region with the mouth, the trunk region with pharynx, esophagus, hepatic region and intestine. Strongylocentrotus purpuratus Adult sea urchins were anesthetized in 0.8 g/L MS-222 for 20 minutes, then dissected along the ambulacral axis from the mouth, resulting in two separate portions of the body. The smaller portion contained the esophagus and anterior stomach (2e–3s–4s) as a continuous tissue, and a separate posterior intestine fragment (9i). The larger portion included the remaining digestive tract (5s–6s–7i–8i). Continuous tissue regions (3s–4s, 5s–6s, 7i–8i) were divided equally for downstream analysis. The pharynx (1p) was also isolated from the teeth. All dissections were carried out on filtered seawater maintained on ice to preserve tissue integrity and the isolated tissues were immediately snap-frozen in liquid nitrogen. Particular attention was given to the anterior stomach (3s), which is rich in digestive enzymes and thus particularly susceptible to RNA degradation. Platynereis dumerilii Adult Platynereis dumerilii specimens, reaching 60-70 segments and having not yet started the pre-mature stage, were dissected to isolate the digestive tract. 
The worms were anaesthetised in plastic plates filled with 7.5% MgCl2, as per ( Kuehn et al., 2019 ). Dissection was performed on the ventral side from anterior to posterior. Morphological landmarks were used to define ten segments along the AP axis. These ten segments correspond to the mouth, stomodeum, transition between stomodeum and esophagus, transition from esophagus to stomach, stomach, transition from stomach to midgut, midgut, transition from midgut to hindgut, and hindgut. We endeavoured to isolate specific tissues with high precision; however, the mouth and hindgut regions are consistently affected by an inseparable layer of skin epidermis. RNA extraction Amphiprion ocellaris On the day of extraction, sample lysates (in Trizol) were thawed on ice and centrifuged 10 min in a tabletop microcentrifuge at 11000 x g, 4°C to collect any leftover tissue debris to the bottom. 750uL of each supernatant was loaded into a dedicated RNA extraction column (NucleoSpin® RNA Mini kit; Macherey-Nagel CAT#740955.50) and processed according to manufacturer recommendations. Specifically, 350uL of 70% Ethanol (Honeywell/Riedel-deHaen CAT#32221, in ddH2O) were added to the filtered flowthrough, the solution was then vortexed, and loaded onto a RNA binding column. After desalting (kit-supplied Membrane Desalting Buffer), contaminating DNA was digested by a 15 min incubation in recombinant DNAse (in Reaction Buffer, room temperature). Guanidine hydrochloride/ethanol wash buffers (RAW2 and then, twice, RA3) were then sequentially used to denature proteins, discarding the flowthrough from centrifugation after each step. After a further centrifugation to remove all possible leftover buffer/ethanol (2 min, 11000 x g, 4°C), membrane-bound RNA was eluted in 30uL of RNAse-free water (UltraPure™ DNase/RNase-Free Distilled Water; Invitrogen™/Thermo Fisher Scientific CAT#10977015), in a 1.5mL RNAse-free tube (kit-supplied). 
RNA amounts and quality were initially assessed with a NanoDrop spectrophotometer (NanoDrop Lite; Thermo Scientific™ CAT#840281500) and by agarose gel electrophoresis (2:1 intensity ratio of 28S:18S bands; 800ng of sample per lane, 0.6 % Agarose in TAE-buffer, 1h, 50V). Extracted RNA was stored at −80C until sequencing. For samples that showed low purity (Liver03, Pyl01, Ain01; A260/A280 ratio < 1.8) an additional purification step was performed. Accordingly, eluted RNA was diluted to 100uL total volume with DEPC water, and mixed with an equal volume of phenol:chloroform (from GeneRacer™ Kit, Invitrogen™/Thermo Fisher Scientific CAT#L150201) by vigorous vortexing for 30s. Phases were separated by centrifugation at maximum speed on a tabletop minicentrifuge (21xg, 5min, RT), and the aqueous phase was collected into a new tube. To re-precipitate the RNA, 12uL of a 10mg/mL mussel glycogen, 3M sodium acetate pH5.2 solution were added (all from GeneRacer™ Kit, Invitrogen™/Thermo Fisher Scientific CAT#L150201). After further addition of 220uL of 95% ethanol, the solution was vortexed briefly. Samples were stored at −80C overnight to allow flocculation. The following day, samples were centrifuged (21xg, 20min, 4C) and all supernatant was removed paying attention to preserve the RNA pellet. The pellet was then washed by adding 500uL of 70% ethanol, followed by manual inversion of the tube and brief vortexing. The sample was then centrifuged 2min, 21g, 4C, the ethanol supernatant was removed, and the sample was centrifuged again under the same settings. Again, any remaining ethanol was removed. Pellets were air-dried for 15 to 30min, or until becoming vitreous/transparent, and then resuspended in 30uL DEPC water. RNA amounts and quality were re-assessed with a NanoDrop spectrophotometer, usually showing minimal RNA loss compared to pre-cleanup amounts, and an increase of around +0.5 points in their A260/A280 ratio. 
Cleaned-up RNA was stored with the rest of the samples at −80C until sequencing. Branchiostoma floridae Immediately after isolation, each organ was immersed in 350 μL of ice-cold “RLT” buffer (RNeasy Mini kit, Qiagen) containing β-mercaptoethanol (RLT/bME, 100:1 v/v). The sample was vortexed 15 seconds and placed on ice. Once all target organs were collected and treated in RLT/bME, the samples were homogenized using a BioMasher II disposable homogenizer and a battery-powered grinder PowerMasher (Nippi. Inc; 10-30 seconds, or until no visible tissue clumps remained). The homogenates were kept in the grinding tube and stored in −80°C for a few days before RNA extraction. RNA was extracted using the RNeasy Mini kit (Qiagen CAT#74104). Frozen samples in RLT/bME were thawed on ice for 5-10 minutes. We followed the manufacturer’s protocol for RNA extraction, with the exception of extending the DNase treatment to 30 minutes at room temperature. Finally, RNA was eluted in 16 μL of nuclease-free water to obtain a concentrated RNA solution. Ptychodera flava To optimize RNA quality, dissected samples were immediately rinsed in cold RNAlater™ Stabilization Solution (Invitrogen™/Thermo Fisher Scientific CAT#AM7020) to clear any remaining digestive enzyme in the gut ( Griffin et al., 2012 ). These stabilized samples were then homogenized in TRIzol with BioMasher II disposable homogenizer and a PowerMasher (Nippi. Inc.) on ice. The RNA extraction of tissue lysate was performed with Direct-zol RNA Miniprep Kit (Zymo Research CAT#R2050) after a pre-filtering step with QIAshredder biopolymer-shredding system (Qiagen CAT#79656). Strongylocentrotus purpuratus Snap-frozen tissue samples were ground in liquid nitrogen to a fine powder. The powdered samples were weighed and lysed using TRIzol™ Reagent (Invitrogen™/Thermo Fisher Scientific CAT#15596026). RNA was then extracted using the Direct-zol RNA Miniprep Kit (Zymo Research CAT#R2050), according to the manufacturer’s instructions. 
Platynereis dumerilii Immediately after collection in a 1.5 mL Eppendorf tube, gut segments were placed on ice to preserve RNA integrity, with 100μL TRIzol™ reagent (Invitrogen™/Thermo Fisher Scientific, CAT#12183555). Gut tissue was then homogenised using a disposable pestle and a battery-powered homogeniser. Up to 1mL of TRIzol™ reagent was then mixed thoroughly into each sample. After a 5min incubation at room temperature, Chloroform was added at a fifth of a volume, samples were shaken vigorously for 15s, and incubated at room temperature for 2–3min. After centrifugation (12,000 × g, 15 min, 4°C) the upper 2/3 aqueous phase was carefully removed. RNA was precipitated by addition of half a volume of 100% isopropanol and gentle mixing by tube inversion. Samples were incubated 10 minutes at room temperature, centrifuged (12,000 x g, 10min, 4°C), and the supernatant was removed. RNA pellets were washed with 75% ethanol-ddH2O and vortexed briefly. After a further repelleting of the RNA (7,500 x g, 5min, 4°C) and removal of all supernatant ethanol, pellets were air-dried for 10 to 15 minutes. As a final step, pellets were resuspended in 30 µL DEPC-treated water. RNA concentration and integrity were measured using a NanoDrop spectrophotometer. Sequencing Amphiprion ocellaris Quality-control, library preparation and sequencing of extracted RNA were performed by the High Throughput Sequencing Core hosted in the Biodiversity Research Center at Academia Sinica, Taipei. RNA-Seq libraries were generated from total RNA using the Illumina Stranded mRNA Prep mRNA Sample Preparation Kit with UDI indices (Illumina, USA) according to manufacturer’s instructions. Surplus PCR primers were removed using AMPure XP (Beckman Coulter Life Sciences, USA). 
Final cDNA libraries were checked for quality and quantified using Qubit (ThermoFisher Scientific, USA) and Fragment Analyzer for size profiling (Agilent, USA), and concentration normalized using KAPA Library Quantification Kit for Illumina Platforms (Roche, USA). Sequencing was performed on an Illumina NextSeq2000 in paired-end 150 base format. Libraries were loaded in a P2 flow cell. Branchiostoma floridae Extracted RNA was initially quantified with a NanoDrop spectrophotometer followed by quantification with a Qubit Fluorometer. RNA integrity (RQN) was assessed using the BioAnalyzer (Agilent). When five RNA sub-samples from different organs of the same animal each contained at least 200 ng of RNA and displayed high quality (RQN 8∼10), these samples were selected for library preparation using the TruSeq stranded RNA-polyA method. The multiplexed cDNA libraries were then sequenced using a Rapid Run flow cell on a HiSeq 2500 sequencer (Illumina) with paired-end 151 bp reads. Ptychodera flava Total RNA was used as input for the Illumina Stranded mRNA Prep mRNA Sample Preparation Kit with UDI indices (Illumina, USA), according to manufacturer’s instructions. Sequencing was performed on an Illumina NextSeq2000 in paired-end 150 base format. Libraries were loaded in a P3 flow cell. Strongylocentrotus purpuratus RNA-seq experiments were conducted using four biological replicates. Total RNA quality and concentration were assessed using the Fragment Analyzer and Qubit Fluorometer. Bulk RNA sequencing was performed on the Illumina NextSeq2000 platform, generating 150 bp paired-end reads with high sequencing depth to ensure transcriptome coverage and quantification accuracy. Platynereis dumerilii The quality of the extracted RNA was assessed using an Agilent Fragment Analyzer 5200 to check integrity and a Qubit 4 Fluorometer to check concentration. The experiments were done in three biological replicates. 
Bulk RNA-seq was performed on an Illumina HiSeq 2500 with 125 bp paired-end reads (deep sequencing) by the NGS High Throughput Genomics Core at Academia Sinica. Clownfish Hox complement reconstruction The reconstruction of Amphiprion ocellaris Hox genes, their numbers and their identity, was based on the gene models available from both the NCBI reference annotation (ASM2253959v1) and the Ensembl annotation at the time (AmpOce1.0, now matched to ASM2253959v1), taking also into account the relative position of the genes within each cluster. Furthermore, only genes for which the corresponding protein was predicted to contain a homeobox domain were maintained. The resulting list of assigned identities was then cross-compared with the expected percomorph configuration based on Hox cluster evolutionary patterns in teleosts ( Hoegg & Meyer, 2005 ), and was indeed found to be most similar to the configuration in the closest reference species Oryzias latipes ( Kurosawa et al., 2006 ) and Oreochromis niloticus ( Santini & Bernardi, 2005 ). We conservatively define a final set of 47 Hox genes for Amphiprion ocellaris . Orthology assignment A complete list of the protein IDs of all annotated proteins from each species was extracted from the corresponding Gene Transfer Format (.gtf) files downloaded from NCBI, referring to the following published annotations: Ao: GCF_022539595.1; Bf: GCF_000003815.2; Pf: GCF_041260155.1; Sp: GCF_000002235.5. Custom files, based on GCA_026936325.1, were used for Pd. The protein ID corresponding to the longest transcript isoform of each (protein-coding) gene was selected as representative entry (deduplication). These IDs were then used to subset the full proteome of each species, as downloaded from NCBI, using the “filterbyname” shell script of BBTools v39.01 (RRID:SCR_016968; Bushnell B., http://sourceforge.net/projects/bbmap/ ). 
The resulting deduplicated proteomes were used for orthogroup identification using the standard Orthofinder2 pipeline ( Emms & Kelly, 2019 ) with default settings. Anticipating the potential needs of indexing the generated ortholog table to known vertebrate homologues, the deduplicated proteomes from human ( Homo sapiens , Hs), mouse ( Mus musculus , Mm), and zebrafish ( Danio rerio , Dr) were also included in the orthology reconstruction (Hs: GCF_000001405.40; Mm: GCF_000001635.27; Dr: GCF_000002035.6). Hox orthogroup reconstruction We note that Orthofinder fails to reconstruct coherent orthogroups for the Hox paralogues across bilaterians due to the complex evolutionary history of this gene family, often marked by independent duplication of common ancestors across lineages ( Hueber et al., 2010 , 2013 ). In our analysis, this resulted for example in the fragmentation of all Hox genes into 21 different orthogroups, with paralogues at equivalent Hox positions split across different orthogroups. From the perspective of our comparative analysis, we are interested in comparing the expression pattern of Hox genes at equivalent positions rather than necessarily preserving true phylogenetic relationships. Accordingly, all 21 orthogroups containing Hox genes were discarded and replaced by a manually defined final set of 8 “Hox orthogroups” (“OG000PG01”, “OG000PG02”, “OG000PG0304”, “OG000PG05”, “OG000PG0607”, “OG000PG08”, “OG000PG0910”, “OG000PG1115”) grouping Hox genes at equivalent cluster positions across species (e.g. “OG000PG01” grouping all Hox genes at position 01 of each Hox cluster). In cases where a given cluster member was absent from at least one species, which would prevent the use of all other species’ matches in comparative analysis, a merged “Hox orthogroup” was created by combining paralogues from neighbouring positions (e.g. “OG000PG0304” grouping all Hox genes at positions 03 and 04 of each Hox cluster, due to the absence of Hox4 in Sp). 
Note that for the special case of Sp Hox genes, which break genomic collinearity ( Cameron et al., 2006 ), the three 5’ Hox genes were associated with the first three Hox orthogroups, therefore prioritising phylogenetic correspondence. We observe that their expression within the gut is indeed anterior. Transcription factor identification To identify transcription factors (TFs), we followed AnimalTFDB protocols and performed biological sequence analysis on each species’ deduplicated proteome using profile hidden Markov Models (HMMER) with InterPro’s Pfam-A models and AnimalTFDB v4.0 self-built HMM files ( Mistry et al., 2021 ; Potter et al., 2018 ; Shen et al., 2023 ). With these methods, 1778, 1933, 1339, 992 and 1425 TFs were identified in Ao, Bf, Pf, Sp and Pd respectively. When each species’ TFs were summarised at the Orthogroup level, we noticed that members of the same orthogroup would sometimes be classified as TFs in one or more species, but not in other ones. To resolve this mismatch, we decided to apply an inclusive approach to TF definition by further including as TFs all “non-TFs” falling within the same orthogroup of another species’ TF (i.e. we expanded the TF list based on domain-search alone). After adjustment for Hox gene orthogroups (see section “Hox orthogroup reconstruction”), we thus obtain a total of 1426 TF orthogroups as a basis for comparative analysis. Due to the constraints of cross-species comparisons, and the use of Orthogroups, we stress that our final list of TF orthogroups does not include species-specific TFs (i.e. TFs with no orthologues in any other species), regardless of any fundamental role they may well play within the adult gut of their particular species. 
Analysis of bulkRNAseq data Raw data preprocessing, gene-level quantification, quality control Amphiprion ocellaris Raw (demultiplexed) fastq files were quality-checked based on reports generated by using FastQC v0.12.0 (RRID:SCR_014583; ( Andrews et al., 2010 )) with default parameters, before and after adapter trimming. Adapters were trimmed using the function bbduk (RRID:SCR_016969) of BBTools v39.01 (RRID:SCR_016968; Bushnell B., http://sourceforge.net/projects/bbmap/ ) with ktrim=r, and k=23, trimpolyg=40. Categories flagged by FastQC after trimming (“warning” or “fail”) were analysed in detail and judged not to be prejudicial to further analysis. Issues relating to the detection of high sequence duplication rates were diagnosed based on the output of the analyzeDuprates function of the dupRadar package ( Sayols et al., 2016 ). To this aim, duplicate reads were marked with the function markdup from SAMtools v1.18 (RRID:SCR_002105; ( Danecek et al., 2021 )) with default parameters. As a further quality control step to detect sample contamination, trimmed reads were also run through FastQ Screen v0.15.2 (RRID:SCR_000141; ( Wingett & Andrews, 2018 )) with default parameters, against a manually curated set of genomes including — in addition to default ones — those of other fish species used by neighbouring laboratories (goldfish Carassius auratus : ASM336829v1, carp Cyprinus carpio : ASM1834038v1, zebrafish Danio rerio : GRCz11), the three main live foods fed to our fish ( Artemia franciscana : AFR02, Brachionus rotundiformis : ASM1680229v1, Chlorella vulgaris : cvul), and additional possible contaminating species (ant Formica exsecta : ASM365146v1). All FastQ Screen genomes were indexed with bowtie2 v2.4.4 (RRID:SCR_016368; ( Langmead & Salzberg, 2012 )) as per FastQ Screen recommendation. 
Trimmed reads were quantified at the transcript-level using the pseudo-aligner salmon v1.10.1 (RRID:SCR_017036; ( Patro et al., 2017 )) against the clownfish Amphiprion ocellaris reference transcriptome, using the genome as a decoy (decoy-aware pseudo-alignment; assembly ASM2253959v1; ( Ryu et al., 2022 )), as per documentation, and using flags --validateMappings --seqBias --gcBias. The average mapping rate was 85.9 % of total reads. Salmon output transcript-based quantification files (quant.sf) were imported in RStudio (RRID:SCR_000432; ( RStudio Team, 2020 )) and summarised at the gene level using the tximport function from the tximport package (RRID:SCR_016752; ( Soneson et al., 2015 )), referencing the gene models of the Amphiprion ocellaris reference genome assembly ASM2253959v1. The counts matrix was obtained by re-calculating counts through the flag countsFromAbundance = “lengthScaledTPM”. Gene metadata (names, descriptions) were loaded from a custom-curated reference file based on the integration of Ensembl (still based on assembly AmpOce1.0) and NCBI annotations. This metadata reference is available at the code repository associated with this publication. Branchiostoma floridae, Ptychodera flava and Strongylocentrotus purpuratus The raw sequencing data of amphioxus, acorn worm and sea urchin were processed using the following bioinformatics pipeline. Initially, quality trimming was performed using fastp v0.22.0 to remove low-quality bases and adapter sequences ( Chen et al., 2018 ). The trimmed reads were then aligned to the reference genomes of B. floridae (GCF_000003815.2, NCBI), P. flava ( Lin et al., 2024 ), and S. purpuratus (v5.0 genome assembly from Echinobase) using the STAR aligner v2.7.10b ( Dobin et al., 2013 ). The STAR output files were subsequently sorted using SAMtools v1.17 to organize for downstream analyses ( Danecek et al., 2021 ). Gene read counts were quantified using FeatureCounts v2.0.3( Liao et al., 2014 ). 
Finally, the count tables were processed with the DESeq2 v1.38.3 package in R for normalization and transformations, preparing the data for the downstream analysis ( Love et al., 2014 ). Platynereis dumerilii FastQC v. 0.11.9. ( Andrews, 2010 ) was used to quality control raw reads (fastq files) generated from sequencing. The raw reads were then preprocessed with Trimmomatic v. 0.39 to remove adapter sequences and low-quality regions, then passed through another round of quality control to verify successful adapter removal. Bases were removed from the start of each read if they had a Phred score below 20 (LEADING:20) and removed at the end of each read if they had a Phred score below 3 (TRAILING:3). A sliding window of 4 was used to continue removing bases based on an average score threshold of 15 (SLIDINGWINDOW:4:15). Any reads shorter than 30 bases after trimming were discarded, as they might be too short to provide reliable mapping (MINLEN:30) ( Korpelainen et al., 2014 ). Alignment of raw reads to genome references was conducted by STAR 2.7.11a following ( Dobin et al., 2013 ) and the tabulation of aligned counts was carried out using the Subread featureCounts version 3 ( Liao et al., 2014 ). Filtering and standard counts processing Raw counts from each dataset were processed under analogous conditions, following the same processing pipeline. Specifically, counts were processed as a DGEobject (edgeR package, RRID:SCR_012802; ( Chen et al., 2016 , 2025 ; McCarthy et al., 2012 ; Robinson et al., 2010 )) and differences in library size were taken into account by obtaining counts per million (CPM) values (edgeR’s function cpm) to allow a comparable threshold to filter out of lowly expressed genes. We only maintained genes for which at least 10 counts could be detected (arbitrary) in at least the number of samples corresponding to the number of replicates obtained from each species (i.e. in at least 3 or 4 samples). 
We note that the threshold of 10 counts, chosen a priori based on usual practices, resulted in the filtering out of key genes of interest (e.g. Wnt10 and Tbxt in Sp, Cdx4 in Ao). Though we later noticed that the pattern of expression of many filtered-out genes of interest is in fact coherent with expectation based on published adult gut literature or on known embryonic patterns, we preferred to prioritise robustness of results over expansion of the genes included in the comparison. We maintained the original count threshold set a priori. Each filtered counts table was then processed through the standard DESeq2 pipeline (DESeq2 package, RRID:SCR_015687; ( Love et al., 2014 )) as in ( Mantica et al., 2024 ) but further including VST normalisation (DESeq2’s varianceStabilizingTransformation function). Batch effects associated with the biological replicates of each dataset were removed using the removeBatchEffect function from the limma package (RRID:SCR_010943; ( Ritchie et al., 2015 )). Integrated analysis Orthogroup preprocessing Count data from different species were integrated on the basis of Orthogroups, and as in ( Mantica et al., 2024 ), unless indicated. Accordingly, and to decrease later computational complexity, Orthogroups were filtered by size and complexity: orthogroups comprising more than 120 genes were removed, as well as orthogroups with more than 80 genes in cases where these had unbalanced representation across species. Of the filtered orthogroups, 6118 were represented across all species (and could therefore be used for integrated analysis). To avoid having to discard 1-to-many orthologues, a situation exacerbated by the inclusion of a teleost in our panel of species, we summarised multi-member groups in each species to a single “best ancestral orthologue”, i.e. the ortholog in each species that most likely conserved the ancestral protein sequence. 
To do this, for each orthogroup, pairwise sequence similarity scores were calculated using the parSeqSim function from the protr package ( Xiao et al., 2015 ) with parameters type = “local”, submat = “BLOSUM62”, gap.opening = 2, gap.extension = 0.1, to recreate the mafft defaults used in Mantica et al., 2024 . The protein with the highest average sequence similarity (among all sequence similarity scores to all proteins from all other species in the same orthogroup) was ultimately selected. Note that due to the computational intensity of this step in our system, we did not require the highest average sequence similarity score to have substantial margin from that of the second-best scoring protein. Also note that though the approach in Mantica et al., 2024 further refines “best ancestral orthologue” assignment by factoring in conservation of expression profile (Pearson’s expression correlations across matching tissues), we could not do this in our case since finding which gut segments are analogous across species was the matter of investigation in the first place. Integration of count matrices Comparative analyses were performed by integrating normalised count matrices from all five species into a single counts matrix spanning all samples, using orthogroups as rows/features (rather than genes) to provide a common term of comparison. This results in a necessary loss of all species-specific genes, and all genes belonging to orthogroups not expressed in all five adult guts. For “many-to-one” orthogroup relationships, which need to be resolved to one-to-one relationships, the “best ancestral orthologue” was selected as representative of the orthogroup, based on the criteria detailed above. 
Finally, integration was achieved by working on within-dataset z-score normalised counts (from each species; (tissue counts − species mean)/(sample standard deviation within species); base R’s “scale” function with default parameters) rather than the original counts value themselves (( Cheadle et al., 2003 ); as in ( Mantica et al., 2024 )). Within-species z-scoring has been consistently observed to be required to minimise inter-species variability, avoid sample clustering by species, and to allow samples to cluster by tissue (( Mantica et al., 2024 ; Picciani et al., 2025 )). This is also what we observed in our dataset. Data analysis and visualisation Pearson correlation matrices: pairwise Spearman’s rank correlation coefficients between samples were calculated using the “cor” function (base R). PCA plots : PCA was computed on centered, unscaled counts (prcomp function, base R) and the samples’ PC scores were plotted using ggplot2 (RRID:SCR_014601; ( Wickham, 2016 )). Heatmaps : all heatmaps were plotted using the function Heatmap from the ComplexHeatmap package ( Gu, 2022 ; Gu et al., 2016 ) reporting z-scores ((counts − mean)/sample standard deviation; base R’s “scale” function with default parameters). Rank 2 Elliptical (R2E) seriation We stress that the investigation and recovery of patterns of gene expression in sets of samples with an intrinsic (anatomical) AP order revealed itself to be non-trivial. Built-in seriation methods associated with heatmap plotting packages (following hierarchical clustering) would invariably require additional subjective steps of manual re-ordering of the clusters obtained (branch flipping) to reconstitute an overall diagonal pattern of gene expression spanning the AP axis of the segments. 
We ultimately chose to adopt a reproducible, less-subjective seriation criterion able to highlight long-range gradients in expression pattern (Rank-2 Elliptical seriation, “R2E”; ( Chen, 2002 )) and used such a seriation criterion as an investigation tool in and of itself. Though R2E seriation is available in RStudio as an ordination method prepackaged within the “seriation” package ( Hahsler et al., 2008 ), we manually implemented it from first principles ( Chen, 2002 ) to allow much more flexibility in our ability to study these patterns of expression, and to be able to easily obtain a seriation with correct directionality or with alternative starting points. Specifically, Pearson correlation coefficient matrices between genes (or orthogroups, if working with the orthogroup-summarised matrix) were calculated iteratively, effectively calculating the Pearson correlation coefficient between the previous Pearson correlation coefficients at each successive round (“cor” function, base R), until reaching a correlation matrix of rank 2. The rank of each matrix was defined as the number of eigenvalues greater than e^-13. We found that 6 iterations were always sufficient to reach a rank 2 matrix given our datasets. As demonstrated in ( Chen, 2002 ) the left singular vectors of such a matrix fall on an ellipse in a two-dimensional subspace, and their relative position along such an ellipse can be used as a reordering solution for a Robinson matrix. Singular value decomposition was thus applied to the first rank-2 matrix reached (“svd” function, base R) and the distribution of the left singular vector coordinates of each gene (svd$u) was visualised as an interactive plot to easily identify the index of the first element of the series (usually corresponding to the element at the largest gap). This new, “R2E” order was obtained by extracting the clockwise or anticlockwise sequence of elements from this first starting point. 
The same approach — but using as starting point the correlation matrix between gut segments rather than between genes/orthogroups — was adopted for R2E seriation of gut segments where applicable. Unbiased TF analysis (SAMap) To estimate the cross-species tissue similarity based on transcription factor or non-transcription factor expression we adopted the SAMap ( Tarashansky et al., 2021 ) analysis pipeline, applying it to our bulk RNAseq datasets. The TF and non-TF gene count tables were imported with Seurat ( Hao et al., 2024 ) in R and further converted to .h5ad files with SeuratDisk ( https://github.com/mojaveazure/seurat-disk.git ). Mapping scores were calculated using SAMap default settings. Model-based gene set analysis (MGSA) To find enriched gene sets within (unranked) genes expressed in the adult gut tube of all five species, we relied on clownfish gene annotations and clownfish gene sets given our extensive experience with these annotations in this species (see also ( Herrera, Vianello, et al., 2025 )), and the current much higher level of understanding of gene function in vertebrate species compared to the other species under analysis. We proceeded with the assumption that orthologous genes likely share functional properties. Accordingly, the clownfish best representative orthologue (see section “Integrated analysis”) was taken as the representative of each expressed orthogroup, and Model-based gene set analysis (MGSA; mgsa function from mgsa package, ( Bauer et al., 2010 )) was run by referencing the Ensembl “biological_process” Gene Ontology annotation for Amphiprion ocellaris (“aocellaris_gene_ensembl” dataset; useMart and getBM functions from biomaRt package, RRID:SCR_019214; ( Durinck et al., 2005 , 2009 )). Given that Ensembl annotations are based on a different (earlier) genome assembly (AmpOce1.0), orthogroups whose clownfish best representative orthologue had no matching Ensembl ID could not be taken into account. 
sPLS-DA To identify key discriminant variables of segment groups of interest, we applied the single-step cross-dataset integration and classification approach of the multivariate integration (MINT) framework ( Rohart et al., 2017 ), combining within-dataset z-score normalisation and classification through sparse Partial Least Squares Discriminant Analysis ( Lê Cao et al., 2011 ). In sPLS-DA, datasets are decomposed in a way that does not maximise variance, as in PCA, but where instead the components retrieved from decomposition of each dataset are maximally covariant (with penalties applied for further feature selection) ( Lê Cao et al., 2008 ). Data Availability □ Raw reads of bulkRNAseq datasets are available to download under NCBI BioProject accession number PRJNA1276984 : “Comparative transcriptomics analysis of the anteroposterior organisation of adult bilaterian guts” □ Counts matrix and code to reproduce the transcriptomics analysis are available at: https://github.com/StefanoVianello/ASICOB_GCP_AdultBilaterianGuts Author contributions (CRediT) Conceptualization : Stefano Davide Vianello (SDV), Vincent Laudet (VL), Yi-Hsien Su (YHS), Jr-Kai Yu (JKY), Stephan Q. Schneider (SQS); Data curation: SDV, Ching-Yi Lin (CYL), Wahyu Cristine Pinem (WCP), Han-Ru Li (HRL), Kun-Lung Li (KLL); Formal analysis: SDV, CYL, WCP; Funding acquisition: VL, YHS, JKY, SQS; Investigation: SDV, CYL, WCP, HRL, KLL, Grace Sonia (GS); Methodology: SDV, CYL, WCP, HRL, KLL, GS; Project administration: SDV, CYL, WCP, HRL, KLL, GS, VL, YHS, JKY, SQS; Resources: SDV, CYL, HRL, WCP, KLL, GS, Shu-Hua Lee (SHL), Szu-Kai Wu (SKW); Software: SDV, CYL; Supervision: SDV, VL, YHS, JKY, SQS; Visualization: SDV, CYL; Writing – original draft: SDV, CYL, WCP, HRL, KLL, GS; Writing – review & editing: SDV, VL, YHS, JKY, SQS. Download figure Open in new tab Acknowledgements This work was supported by an Academia Sinica Grand Challenge Programme Grant (AS-GC-111-L01). 
We thank the High Throughput Sequencing Core hosted in the Biodiversity Research Center at Academia Sinica for performing all NGS experiments. The core facility is funded by Academia Sinica Core Facility and Innovative Instrument Project (AS-CFII-108-114). We further thank all the administrative staff and aquaculture specialists of Yilan Marine Research Station, and all present members of all four labs involved in this research project. We thank Paul Gerald Layague Sanchez for valuable input on this research and critical reading of this manuscript. Funder Information Declared Academia Sinica, https://ror.org/05bxb3784 , AS-GC-111-L01 Footnotes https://github.com/StefanoVianello/ASICOB_GCP_AdultBilaterianGuts https://www.ncbi.nlm.nih.gov/bioproject/PRJNA1276984 Bibliography ↵ Aguado , M. T. , Ponz-Segrelles , G. , Glasby , C. J. , Ribeiro , R. P. , Nakamura , M. , Oguchi , K. , Omori , A. , Kohtsuka , H. , Fischer , C. , Ise , Y. , Jimi , N. , & Miura , T . ( 2022 ). Ramisyllis kingghidorahi n. Sp., a new branching annelid from Japan . Organisms Diversity & Evolution , 22 ( 2 ), 377 – 405 . doi: 10.1007/s13127-021-00538-4 OpenUrl CrossRef ↵ Aldea , D. , Subirana , L. , Keime , C. , Meister , L. , Maeso , I. , Marcellini , S. , Gomez-Skarmeta , J. L. , Bertrand , S. , & Escriva , H . ( 2019 ). Genetic regulation of amphioxus somitogenesis informs the evolution of the vertebrate head mesoderm . Nature Ecology & Evolution , 3 ( 8 ), 1233 – 1240 . doi: 10.1038/s41559-019-0933-z OpenUrl CrossRef PubMed ↵ Andrews , S. ( 2010 ). FastQC: a quality control tool for high throughput sequence data . (No Title). ↵ Andrews , S. , Krueger , F. , Segonds-Pichon , A. , Biggins , L. , Krueger , C. , & Wingett , S. ( 2010 , January). FastQC: a quality control tool for high throughput sequence data . http://www.bioinformatics.bbsrc.ac.uk/projects/fastqc ↵ Annunziata , R. , Andrikou , C. , Perillo , M. , Cuomo , C. , & Arnone , M. I . ( 2019 ). 
Development and evolution of gut structures: From molecules to function . Cell and Tissue Research , 377 ( 3 ), 445 – 458 . doi: 10.1007/s00441-019-03093-9 OpenUrl CrossRef PubMed ↵ Annunziata , R. , & Arnone , M. I . ( 2014 ). A dynamic regulatory network explains ParaHox gene control of gut patterning in the sea urchin . Development , 141 ( 12 ), 2462 – 2472 . doi: 10.1242/dev.105775 OpenUrl Abstract / FREE Full Text ↵ Annunziata , R. , Perillo , M. , Andrikou , C. , Cole , A. G. , Martinez , P. , & Arnone , M. I . ( 2014 ). Pattern and process during sea urchin gut morphogenesis: The regulatory landscape . Genesis , 52 ( 3 ), 251 – 268 . doi: 10.1002/dvg.22738 OpenUrl CrossRef PubMed ↵ Applegate , J. R. , Dombrowski , D. S. , Christian , L. S. , Bayer , M. P. , Harms , C. A. , & Lewbart , G. A . ( 2016 ). TRICAINE METHANESULFONATE (MS-222) SEDATION AND ANESTHESIA IN THE PURPLE-SPINED SEA URCHIN (ARBACIA PUNCTULATA) . Journal of Zoo and Wildlife Medicine , 47 ( 4 ), 1025 – 1033 . doi: 10.1638/2015-0288.1 OpenUrl CrossRef PubMed ↵ Arenas-Mena , C. , Cameron , R. A. , & Davidson , E. H . ( 2006 ). Hindgut specification and cell-adhesion functions of Sphox11/13b in the endoderm of the sea urchin embryo . Development, Growth & Differentiation , 48 ( 7 ), 463 – 472 . doi: 10.1111/j.1440-169X.2006.00883.x OpenUrl CrossRef PubMed Web of Science ↵ Aria , M. N. , & Chan , I. M . ( 1989 ). Two types of excretory pores in the hydrozoan medusa Aequorea victoria (Murbach and Shearer, 1902) . Journal of Plankton Research , 11 ( 3 ), 609 – 614 . doi: 10.1093/plankt/11.3.609 OpenUrl CrossRef ↵ Avian , M. , Mancini , L. , Voltolini , M. , Bonnet , D. , Dreossi , D. , Macaluso , V. , Pillepich , N. , Prieto , L. , Ramšak , A. , Terlizzi , A. , & Motta , G . ( 2022 ). A novel endocast technique providing a 3D quantitative analysis of the gastrovascular system in Rhizostoma pulmo: An unexpected through-gut in cnidaria . PLOS ONE , 17 ( 8 ), e0272023 . 
doi: 10.1371/journal.pone.0272023 OpenUrl CrossRef PubMed ↵ Bauer , S. , Gagneur , J. , & Robinson , P. N . ( 2010 ). GOing Bayesian: Model-based gene set analysis of genome-scale data . Nucleic Acids Research , 38 ( 11 ), 3523 – 3532 . doi: 10.1093/nar/gkq045 OpenUrl CrossRef PubMed Web of Science ↵ Beck , F. , Tata , F. , & Chawengsaksophak , K . ( 2000 ). Homeobox genes and gut development . BioEssays , 22 ( 5 ), 431 – 441 . doi: 10.1002/(SICI)1521-1878(200005)22:5%3C431::AID-BIES5%3E3.0.CO;2-X OpenUrl CrossRef PubMed Web of Science ↵ Boyle , M. J. , Yamaguchi , E. , & Seaver , E. C . ( 2014 ). Molecular conservation of metazoan gut formation: Evidence from expression of endomesoderm genes in Capitella teleta (Annelida) . EvoDevo , 5 ( 1 ), 39 . doi: 10.1186/2041-9139-5-39 OpenUrl CrossRef PubMed ↵ Buchon , N. , Osman , D. , David , F. P. A. , Fang , H. Y. , Boquete , J.-P. , Deplancke , B. , & Lemaitre , B . ( 2013 ). Morphological and molecular characterization of adult midgut compartmentalization in Drosophila . Cell Reports , 3 ( 5 ), 1725 – 1738 . doi: 10.1016/j.celrep.2013.04.001 OpenUrl CrossRef PubMed Web of Science ↵ Cameron , R. A. , Rowen , L. , Nesbitt , R. , Bloom , S. , Rast , J. P. , Berney , K. , Arenas-Mena , C. , Martinez , P. , Lucas , S. , Richardson , P. M. , Davidson , E. H. , Peterson , K. J. , & Hood , L. ( 2006 ). Unusual gene order and organization of the sea urchin hox cluster . Journal of Experimental Zoology Part B: Molecular and Developmental Evolution , 306B ( 1 ), 45 – 58 . doi: 10.1002/jez.b.21070 OpenUrl CrossRef PubMed ↵ Camiz , S . ( 2005 ). The Guttman effect: Its interpretation and a new redressing method . Data Analysis Bulletin , 5 , 7 – 34 . OpenUrl ↵ Castro , L. F. C. , Lopes-Marques , M. , Gonçalves , O. , & Wilson , J. M . ( 2012 ). The Evolution of Pepsinogen C Genes in Vertebrates: Duplication, Loss and Functional Diversification . PLOS ONE , 7 ( 3 ), e32852 . doi: 10.1371/journal.pone.0032852 OpenUrl CrossRef PubMed ↵ Cheadle , C. 
, Vawter , M. P. , Freed , W. J. , & Becker , K. G . ( 2003 ). Analysis of microarray data using Z score transformation . The Journal of Molecular Diagnostics: JMD , 5 ( 2 ), 73 – 81 . doi: 10.1016/S1525-1578(10)60455-2 OpenUrl CrossRef PubMed Web of Science ↵ Chen , C.-H. ( 2002 ). Generalized association plots: Information visualization via iteratively generated correlation matrices . Statistica Sinica , 12 ( 1 ), 7 – 29 . ↵ Chen , S. , Zhou , Y. , Chen , Y. , & Gu , J . ( 2018 ). fastp: An ultra-fast all-in-one FASTQ preprocessor . Bioinformatics , 34 ( 17 ), i884 – i890 . doi: 10.1093/bioinformatics/bty560 OpenUrl CrossRef PubMed ↵ Chen , Y. , Chen , L. , Lun , A. T. L. , Baldoni , P. L. , & Smyth , G. K . ( 2025 ). edgeR v4: Powerful differential analysis of sequencing data with expanded functionality and improved support for small counts and larger datasets . Nucleic Acids Research , 53 ( 2 ), gkaf018 . doi: 10.1093/nar/gkaf018 OpenUrl CrossRef PubMed ↵ Chen , Y. , Lun , A. T. L. , & Smyth , G. K . ( 2016 ). From reads to genes to pathways: Differential expression analysis of RNA-Seq experiments using Rsubread and the edgeR quasi-likelihood pipeline . F1000Research , 5 , 1438 . doi: 10.12688/f1000research.8987.2 OpenUrl CrossRef PubMed ↵ Childers , L. , Park , J. , Wang , S. , Liu , R. , Barry , R. , Watts , S. A. , Rawls , J. F. , & Bagnat , M . ( 2025 ). Protein absorption in the zebrafish gut is regulated by interactions between lysosome rich enterocytes and the microbiome . eLife , 13 , RP100611 . doi: 10.7554/eLife.100611 OpenUrl CrossRef PubMed ↵ Cole , A. G. , Rizzo , F. , Martinez , P. , Fernandez-Serra , M. , & Arnone , M. I . ( 2009 ). Two ParaHox genes, SpLox and SpCdx, interact to partition the posterior endoderm in the formation of a functional gut . Development , 136 ( 4 ), 541 – 549 . doi: 10.1242/dev.029959 OpenUrl Abstract / FREE Full Text ↵ Cornelius , C. E . ( 1985 ). Hepatic ontogenesis . Hepatology (Baltimore, Md.) , 5 ( 6 ), 1213 – 1221 . 
doi: 10.1002/hep.1840050625 OpenUrl CrossRef PubMed ↵ Dai , Y. , Pan , R. , Pan , Q. , Wu , X. , Cai , Z. , Fu , Y. , Shi , C. , Sheng , Y. , Li , J. , Lin , Z. , Liu , G. , Zhu , P. , Li , M. , Li , G. , & Zhou , X . ( 2024 ). Single-cell profiling of the amphioxus digestive tract reveals conservation of endocrine cells in chordates . Science Advances , 10 ( 51 ), eadq0702 . doi: 10.1126/sciadv.adq0702 OpenUrl CrossRef PubMed ↵ Danecek , P. , Bonfield , J. K. , Liddle , J. , Marshall , J. , Ohan , V. , Pollard , M. O. , Whitwham , A. , Keane , T. , McCarthy , S. A. , Davies , R. M. , & Li , H . ( 2021 ). Twelve years of SAMtools and BCFtools . GigaScience , 10 ( 2 ), giab008 . doi: 10.1093/gigascience/giab008 OpenUrl CrossRef PubMed ↵ Dobin , A. , Davis , C. A. , Schlesinger , F. , Drenkow , J. , Zaleski , C. , Jha , S. , Batut , P. , Chaisson , M. , & Gingeras , T. R . ( 2013 ). STAR: Ultrafast universal RNA-seq aligner. Bioinformatics (Oxford , England) , 29 ( 1 ), 15 – 21 . doi: 10.1093/bioinformatics/bts635 OpenUrl CrossRef PubMed Web of Science ↵ Dunn , F. S. , Kenchington , C. G. , Parry , L. A. , Clark , J. W. , Kendall , R. S. , & Wilby , P. R . ( 2022 ). A crown-group cnidarian from the Ediacaran of Charnwood Forest , UK. Nature Ecology & Evolution , 6 ( 8 ), 1095 – 1104 . doi: 10.1038/s41559-022-01807-x OpenUrl CrossRef PubMed ↵ Duque-Correa , M. J. , Codron , D. , Meloro , C. , McGrosky , A. , Schiffmann , C. , Edwards , M. S. , & Clauss , M . ( 2021 ). Mammalian intestinal allometry, phylogeny, trophic level and climate . Proceedings of the Royal Society B: Biological Sciences , 288 ( 1944 ), 20202888 . doi: 10.1098/rspb.2020.2888 OpenUrl CrossRef PubMed ↵ Durinck , S. , Moreau , Y. , Kasprzyk , A. , Davis , S. , De Moor , B. , Brazma , A. , & Huber , W. ( 2005 ). BioMart and Bioconductor: A powerful link between biological databases and microarray data analysis . Bioinformatics (Oxford, England) , 21 ( 16 ), 3439 – 3440 . 
doi: 10.1093/bioinformatics/bti525 OpenUrl CrossRef PubMed Web of Science ↵ Durinck , S. , Spellman , P. T. , Birney , E. , & Huber , W . ( 2009 ). Mapping identifiers for the integration of genomic datasets with the R/Bioconductor package biomaRt . Nature Protocols , 4 ( 8 ), 1184 – 1191 . doi: 10.1038/nprot.2009.97 OpenUrl CrossRef PubMed Web of Science ↵ Dutta , D. , Dobson , A. J. , Houtz , P. L. , Gläßer , C. , Revah , J. , Korzelius , J. , Patel , P. H. , Edgar , B. A. , & Buchon , N . ( 2015 ). Regional Cell-Specific Transcriptome Mapping Reveals Regulatory Complexity in the Adult Drosophila Midgut . Cell Reports , 12 ( 2 ), 346 – 358 . doi: 10.1016/j.celrep.2015.06.009 OpenUrl CrossRef PubMed ↵ Emms , D. M. , & Kelly , S . ( 2019 ). OrthoFinder: Phylogenetic orthology inference for comparative genomics . Genome Biology , 20 ( 1 ), 238 . doi: 10.1186/s13059-019-1832-y OpenUrl CrossRef PubMed ↵ Engel , P. , & Moran , N. A . ( 2013 ). The gut microbiota of insects – diversity in structure and function . FEMS Microbiology Reviews , 37 ( 5 ), 699 – 735 . doi: 10.1111/1574-6976.12025 OpenUrl CrossRef PubMed Web of Science ↵ Fages , A. , Luxey , M. , Ronco , F. , Huyghe , C. E. T. , Menon , P. N. K. , Indermaur , A. , Salzburger , W. , & Tschopp , P . ( 2024 ). Adaptive cellular evolution in the intestinal tracts of hyperdiverse African cichlid fishes (p. 2024.11.28.625862) . bioRxiv . doi: 10.1101/2024.11.28.625862 OpenUrl Abstract / FREE Full Text ↵ Fang , R. , Olds , L. C. , & Sibley , E . ( 2006 ). Spatio-temporal patterns of intestine-specific transcription factor expression during postnatal mouse gut development . Gene Expression Patterns , 6 ( 4 ), 426 – 432 . doi: 10.1016/j.modgep.2005.09.003 OpenUrl CrossRef PubMed ↵ Fanning , J. C. , Tyler , M. J. , & Shearman , D. J . ( 1982 ). Converting a stomach to a uterus: The microscopic structure of the stomach of the gastric brooding frog Rheobatrachus silus . Gastroenterology , 82 ( 1 ), 62 – 70 . 
OpenUrl CrossRef PubMed Web of Science ↵ Freeman , R. , Ikuta , T. , Wu , M. , Koyanagi , R. , Kawashima , T. , Tagawa , K. , Humphreys , T. , Fang , G.-C. , Fujiyama , A. , Saiga , H. , Lowe , C. , Worley , K. , Jenkins , J. , Schmutz , J. , Kirschner , M. , Rokhsar , D. , Satoh , N. , & Gerhart , J . ( 2012 ). Identical Genomic Organization of Two Hemichordate Hox Clusters . Current Biology , 22 ( 21 ), 2053 – 2058 . doi: 10.1016/j.cub.2012.08.052 OpenUrl CrossRef PubMed ↵ Fritzenwanker , J. H. , Gerhart , J. , Freeman , R. M. , & Lowe , C. J . ( 2014 ). The Fox/Forkhead transcription factor family of the hemichordate Saccoglossus kowalevskii . EvoDevo , 5 , 17 . doi: 10.1186/2041-9139-5-17 OpenUrl CrossRef PubMed ↵ Garstang , W . ( 1928 ). The Morphology of the Tunicata, and its bearings on the Phylogeny of the Chordata . Journal of Cell Science , s2-72 ( 285 ), 51 – 187 . doi: 10.1242/jcs.s2-72.285.51 OpenUrl CrossRef ↵ Gavilán , B. , Sprecher , S. G. , Hartenstein , V. , & Martinez , P . ( 2019 ). The digestive system of xenacoelomorphs . Cell and Tissue Research , 377 ( 3 ), 369 – 382 . doi: 10.1007/s00441-019-03038-2 OpenUrl CrossRef PubMed ↵ Gee , Henry . ( 1996 ). Before the Backbone . Springer Netherlands . doi: 10.1007/978-0-585-25272-8 OpenUrl CrossRef ↵ Gerdol , M. , Greco , S. , Marino , R. , Locascio , A. , Plateroti , M. , & Sirakov , M . ( 2024 ). Conserved Signaling Pathways in the Ciona robusta Gut . International Journal of Molecular Sciences , 25 ( 14 ), Article 14. doi: 10.3390/ijms25147846 OpenUrl CrossRef ↵ Gill , H. K. , Yin , S. , Nerurkar , N. L. , Lawlor , J. C. , Lee , C. , Huycke , T. R. , Mahadevan , L. , & Tabin , C. J . ( 2024 ). Hox gene activity directs physical forces to differentially shape chick small and large intestinal epithelia . Developmental Cell , 59 ( 21 ), 2834 – 2849 .e9. doi: 10.1016/j.devcel.2024.07.012 OpenUrl CrossRef PubMed ↵ Grapin-Botton , A. , & Melton , D. A . ( 2000 ). 
Endoderm development: From patterning to organogenesis . Trends in Genetics , 16 ( 3 ), 124 – 130 . doi: 10.1016/S0168-9525(99)01957-5 OpenUrl CrossRef PubMed Web of Science ↵ Griffin , M. , Abu-El-Haija , M. , Abu-El-Haija , M. , Rokhlina , T. , & Uc , A . ( 2012 ). Simplified and Versatile Method for Isolation of High-Quality RNA from Pancreas . BioTechniques , 52 ( 5 ), 332 – 334 . doi: 10.2144/0000113862 OpenUrl CrossRef PubMed ↵ Gu , Z . ( 2022 ). Complex heatmap visualization . iMeta , 1 ( 3 ), e43 . doi: 10.1002/imt2.43 OpenUrl CrossRef PubMed ↵ Gu , Z. , Eils , R. , & Schlesner , M . ( 2016 ). Complex heatmaps reveal patterns and correlations in multidimensional genomic data . Bioinformatics , 32 ( 18 ), 2847 – 2849 . doi: 10.1093/bioinformatics/btw313 OpenUrl CrossRef PubMed ↵ Hahsler , M. , Hornik , K. , & Buchta , C . ( 2008 ). Getting Things in Order: An Introduction to the R Package seriation . Journal of Statistical Software , 25 , 1 – 34 . doi: 10.18637/jss.v025.i03 OpenUrl CrossRef ↵ Hale , M. A. , Swift , G. H. , Hoang , C. Q. , Deering , T. G. , Masui , T. , Lee , Y.-K. , Xue , J. , & MacDonald , R. J . ( 2014 ). The nuclear hormone receptor family member NR5A2 controls aspects of multipotent progenitor cell formation and acinar differentiation during pancreatic organogenesis . Development (Cambridge, England) , 141 ( 16 ), 3123 – 3133 . doi: 10.1242/dev.109405 OpenUrl Abstract / FREE Full Text ↵ Han , J. , Li , G. , Wang , X. , Yang , X. , Guo , J. , Sasaki , O. , & Komiya , T . ( 2018 ). Olivooides-like tube aperture in early Cambrian carinachitids (Medusozoa, Cnidaria) . Journal of Paleontology , 92 ( 1 ), 3 – 13 . doi: 10.1017/jpa.2017.10 OpenUrl CrossRef ↵ Hao , Y. , Stuart , T. , Kowalski , M. H. , Choudhary , S. , Hoffman , P. , Hartman , A. , Srivastava , A. , Molla , G. , Madad , S. , Fernandez-Granda , C. , & Satija , R . ( 2024 ). Dictionary learning for integrative, multimodal and scalable single-cell analysis . 
Nature Biotechnology , 42 ( 2 ), 293 – 304 . doi: 10.1038/s41587-023-01767-y OpenUrl CrossRef PubMed ↵ Hatschek , B . ( 1888 ). Lehrbuch der Zoologie: Eine morphologische Übersicht des Thierreiches zur Einführung in das Studium dieser Wissenschaft / von Berthold Hatschek . G. Fischer,. doi: 10.5962/bhl.title.1381 OpenUrl CrossRef ↵ He , C. , Han , T. , Liao , X. , Guan , R. , Chen , J.-Y. , Tremblay , K. D. , & Lu , Z . ( 2020 ). On the origin of vertebrate body plan: Insights from the endoderm using the hourglass model . Gene Expression Patterns , 37 , 119125 . doi: 10.1016/j.gep.2020.119125 OpenUrl CrossRef PubMed ↵ Hejnol , A. , Gasiorowski , L. , & Martin-Duran , J.-M . ( 2021 ). The Evolution of Hox Genes in Spiralia . doi: 10.20944/preprints202111.0509.v1 OpenUrl CrossRef ↵ Hejnol , A. , & Martindale , M. Q . ( 2008 ). Acoel development indicates the independent evolution of the bilaterian mouth and anus . Nature , 456 ( 7220 ), 382 – 386 . doi: 10.1038/nature07309 OpenUrl CrossRef PubMed Web of Science ↵ Hejnol , A. , & Martín-Durán , J. M . ( 2015 ). Getting to the bottom of anal evolution . Zoologischer Anzeiger - A Journal of Comparative Zoology , 256 , 61 – 74 . doi: 10.1016/j.jcz.2015.02.006 OpenUrl CrossRef ↵ Herrera , M. , Vianello , S. , Mitchell , L. , Chamot , Z. , Lorin-Nebel , C. , Bonnelye , E. , Roux , N. , Besseau , L. , Gibert , Y. , & Laudet , V . ( 2025 ). From Genes to Pathways: A Curated Gene Approach to Accurate Pathway Reconstruction in Teleost Fish Transcriptomics . Journal of Experimental Zoology Part B: Molecular and Developmental Evolution, n/a(n/a) . doi: 10.1002/jez.b.23299 OpenUrl CrossRef ↵ Hoegg , S. , & Meyer , A . ( 2005 ). Hox clusters as models for vertebrate genome evolution . Trends in Genetics: TIG , 21 ( 8 ), 421 – 424 . doi: 10.1016/j.tig.2005.06.004 OpenUrl CrossRef PubMed Web of Science ↵ Holland , N. D. ( 2020 ). Chapter 8—Digestive system in regular sea urchins . In J. M. 
Lawrence (Ed.), Developments in Aquaculture and Fisheries Science (Vol. 43 , pp. 147 – 163 ). Elsevier . doi: 10.1016/B978-0-12-819570-3.00008-1 OpenUrl CrossRef ↵ Horner , B. E. , Taylor , J. M. , & Padykula , H. A . ( 1964 ). Food Habits and Gastric Morphology of the Grasshopper Mouse . Journal of Mammalogy , 45 ( 4 ), 513 – 535 . doi: 10.2307/1377324 OpenUrl CrossRef ↵ Hueber , S. D. , Rauch , J. , Djordjevic , M. A. , Gunter , H. , Weiller , G. F. , & Frickey , T . ( 2013 ). Analysis of central Hox protein types across bilaterian clades: On the diversification of central Hox proteins from an Antennapedia/Hox7-like protein . Developmental Biology , 383 ( 2 ), 175 – 185 . doi: 10.1016/j.ydbio.2013.09.009 OpenUrl CrossRef PubMed ↵ Hueber , S. D. , Weiller , G. F. , Djordjevic , M. A. , & Frickey , T . ( 2010 ). Improving Hox Protein Classification across the Major Model Organisms . PLOS ONE , 5 ( 5 ), e10820 . doi: 10.1371/journal.pone.0010820 OpenUrl CrossRef PubMed ↵ Hui , J. H. L. , Raible , F. , Korchagina , N. , Dray , N. , Samain , S. , Magdelenat , G. , Jubin , C. , Segurens , B. , Balavoine , G. , Arendt , D. , & Ferrier , D. E. K . ( 2009 ). Features of the ancestral bilaterian inferred from Platynereis dumerilii ParaHox genes . BMC Biology , 7 , 43 . doi: 10.1186/1741-7007-7-43 OpenUrl CrossRef PubMed ↵ Iguchi , R. , Nakayama , S. , Sasakura , Y. , Sekiguchi , T. , & Ogasawara , M . ( 2023 ). Repetitive and zonal expression profiles of absorption-related genes in the gastrointestinal tract of ascidian Ciona intestinalis type A . Cell and Tissue Research , 394 ( 2 ), 343 – 360 . doi: 10.1007/s00441-023-03828-9 OpenUrl CrossRef PubMed ↵ Iguchi , R. , Usui , K. , Nakayama , S. , Sasakura , Y. , Sekiguchi , T. , & Ogasawara , M . ( 2023 ). Multi-regional expression of pancreas-related digestive enzyme genes in the intestinal chamber of the ascidian Ciona intestinalis type A . Cell and Tissue Research , 394 ( 3 ), 423 – 430 . 
doi: 10.1007/s00441-023-03839-6 OpenUrl CrossRef PubMed ↵ Illig , R. , Fritsch , H. , & Schwarzer , C . ( 2013 ). Spatio-temporal expression of HOX genes in human hindgut development . Developmental Dynamics: An Official Publication of the American Association of Anatomists , 242 ( 1 ), 53 – 66 . doi: 10.1002/dvdy.23893 OpenUrl CrossRef PubMed ↵ Janssen , R. , Schomburg , C. , Prpic , N.-M. , & Budd , G. E . ( 2022 ). A comprehensive study of arthropod and onychophoran Fox gene expression patterns . PLOS ONE , 17 ( 7 ), e0270790 . doi: 10.1371/journal.pone.0270790 OpenUrl CrossRef PubMed ↵ Kapli , P. , Natsidis , P. , Leite , D. J. , Fursman , M. , Jeffrie , N. , Rahman , I. A. , Philippe , H. , Copley , R. R. , & Telford , M. J . ( 2021 ). Lack of support for Deuterostomia prompts reinterpretation of the first Bilateria . Science Advances , 7 ( 12 ), eabe2741 . doi: 10.1126/sciadv.abe2741 OpenUrl FREE Full Text ↵ Kawazoe , Y. , Sekimoto , T. , Araki , M. , Takagi , K. , Araki , K. , & Yamamura , K . ( 2002 ). Region-specific gastrointestinal Hox code during murine embryonal gut development. Development , Growth & Differentiation , 44 ( 1 ), 77 – 84 . doi: 10.1046/j.1440-169x.2002.00623.x OpenUrl CrossRef PubMed Web of Science ↵ Kerstjens , S. , Engert , F. , Zador , A. M. , & Douglas , R. J . ( 2024 ). Eigengene reveals invariant global spatial patterns across mouse and fish brain development (p. 2024.09.19.613507) . bioRxiv . doi: 10.1101/2024.09.19.613507 OpenUrl Abstract / FREE Full Text ↵ Koelz , H. R . ( 1992 ). Gastric Acid in Vertebrates . Scandinavian Journal of Gastroenterology , 27 ( sup193 ), 2 – 6 . doi: 10.3109/00365529209095998 OpenUrl CrossRef ↵ Korpelainen , E. , Tuimala , J. , Somervuo , P. , Huss , M. , & Wong , G . ( 2014 ). RNA-seq Data Analysis: A Practical Approach . Chapman and Hall/CRC . doi: 10.1201/b17457 OpenUrl CrossRef ↵ Kuehn , E. , Stockinger , A. W. , Girard , J. , Raible , F. , & Özpolat , B. D . ( 2019 ). 
A scalable culturing system for the marine annelid Platynereis dumerilii . PloS One , 14 ( 12 ), e0226156 . doi: 10.1371/journal.pone.0226156 OpenUrl CrossRef PubMed ↵ Kurosawa , G. , Takamatsu , N. , Takahashi , M. , Sumitomo , M. , Sanaka , E. , Yamada , K. , Nishii , K. , Matsuda , M. , Asakawa , S. , Ishiguro , H. , Miura , K. , Kurosawa , Y. , Shimizu , N. , Kohara , Y. , & Hori , H . ( 2006 ). Organization and structure of hox gene loci in medaka genome and comparison with those of pufferfish and zebrafish genomes . Gene , 370 , 75 – 82 . doi: 10.1016/j.gene.2005.11.015 OpenUrl CrossRef PubMed Web of Science ↵ Langmead , B. , & Salzberg , S. L . ( 2012 ). Fast gapped-read alignment with Bowtie 2 . Nature Methods , 9 ( 4 ), 357 – 359 . doi: 10.1038/nmeth.1923 OpenUrl CrossRef PubMed Web of Science ↵ Larroux , C. , Luke , G. N. , Koopman , P. , Rokhsar , D. S. , Shimeld , S. M. , & Degnan , B. M . ( 2008 ). Genesis and Expansion of Metazoan Transcription Factor Gene Classes . Molecular Biology and Evolution , 25 ( 5 ), 980 – 996 . doi: 10.1093/molbev/msn047 OpenUrl CrossRef PubMed Web of Science ↵ Laudet , V . ( 2011 ). The origins and evolution of vertebrate metamorphosis . Current Biology: CB , 21 ( 18 ), R726 – 737 . doi: 10.1016/j.cub.2011.07.030 OpenUrl CrossRef PubMed ↵ Laumer , C. E. , Gruber-Vodicka , H. , Hadfield , M. G. , Pearse , V. B. , Riesgo , A. , Marioni , J. C. , & Giribet , G . ( 2018 ). Support for a clade of Placozoa and Cnidaria in genes with minimal compositional bias . eLife , 7 , e36278 . doi: 10.7554/eLife.36278 OpenUrl CrossRef ↵ Lê Cao , K.-A. , Boitard , S. , & Besse , P. ( 2011 ). Sparse PLS discriminant analysis: Biologically relevant feature selection and graphical displays for multiclass problems . BMC Bioinformatics , 12 ( 1 ), 253 . doi: 10.1186/1471-2105-12-253 OpenUrl CrossRef PubMed ↵ Lê Cao , K.-A. , Rossouw , D. , Robert-Granié , C. , & Besse , P. ( 2008 ). A sparse PLS for variable selection when integrating omics data . 
Statistical Applications in Genetics and Molecular Biology , 7 ( 1 ), Article 35. doi: 10.2202/1544-6115.1390 OpenUrl CrossRef PubMed ↵ Lenz , M. , Müller , F.-J. , Zenke , M. , & Schuppert , A . ( 2016 ). Principal components analysis and the reported low intrinsic dimensionality of gene expression microarray data . Scientific Reports , 6 ( 1 ), 25696 . doi: 10.1038/srep25696 OpenUrl CrossRef PubMed ↵ Li , H.-Y. , & Zhang , S.-C . ( 2010 ). [Hepatic caecum of amphioxus and origin of vertebrate liver] . Yi Chuan = Hereditas , 32 ( 5 ), 437 – 442 . doi: 10.3724/sp.j.1005.2010.00437 OpenUrl CrossRef PubMed ↵ Liao , Y. , Smyth , G. K. , & Shi , W . ( 2014 ). featureCounts: An efficient general purpose program for assigning sequence reads to genomic features . Bioinformatics , 30 ( 7 ), 923 – 930 . doi: 10.1093/bioinformatics/btt656 OpenUrl CrossRef PubMed Web of Science ↵ Lichtenberg , K. H. de , Seymour , P. A. , Jørgensen , M. C. , Kim , Y.-H. , Grapin-Botton , A. , Magnuson , M. A. , Nakic , N. , Ferrer , J. , & Serup , P. ( 2018 ). Notch Controls Multiple Pancreatic Cell Fate Regulators Through Direct Hes1 -mediated Repression (p. 336305) . bioRxiv . doi: 10.1101/336305 OpenUrl Abstract / FREE Full Text ↵ Lickwar , C. R. , Camp , J. G. , Weiser , M. , Cocchiaro , J. L. , Kingsley , D. M. , Furey , T. S. , Sheikh , S. Z. , & Rawls , J. F . ( 2017 ). Genomic dissection of conserved transcriptional regulation in intestinal epithelial cells . PLOS Biology , 15 ( 8 ), e2002054 . doi: 10.1371/journal.pbio.2002054 OpenUrl CrossRef PubMed ↵ Lin , C.-Y. , Marlétaz , F. , Pérez-Posada , A. , Martínez-García , P. M. , Schloissnig , S. , Peluso , P. , Conception , G. T. , Bump , P. , Chen , Y.-C. , Chou , C. , Lin , C.-Y. , Fan , T.-P. , Tsai , C.-T. , Skarmeta , J. L. G. , Tena , J. J. , Lowe , C. J. , Rank , D. R. , Rokhsar , D. S. , Yu , J.-K. , & Su , Y.-H . ( 2024 ). 
Chromosome-level genome assemblies of 2 hemichordates provide new insights into deuterostome origin and chromosome evolution . PLOS Biology , 22 ( 6 ), e3002661 . doi: 10.1371/journal.pbio.3002661 OpenUrl CrossRef PubMed ↵ Lin , C.-Y. , Tung , C.-H. , Yu , J.-K. , & Su , Y.-H . ( 2016 ). Reproductive periodicity, spawning induction, and larval metamorphosis of the hemichordate acorn worm Ptychodera flava . Journal of Experimental Zoology Part B: Molecular and Developmental Evolution , 326 ( 1 ), 47 – 60 . doi: 10.1002/jez.b.22665 OpenUrl CrossRef ↵ Litingtung , Y. , Lei , L. , Westphal , H. , & Chiang , C . ( 1998 ). Sonic hedgehog is essential to foregut development . Nature Genetics , 20 ( 1 ), 58 – 61 . doi: 10.1038/1717 OpenUrl CrossRef PubMed Web of Science ↵ Lobo-da-Cunha , A . ( 2019 ). Structure and function of the digestive system in molluscs . Cell and Tissue Research , 377 ( 3 ), 475 – 503 . doi: 10.1007/s00441-019-03085-9 OpenUrl CrossRef PubMed ↵ Love , M. I. , Huber , W. , & Anders , S . ( 2014 ). Moderated estimation of fold change and dispersion for RNA-seq data with DESeq2 . Genome Biology , 15 ( 12 ), 550 . doi: 10.1186/s13059-014-0550-8 OpenUrl CrossRef PubMed ↵ Lv , Y. , Gao , X. , Dai , Q. , Zhu , L. , Liu , S. , Hu , Z. , Lu , J. , Zhou , H. , Jin , J. , & Mei , Z . ( 2024 ). Functional insights of digestion, absorption, and immunity in different segments of the intestine in Hemibarbus labeo from transcriptomic analysis . Comparative Biochemistry and Physiology Part D: Genomics and Proteomics , 52 , 101278 . doi: 10.1016/j.cbd.2024.101278 OpenUrl CrossRef ↵ Maderspacher , F . ( 2009 ). Breakthroughs and blind ends . Current Biology: CB , 19 ( 7 ), R272 – 274 . doi: 10.1016/j.cub.2009.03.043 OpenUrl CrossRef ↵ Magri , M. S. , Voronov , D. , Foley , S. , Martínez-García , P. M. , Franke , M. , Cary , G. A. , Santos-Pereira , J. M. , Cuomo , C. , Fernández-Moreno , M. , Gil-Galvez , A. , Acemel , R. D. , Paganos , P. , Ku , C. , Ranđelović , J. 
, Rusciano , M. L. , Firbas , P. N. , Gómez-Skarmeta , J. L. , Hinman , V. F. , Arnone , M. I. , & Maeso , I . ( 2024 ). Deep conservation of cis-regulatory elements and chromatin organization in echinoderms uncover ancestral regulatory features of animal genomes (p. 2024.11.30.626178) . bioRxiv . doi: 10.1101/2024.11.30.626178 OpenUrl Abstract / FREE Full Text ↵ Mantica , F. , Iñiguez , L. P. , Marquez , Y. , Permanyer , J. , Torres-Mendez , A. , Cruz , J. , Franch-Marro , X. , Tulenko , F. , Burguera , D. , Bertrand , S. , Doyle , T. , Nouzova , M. , Currie , P. D. , Noriega , F. G. , Escriva , H. , Arnone , M. I. , Albertin , C. B. , Wotton , K. R. , Almudi , I. , … Irimia , M . ( 2024 ). Evolution of tissue-specific expression of ancestral genes across vertebrates and insects . Nature Ecology & Evolution , 8 ( 6 ), 1140 – 1153 . doi: 10.1038/s41559-024-02398-5 OpenUrl CrossRef ↵ Marianes , A. , & Spradling , A. C . ( 2013 ). Physiological and stem cell compartmentalization within the Drosophila midgut . eLife , 2 , e00886 . doi: 10.7554/eLife.00886 OpenUrl CrossRef PubMed ↵ Martin Vázquez , E. , Cobo-Vuilleumier , N. , Araujo Legido , R. , Marín-Cañas , S. , Nola , E. , Dorronsoro , A. , López Bermudo , L. , Crespo , A. , Romero-Zerbo , S. Y. , García-Fernández , M. , Martin Montalvo , A. , Rojas , A. , Comaills , V. , Bérmudez-Silva , F. J. , Gannon , M. , Martin , F. , Eizirik , D. , Lorenzo , P. I. , & Gauthier , B. R. ( 2022 ). NR5A2/LRH-1 regulates the PTGS2-PGE2-PTGER1 pathway contributing to pancreatic islet survival and function . iScience , 25 ( 5 ), 104345 . doi: 10.1016/j.isci.2022.104345 OpenUrl CrossRef ↵ Martynov , A. V. , & Korshunova , T. A . ( 2022 ). Renewed perspectives on the sedentary-pelagic last common bilaterian ancestor . Contributions to Zoology , 91 ( 4–5 ), 285 – 352 . doi: 10.1163/18759866-bja10034 OpenUrl CrossRef ↵ Matsubara , S. , Osugi , T. , Shiraishi , A. , Wada , A. , & Satake , H . ( 2021 ). 
Comparative analysis of transcriptomic profiles among ascidians, zebrafish, and mice: Insights from tissue-specific gene expression . PLOS ONE , 16 ( 9 ), e0254308 . doi: 10.1371/journal.pone.0254308 OpenUrl CrossRef PubMed ↵ Mayeur , H. , Leyhr , J. , Mulley , J. , Leurs , N. , Michel , L. , Sharma , K. , Lagadec , R. , Aury , J.-M. , Osborne , O. G. , Mulhair , P. , Poulain , J. , Mangenot , S. , Mead , D. , Smith , M. , Corton , C. , Oliver , K. , Skelton , J. , Betteridge , E. , Dolucan , J. , … Debiais-Thibaud , M . ( 2024 ). The sensory shark: High-quality morphological, genomic and transcriptomic data for the small-spotted catshark Scyliorhinus canicula reveal the molecular bases of sensory organ evolution in jawed vertebrates (p. 2024.05.23.595469) . bioRxiv . doi: 10.1101/2024.05.23.595469 OpenUrl Abstract / FREE Full Text ↵ Mayorova , T. D. , Koch , T. L. , Kachar , B. , Jung , J. H. , Reese , T. S. , & Smith , C. L . ( 2025 ). Placozoan secretory cell types implicated in feeding, innate immunity and regulation of behavior (p. 2024.09.18.613768) . bioRxiv . doi: 10.1101/2024.09.18.613768 OpenUrl Abstract / FREE Full Text ↵ McCarthy , D. J. , Chen , Y. , & Smyth , G. K . ( 2012 ). Differential expression analysis of multifactor RNA-Seq experiments with respect to biological variation . Nucleic Acids Research , 40 ( 10 ), 4288 – 4297 . doi: 10.1093/nar/gks042 OpenUrl CrossRef PubMed Web of Science ↵ M’Intosh , W. C . ( 1879 ). On a Remarkably Branched Syllis, dredged by H.M.S. ‘Challenger.’ Journal of the Linnean Society of London, Zoology , 14 ( 80 ), 720 – 724 . doi: 10.1111/j.1096-3642.1879.tb02356.x OpenUrl CrossRef ↵ Mistry , J. , Chuguransky , S. , Williams , L. , Qureshi , M. , Salazar , G. A. , Sonnhammer , E. L. L. , Tosatto , S. C. E. , Paladin , L. , Raj , S. , Richardson , L. J. , Finn , R. D. , & Bateman , A . ( 2021 ). Pfam: The protein families database in 2021 . Nucleic Acids Research , 49 ( D1 ), D412 – D419 . 
doi: 10.1093/nar/gkaa913 OpenUrl CrossRef PubMed ↵ Miyake , H. , Wada , S. , Adachi , A. , Ohtsuka , S. , Ikeda , S. , Yonetani , M. , Pagliawan , H. B. , Metillo , E. B. , & Okoshi , K . ( 2019 ). Benthic platyctenid ctenophore, Vallicula multiformis Rankin, 1956, found in an aquarium on Palawan Island, the Philippines . Plankton and Benthos Research , 14 ( 1 ), 14 – 21 . doi: 10.3800/pbr.14.14 OpenUrl CrossRef ↵ Morgan , R . ( 2006 ). Hox genes: A continuation of embryonic patterning? Trends in Genetics: TIG , 22 ( 2 ), 67 – 69 . doi: 10.1016/j.tig.2005.11.004 OpenUrl CrossRef PubMed Web of Science ↵ Morton , J. T. , Toran , L. , Edlund , A. , Metcalf , J. L. , Lauber , C. , & Knight , R . ( 2017 ). Uncovering the Horseshoe Effect in Microbial Analyses . mSystems , 2 ( 1 ), e00166-16 . doi: 10.1128/msystems.00166-16 OpenUrl CrossRef ↵ Nakayama , S. , & Ogasawara , M . ( 2017 ). Compartmentalized expression patterns of pancreatic- and gastric-related genes in the alimentary canal of the ascidian Ciona intestinalis: Evolutionary insights into the functional regionality of the gastrointestinal tract in Olfactores . Cell and Tissue Research , 370 ( 1 ), 113 – 128 . doi: 10.1007/s00441-017-2627-7 OpenUrl CrossRef PubMed ↵ Nakayama , S. , Satou , K. , Orito , W. , & Ogasawara , M . ( 2016 ). Ordered expression pattern of Hox and ParaHox genes along the alimentary canal in the ascidian juvenile . Cell and Tissue Research , 365 ( 1 ), 65 – 75 . doi: 10.1007/s00441-016-2360-7 OpenUrl CrossRef PubMed ↵ Nakayama , S. , Sekiguchi , T. , & Ogasawara , M . ( 2019 ). Molecular and evolutionary aspects of the protochordate digestive system . Cell and Tissue Research , 377 ( 3 ), 309 – 320 . doi: 10.1007/s00441-019-03035-5 OpenUrl CrossRef PubMed ↵ Nakazawa , K. , Yamazawa , T. , Moriyama , Y. , Ogura , Y. , Kawai , N. , Sasakura , Y. , & Saiga , H . ( 2013 ). 
Formation of the digestive tract in Ciona intestinalis includes two distinct morphogenic processes between its anterior and posterior parts . Developmental Dynamics: An Official Publication of the American Association of Anatomists , 242 ( 10 ), 1172 – 1183 . doi: 10.1002/dvdy.24009 OpenUrl CrossRef PubMed ↵ Nanglu , K. , Cole , S. R. , Wright , D. F. , & Souto , C . ( 2023 ). Worms and gills, plates and spines: The evolutionary origins and incredible disparity of deuterostomes revealed by fossils, genes, and development . Biological Reviews , 98 ( 1 ), 316 – 351 . doi: 10.1111/brv.12908 OpenUrl CrossRef ↵ Nehrt , N. L. , Clark , W. T. , Radivojac , P. , & Hahn , M. W . ( 2011 ). Testing the Ortholog Conjecture with Comparative Functional Genomic Data from Mammals . PLOS Computational Biology , 7 ( 6 ), e1002073 . doi: 10.1371/journal.pcbi.1002073 OpenUrl CrossRef PubMed ↵ Nissim , S. , Weeks , O. , Talbot , J. C. , Hedgepeth , J. W. , Wucherpfennig , J. , Schatzman-Bone , S. , Swinburne , I. , Cortes , M. , Alexa , K. , Megason , S. , North , T. E. , Amacher , S. L. , & Goessling , W . ( 2016 ). Iterative use of nuclear receptor Nr5a2 regulates multiple stages of liver and pancreas development . Developmental Biology , 418 ( 1 ), 108 – 123 . doi: 10.1016/j.ydbio.2016.07.019 OpenUrl CrossRef PubMed ↵ Novembre , J. , & Stephens , M . ( 2008 ). Interpreting principal component analyses of spatial population genetic variation . Nature Genetics , 40 ( 5 ), 646 – 649 . doi: 10.1038/ng.139 OpenUrl CrossRef PubMed Web of Science ↵ Nowotschin , S. , & Hadjantonakis , A.-K. ( 2020 ). Chapter Fifteen - Guts and gastrulation: Emergence and convergence of endoderm in the mouse embryo . In L. Solnica-Krezel (Ed.), Current Topics in Developmental Biology (Vol. 136 , pp. 429 – 454 ). Academic Press . doi: 10.1016/bs.ctdb.2019.11.012 OpenUrl CrossRef PubMed ↵ Nowotschin , S. , Setty , M. , Kuo , Y.-Y. , Liu , V. , Garg , V. , Sharma , R. , Simon , C. S. 
, Saiz , N. , Gardner , R. , Boutet , S. C. , Church , D. M. , Hoodless , P. A. , Hadjantonakis , A.-K. , & Pe’er , D . ( 2019 ). The emergent landscape of the mouse gut endoderm at single-cell resolution . Nature , 569 ( 7756 ), 361 – 367 . doi: 10.1038/s41586-019-1127-1 OpenUrl CrossRef PubMed ↵ Onai , T. , Aramaki , T. , Inomata , H. , Hirai , T. , & Kuratani , S . ( 2015 ). Ancestral mesodermal reorganization and evolution of the vertebrate head . Zoological Letters , 1 ( 1 ), 29 . doi: 10.1186/s40851-015-0030-3 OpenUrl CrossRef PubMed ↵ Özpolat , B. D. , Randel , N. , Williams , E. A. , Bezares-Calderón , L. A. , Andreatta , G. , Balavoine , G. , Bertucci , P. Y. , Ferrier , D. E. K. , Gambi , M. C. , Gazave , E. , Handberg-Thorsager , M. , Hardege , J. , Hird , C. , Hsieh , Y.-W. , Hui , J. , Mutemi , K. N. , Schneider , S. Q. , Simakov , O. , Vergara , H. M. , … Arendt , D . ( 2021 ). The Nereid on the rise: Platynereis as a model system . EvoDevo , 12 ( 1 ), 10 . doi: 10.1186/s13227-021-00180-3 OpenUrl CrossRef PubMed ↵ Paganos , P. , Ronchi , P. , Carl , J. , Mizzon , G. , Martinez , P. , Benvenuto , G. , & Arnone , M. I . ( 2022 ). Integrating single cell transcriptomics and volume electron microscopy confirms the presence of pancreatic acinar-like cells in sea urchins . Frontiers in Cell and Developmental Biology , 10 . doi: 10.3389/fcell.2022.991664 OpenUrl CrossRef ↵ Paganos , P. , Ullrich-Lüter , J. , Almazán , A. , Voronov , D. , Carl , J. , Zakrzewski , A.-C. , Zemann , B. , Rusciano , M. L. , Sancerni , T. , Schauer , M. , Akar , O. , Caccavale , F. , Cocurullo , M. , Benvenuto , G. , Croce , J. C. , Lüter , C. , & Arnone , M. I . ( 2025 ). Single Nucleus Profiling Highlights the All-Brain Echinoderm Nervous System (p. 2025.03.24.644250) . bioRxiv . doi: 10.1101/2025.03.24.644250 OpenUrl Abstract / FREE Full Text ↵ Pan , W. , Wang , X. , Ren , C. , Jiang , X. , Gong , S. , Xie , Z. , Wong , N.-K. , Li , X. , Huang , J. , Fan , D. , Luo , P. 
, Yang , Y. , Ren , X. , Yu , S. , Qin , Z. , Wu , X. , Huo , D. , Ma , B. , Liu , Y. , … Chen , T . ( 2024 ). Sea cucumbers and their symbiotic microbiome have evolved to feed on seabed sediments . Nature Communications , 15 ( 1 ), 8825 . doi: 10.1038/s41467-024-53205-5 OpenUrl CrossRef PubMed ↵ Park , J. , Levic , D. S. , Sumigray , K. D. , Bagwell , J. , Eroglu , O. , Block , C. L. , Eroglu , C. , Barry , R. , Lickwar , C. R. , Rawls , J. F. , Watts , S. A. , Lechler , T. , & Bagnat , M . ( 2019 ). Lysosome-Rich Enterocytes Mediate Protein Absorption in the Vertebrate Gut . Developmental Cell , 51 ( 1 ), 7 – 20 .e6. doi: 10.1016/j.devcel.2019.08.001 OpenUrl CrossRef PubMed ↵ Patro , R. , Duggal , G. , Love , M. I. , Irizarry , R. A. , & Kingsford , C . ( 2017 ). Salmon provides fast and bias-aware quantification of transcript expression . Nature Methods , 14 ( 4 ), 417 – 419 . doi: 10.1038/nmeth.4197 OpenUrl CrossRef PubMed ↵ Perillo , M. , Wang , Y. J. , Leach , S. D. , & Arnone , M. I . ( 2016 ). A pancreatic exocrine-like cell regulatory circuit operating in the upper stomach of the sea urchin Strongylocentrotus purpuratus larva . BMC Evolutionary Biology , 16 ( 1 ), 117 . doi: 10.1186/s12862-016-0686-0 OpenUrl CrossRef PubMed ↵ Peterson , K. J. , & Eernisse , D. J . ( 2016 ). The phylogeny, evolutionary developmental biology, and paleobiology of the Deuterostomia: 25 years of new techniques, new discoveries, and new ideas . Organisms Diversity & Evolution , 16 ( 2 ), 401 – 418 . doi: 10.1007/s13127-016-0270-x OpenUrl CrossRef ↵ Picciani , N. , Berger , C. A. , Nielsen , S. , Musser , J. , Oel , A. P. , Stoilova , M. I. , Arendt , D. , Garm , A. , & Oakley , T. H . ( 2025 ). Comparative analysis of convergent jellyfish eyes reveals extensive differences in expression of vision-related genes (p. 2025.03.14.642713) . bioRxiv . doi: 10.1101/2025.03.14.642713 OpenUrl Abstract / FREE Full Text ↵ Podani , J. , & Miklós , I . ( 2002 ). 
Resemblance Coefficients and the Horseshoe Effect in Principal Coordinates Analysis . Ecology , 83 ( 12 ), 3331 – 3343 . doi: 10.1890/0012-9658(2002)083[3331:RCATHE]2.0.CO;2 OpenUrl CrossRef Web of Science ↵ Potter , S. C. , Luciani , A. , Eddy , S. R. , Park , Y. , Lopez , R. , & Finn , R. D . ( 2018 ). HMMER web server: 2018 update . Nucleic Acids Research , 46 ( W1 ), W200 – W204 . doi: 10.1093/nar/gky448 OpenUrl CrossRef PubMed ↵ Presnell , J. S. , Vandepas , L. E. , Warren , K. J. , Swalla , B. J. , Amemiya , C. T. , & Browne , W. E . ( 2016 ). The Presence of a Functionally Tripartite Through-Gut in Ctenophora Has Implications for Metazoan Character Trait Evolution . Current Biology: CB , 26 ( 20 ), 2814 – 2820 . doi: 10.1016/j.cub.2016.08.019 OpenUrl CrossRef PubMed ↵ Ritchie , M. E. , Phipson , B. , Wu , D. , Hu , Y. , Law , C. W. , Shi , W. , & Smyth , G. K . ( 2015 ). Limma powers differential expression analyses for RNA-sequencing and microarray studies . Nucleic Acids Research , 43 ( 7 ), e47 – e47 . doi: 10.1093/nar/gkv007 OpenUrl CrossRef PubMed ↵ Robinson , M. D. , McCarthy , D. J. , & Smyth , G. K . ( 2010 ). edgeR: A Bioconductor package for differential expression analysis of digital gene expression data . Bioinformatics , 26 ( 1 ), 139 – 140 . doi: 10.1093/bioinformatics/btp616 OpenUrl CrossRef PubMed Web of Science ↵ Rohart , F. , Gautier , B. , Singh , A. , & Cao , K.-A. L . ( 2017 ). mixOmics: An R package for ‘omics feature selection and multiple data integration . PLOS Computational Biology , 13 ( 11 ), e1005752 . doi: 10.1371/journal.pcbi.1005752 OpenUrl CrossRef PubMed ↵ Roux , N. , Logeux , V. , Trouillard , N. , Pillot , R. , Magré , K. , Salis , P. , Lecchini , D. , Besseau , L. , Laudet , V. , & Romans , P . ( 2021 ). A star is born again: Methods for larval rearing of an emerging model organism, the False clownfish Amphiprion ocellaris . 
Journal of Experimental Zoology Part B: Molecular and Developmental Evolution , 336 ( 4 ), 376 – 385 . doi: 10.1002/jez.b.23028 OpenUrl CrossRef ↵ Roux , N. , Salis , P. , Lee , S.-H. , Besseau , L. , & Laudet , V . ( 2020 ). Anemonefish, a model for Eco-Evo-Devo . EvoDevo , 11 ( 1 ), 20 . doi: 10.1186/s13227-020-00166-7 OpenUrl CrossRef PubMed ↵ RStudio Team . ( 2020 ). RStudio: Integrated Development Environment for R . RStudio, PBC . http://www.rstudio.com/ ↵ Ruppert , E. E. , Fox , R. S. , & Barnes , R. D . ( 2004 ). Invertebrate zoology: A functional evolutionary approach (7th ed) . Thomson-Brooks/Cole . ↵ Ryu , T. , Herrera , M. , Moore , B. , Izumiyama , M. , Kawai , E. , Laudet , V. , & Ravasi , T . ( 2022 ). A chromosome-scale genome assembly of the false clownfish, Amphiprion ocellaris . G3 Genes|Genomes|Genetics , 12 ( 5 ), jkac074 . doi: 10.1093/g3journal/jkac074 OpenUrl CrossRef ↵ Sahlin , K. , & Olsson , R . ( 1986 ). The Wheel Organ and Hatschek’s Groove in the Lancelet, Branchiostoma lanceolatum (Cephalochordata) . Acta Zoologica , 67 ( 4 ), 201 – 209 . doi: 10.1111/j.1463-6395.1986.tb00864.x OpenUrl CrossRef ↵ Santini , S. , & Bernardi , G . ( 2005 ). Organization and base composition of tilapia Hox genes: Implications for the evolution of Hox clusters in fish . Gene , 346 , 51 – 61 . doi: 10.1016/j.gene.2004.10.027 OpenUrl CrossRef PubMed Web of Science ↵ Sayols , S. , Scherzinger , D. , & Klein , H . ( 2016 ). dupRadar: A Bioconductor package for the assessment of PCR artifacts in RNA-Seq data . BMC Bioinformatics , 17 ( 1 ), 428 . doi: 10.1186/s12859-016-1276-2 OpenUrl CrossRef PubMed ↵ Schiffbauer , J. D. , Selly , T. , Jacquet , S. M. , Merz , R. A. , Nelson , L. L. , Strange , M. A. , Cai , Y. , & Smith , E. F . ( 2020 ). Discovery of bilaterian-type through-guts in cloudinomorphs from the terminal Ediacaran Period . Nature Communications , 11 ( 1 ), 205 . doi: 10.1038/s41467-019-13882-z OpenUrl CrossRef PubMed ↵ Sekimoto , T. 
, Yoshinobu , K. , Yoshida , M. , Kuratani , S. , Fujimoto , S. , Araki , M. , Tajima , N. , Araki , K. , & Yamamura , K . ( 1998 ). Region-specific expression of murine Hox genes implies the Hox code-mediated patterning of the digestive tract . Genes to Cells: Devoted to Molecular & Cellular Mechanisms , 3 ( 1 ), 51 – 64 . doi: 10.1046/j.1365-2443.1998.00167.x OpenUrl CrossRef PubMed Web of Science ↵ Shah , N. , Meng , Q. , Zou , Z. , & Zhang , X . ( 2024 ). Systematic analysis on the horse-shoe-like effect in PCA plots of scRNA-seq data . Bioinformatics Advances , 4 ( 1 ), vbae109 . doi: 10.1093/bioadv/vbae109 OpenUrl CrossRef ↵ Shen , W.-K. , Chen , S.-Y. , Gan , Z.-Q. , Zhang , Y.-Z. , Yue , T. , Chen , M.-M. , Xue , Y. , Hu , H. , & Guo , A.-Y . ( 2023 ). AnimalTFDB 4.0: A comprehensive animal transcription factor database updated with variation and expression annotations . Nucleic Acids Research , 51 ( D1 ), D39 – D45 . doi: 10.1093/nar/gkac907 OpenUrl CrossRef PubMed ↵ Sherwood , R. I. , Chen , T.-Y. A. , & Melton , D. A . ( 2009 ). Transcriptional dynamics of endodermal organ formation . Developmental Dynamics , 238 ( 1 ), 29 – 42 . doi: 10.1002/dvdy.21810 OpenUrl CrossRef PubMed Web of Science ↵ Shinn , M . ( 2023 ). Phantom oscillations in principal component analysis . Proceedings of the National Academy of Sciences , 120 ( 48 ), e2311420120 . doi: 10.1073/pnas.2311420120 OpenUrl CrossRef PubMed ↵ Silva , A. S. , Natsidis , P. , Piovani , L. , Kapli , P. , & Telford , M. J . ( 2025 ). Support for the deuterostome clade comes from systematic errors (p. 2025.01.13.632777) . bioRxiv . doi: 10.1101/2025.01.13.632777 OpenUrl Abstract / FREE Full Text ↵ Smith , C. L. , & Mayorova , T. D . ( 2019 ). Insights into the evolution of digestive systems from studies of Trichoplax adhaerens . Cell and Tissue Research , 377 ( 3 ), 353 – 367 . doi: 10.1007/s00441-019-03057-z OpenUrl CrossRef PubMed ↵ Soneson , C. , Love , M. I. , & Robinson , M. D . ( 2015 ). 
Differential analyses for RNA-seq: Transcript-level estimates improve gene-level inferences . F1000Research , 4 , 1521 . doi: 10.12688/f1000research.7563.2 OpenUrl CrossRef ↵ Stumpp , M. , Hu , M. Y. , Tseng , Y.-C. , Guh , Y.-J. , Chen , Y.-C. , Yu , J.-K. , Su , Y.-H. , & Hwang , P.-P . ( 2015 ). Evolution of extreme stomach pH in bilateria inferred from gastric alkalization mechanisms in basal deuterostomes . Scientific Reports , 5 ( 1 ), 10421 . doi: 10.1038/srep10421 OpenUrl CrossRef PubMed ↵ Subbotin , V . ( 2017 ). Arguments on the origin of the vertebrate liver and the amphioxus hepatic diverticulum: A hypothesis on evolutionary novelties . Pisma v Vavilovskii Zhurnal . ↵ Sudhakaran , A. , & Peter , M. C. S . ( 2025 ). Effects of L-NAME and air exposure on mitochondrial energetic markers, thyroid hormone receptor/regulator system and stress/ease-responsive receptor expression in the brain/gut axis of zebrafish . Comparative Biochemistry and Physiology Part C: Toxicology & Pharmacology , 287 , 110043 . doi: 10.1016/j.cbpc.2024.110043 OpenUrl CrossRef ↵ Takatori , N. , Butts , T. , Candiani , S. , Pestarino , M. , Ferrier , D. E. K. , Saiga , H. , & Holland , P. W. H . ( 2008 ). Comprehensive survey and classification of homeobox genes in the genome of amphioxus, Branchiostoma floridae . Development Genes and Evolution , 218 ( 11 ), 579 – 590 . doi: 10.1007/s00427-008-0245-9 OpenUrl CrossRef PubMed Web of Science ↵ Tamm , S. L . ( 2019 ). Defecation by the ctenophore Mnemiopsis leidyi occurs with an ultradian rhythm through a single transient anal pore . Invertebrate Biology , 138 ( 1 ), 3 – 16 . doi: 10.1111/ivb.12236 OpenUrl CrossRef ↵ Tarashansky , A. J. , Musser , J. M. , Khariton , M. , Li , P. , Arendt , D. , Quake , S. R. , & Wang , B . ( 2021 ). Mapping single-cell atlases throughout Metazoa unravels cell type evolution . eLife , 10 , e66747 . doi: 10.7554/eLife.66747 OpenUrl CrossRef PubMed ↵ Van den Berge , K. , Roux de Bézieux , H. , Street , K. 
, Saelens , W. , Cannoodt , R. , Saeys , Y. , Dudoit , S. , & Clement , L. ( 2020 ). Trajectory-based differential expression analysis for single-cell sequencing data . Nature Communications , 11 ( 1 ), 1201 . doi: 10.1038/s41467-020-14766-3 OpenUrl CrossRef ↵ van der Hoeven , F. , Sordino , P. , Fraudeau , N. , Izpisúa-Belmonte , J. C. , & Duboule , D. ( 1996 ). Teleost HoxD and HoxA genes: Comparison with tetrapods and functional evolution of the HOXD complex . Mechanisms of Development , 54 ( 1 ), 9 – 21 . doi: 10.1016/0925-4773(95)00455-6 OpenUrl CrossRef PubMed Web of Science ↵ Voronov , D. , Paganos , P. , Magri , M. S. , Cuomo , C. , Maeso , I. , Gómez-Skarmeta , J. L. , & Arnone , M. I . ( 2024 ). Integrative multi-omics increase resolution of the sea urchin posterior gut gene regulatory network at single-cell level . Development , 151 ( 16 ), dev202278 . doi: 10.1242/dev.202278 OpenUrl CrossRef ↵ Wallace , K. N. , & Pack , M . ( 2003 ). Unique and conserved aspects of gut development in zebrafish . Developmental Biology , 255 ( 1 ), 12 – 29 . doi: 10.1016/S0012-1606(02)00034-9 OpenUrl CrossRef PubMed Web of Science ↵ Wang , L.-J. , Wang , W.-L. , Gao , H. , Bai , Y.-Z. , & Zhang , S.-C . ( 2018 ). FOXD3/FOXD4 is required for the development of hindgut in the rat model of anorectal malformation . Experimental Biology and Medicine , 243 ( 4 ), 327 – 333 . doi: 10.1177/1535370217751073 OpenUrl CrossRef PubMed ↵ Wang , Z. , Du , J. , Lam , S. H. , Mathavan , S. , Matsudaira , P. , & Gong , Z . ( 2010 ). Morphological and molecular evidence for functional organization along the rostrocaudal axis of the adult zebrafish intestine . BMC Genomics , 11 ( 1 ), 392 . doi: 10.1186/1471-2164-11-392 OpenUrl CrossRef PubMed ↵ Weinrauch , A. M. , Kwan , G. T. , Giacomin , M. , Bouyoucos , I. A. , Tresguerres , M. , & Goss , G. G . ( 2025 ). Evolutionary insights into gut acidification: Invertebrate-like mechanisms in the basal vertebrate hagfish . 
Journal of Experimental Biology , 228 ( 14 ), jeb249641. doi: 10.1242/jeb.249641 OpenUrl CrossRef ↵ Wen , J. , Mercado , G. P. , Volland , A. , Doden , H. L. , Lickwar , C. R. , Crooks , T. , Kakiyama , G. , Kelly , C. , Cocchiaro , J. L. , Ridlon , J. M. , & Rawls , J. F . ( 2021 ). Fxr signaling and microbial metabolism of bile salts in the zebrafish intestine . Science Advances , 7 ( 30 ), eabg1371 . doi: 10.1126/sciadv.abg1371 OpenUrl FREE Full Text ↵ Wickham , H . ( 2016 ). ggplot2 . Springer International Publishing . doi: 10.1007/978-3-319-24277-4 OpenUrl CrossRef ↵ Wilkie , I. C . ( 2001 ). Autotomy as a prelude to regeneration in echinoderms . Microscopy Research and Technique , 55 ( 6 ), 369 – 396 . doi: 10.1002/jemt.1185 OpenUrl CrossRef PubMed Web of Science ↵ Wingett , S. W. , & Andrews , S . ( 2018 ). FastQ Screen: A tool for multi-genome mapping and quality control . F1000Research , 7 , 1338 . doi: 10.12688/f1000research.15931.2 OpenUrl CrossRef PubMed ↵ Wu , B. , Xu , W. , Wu , K. , Li , Y. , Hu , M. , Feng , C. , Zhu , C. , Zheng , J. , Cui , X. , Li , J. , Fan , D. , Zhang , F. , Liu , Y. , Chen , J. , Liu , C. , Li , G. , Qiu , Q. , Qu , K. , Wang , W. , & Wang , K . ( 2024 ). Single-cell analysis of the amphioxus hepatic caecum and vertebrate liver reveals genetic mechanisms of vertebrate liver evolution . Nature Ecology & Evolution , 8 ( 10 ), 1972 – 1990 . doi: 10.1038/s41559-024-02510-9 OpenUrl CrossRef PubMed ↵ Xiao , N. , Cao , D.-S. , Zhu , M.-F. , & Xu , Q.-S . ( 2015 ). protr/ProtrWeb: R package and web server for generating various numerical representation schemes of protein sequences . Bioinformatics , 31 ( 11 ), 1857 – 1859 . doi: 10.1093/bioinformatics/btv042 OpenUrl CrossRef PubMed ↵ Yahagi , N. , Kosaki , R. , Ito , T. , Mitsuhashi , T. , Shimada , H. , Tomita , M. , Takahashi , T. , & Kosaki , K . ( 2004 ). Position-specific expression of Hox genes along the gastrointestinal tract . Congenital Anomalies , 44 ( 1 ), 18 – 26 . 
doi: 10.1111/j.1741-4520.2003.00004.x OpenUrl CrossRef PubMed ↵ Yao , C. , Carraro , G. , Konda , B. , Guan , X. , Mizuno , T. , Chiba , N. , Kostelny , M. , Kurkciyan , A. , David , G. , McQualter , J. L. , & Stripp , B. R . ( 2017 ). Sin3a regulates epithelial progenitor cell fate during lung development . Development (Cambridge, England) , 144 ( 14 ), 2618 – 2628 . doi: 10.1242/dev.149708 OpenUrl Abstract / FREE Full Text ↵ Yong , L. W. , Kozmikova , I. , & Yu , J.-K. ( 2019 ). Using Amphioxus as a Basal Chordate Model to Study BMP Signaling Pathway . In M. B. Rogers (Ed.), Bone Morphogenetic Proteins: Methods and Protocols (pp. 91 – 114 ). Springer . doi: 10.1007/978-1-4939-8904-1_8 OpenUrl CrossRef ↵ Yonge , C. M . ( 1937 ). Evolution and Adaptation in the Digestive System of the Metazoa . Biological Reviews , 12 ( 1 ), 87 – 114 . doi: 10.1111/j.1469-185X.1937.tb01223.x OpenUrl CrossRef ↵ Yu , J. K. S. , & Holland , L. Z . ( 2009 ). Cephalochordates (amphioxus or lancelets): A model for understanding the evolution of chordate characters . Cold Spring Harbor Protocols , 2009 ( 9 ), pdb.emo130 . doi: 10.1101/pdb.emo130 OpenUrl Abstract / FREE Full Text ↵ Yu , J.-K. , Holland , N. D. , & Holland , L. Z . ( 2002 ). An amphioxus winged helix/forkhead gene, AmphiFoxD: Insights into vertebrate neural crest evolution . Developmental Dynamics , 225 ( 3 ), 289 – 297 . doi: 10.1002/dvdy.10173 OpenUrl CrossRef PubMed Web of Science ↵ Zhang , G. , Parry , L. A. , Vinther , J. , & Ma , X . ( 2022 ). Exceptional soft tissue preservation reveals a cnidarian affinity for a Cambrian phosphatic tubicolous enigma . Proceedings. Biological Sciences , 289 ( 1986 ), 20221623 . doi: 10.1098/rspb.2022.1623 OpenUrl CrossRef PubMed ↵ Zhang , W. , Jiang , A. , Yu , H. , & Dong , B . ( 2023 ). Comparative Transcriptomic Analysis Reveals the Functionally Segmented Intestine in Tunicate Ascidian . International Journal of Molecular Sciences , 24 ( 7 ), Article 7. 
doi: 10.3390/ijms24076270 OpenUrl CrossRef ↵ Zhao , Y. , Vinther , J. , Parry , L. A. , Wei , F. , Green , E. , Pisani , D. , Hou , X. , Edgecombe , G. D. , & Cong , P . ( 2019 ). Cambrian Sessile, Suspension Feeding Stem-Group Ctenophores and Evolution of the Comb Jelly Body Plan . Current Biology , 29 ( 7 ), 1112 – 1125 .e2. doi: 10.1016/j.cub.2019.02.036 OpenUrl CrossRef PubMed ↵ Zhong , Y. , Herrera-Úbeda , C. , Garcia-Fernàndez , J. , Li , G. , & Holland , P. W. H . ( 2020 ). Mutation of amphioxus Pdx and Cdx demonstrates conserved roles for ParaHox genes in gut, anus and tail patterning . BMC Biology , 18 ( 1 ), 68 . doi: 10.1186/s12915-020-00796-2 OpenUrl CrossRef PubMed ↵ Zhu , H. , Ludington , W. B. , & Spradling , A. C . ( 2024 ). Cellular and molecular organization of the Drosophila foregut . Proceedings of the National Academy of Sciences , 121 ( 11 ), e2318760121 . doi: 10.1073/pnas.2318760121 OpenUrl CrossRef PubMed ↵ Zwick , R. K. , Kasparek , P. , Palikuqi , B. , Viragova , S. , Weichselbaum , L. , McGinnis , C. S. , McKinley , K. L. , Rathnayake , A. , Vaka , D. , Nguyen , V. , Trentesaux , C. , Reyes , E. , Gupta , A. R. , Gartner , Z. J. , Locksley , R. M. , Gardner , J. M. , Itzkovitz , S. , Boffelli , D. , & Klein , O. D . ( 2024 ). Epithelial zonation along the mouse and human small intestine defines five discrete metabolic domains . Nature Cell Biology , 26 ( 2 ), 250 – 262 . doi: 10.1038/s41556-023-01337-z OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted July 03, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. 
You are going to email the following Deconstructing the common anteroposterior organisation of adult bilaterian guts Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Deconstructing the common anteroposterior organisation of adult bilaterian guts Stefano Davide Vianello , Ching-Yi Lin , Wahyu Cristine Pinem , Han-Ru Li , Kun-Lung Li , Grace Sonia , Shu-Hua Lee , Szu-Kai Wu , Vincent Laudet , Yi-Hsien Su , Jr-Kai Yu , Stephan Q. Schneider bioRxiv 2025.07.02.662275; doi: https://doi.org/10.1101/2025.07.02.662275 Share This Article: Copy Citation Tools Deconstructing the common anteroposterior organisation of adult bilaterian guts Stefano Davide Vianello , Ching-Yi Lin , Wahyu Cristine Pinem , Han-Ru Li , Kun-Lung Li , Grace Sonia , Shu-Hua Lee , Szu-Kai Wu , Vincent Laudet , Yi-Hsien Su , Jr-Kai Yu , Stephan Q. 
Schneider bioRxiv 2025.07.02.662275; doi: https://doi.org/10.1101/2025.07.02.662275 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Developmental Biology Subject Areas All Articles Animal Behavior and Cognition (7618) Biochemistry (17636) Bioengineering (13859) Bioinformatics (41847) Biophysics (21401) Cancer Biology (18535) Cell Biology (25423) Clinical Trials (138) Developmental Biology (13353) Ecology (19860) Epidemiology (2067) Evolutionary Biology (24287) Genetics (15582) Genomics (22463) Immunology (17701) Microbiology (40300) Molecular Biology (17141) Neuroscience (88432) Paleontology (666) Pathology (2825) Pharmacology and Toxicology (4813) Physiology (7633) Plant Biology (15107) Scientific Communication and Education (2042) Synthetic Biology (4285) Systems Biology (9808) Zoology (2267)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00