Φ-Space ST: a platform-agnostic method to identify cell states in spatial transcriptomics studies

doi:10.1101/2025.02.05.636735

Φ-Space ST: a platform-agnostic method to identify cell states in spatial transcriptomics studies

2025 · doi:10.1101/2025.02.05.636735

preprint OA: closed CC-BY-NC-ND-4.0

📄 Open PDF Full text JSON View at publisher

Full text 75,468 characters · extracted from preprint-html · click to expand

Φ-Space ST: a platform-agnostic method to identify cell states in spatial transcriptomics studies | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var 
i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Φ-Space ST: a platform-agnostic method to identify cell states in spatial transcriptomics studies View ORCID Profile Jiadong Mao , View ORCID Profile Jarny Choi , View ORCID Profile Kim-Anh Lê Cao doi: https://doi.org/10.1101/2025.02.05.636735 Jiadong Mao 1 Melbourne Integrative Genomics, School of Mathematics and Statistics, The University of Melbourne , Australia Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record 
for Jiadong Mao Jarny Choi 2 Bioinformatics and Cellular Genomics, St Vincent’s Institute , Australia Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Jarny Choi Kim-Anh Lê Cao 1 Melbourne Integrative Genomics, School of Mathematics and Statistics, The University of Melbourne , Australia Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Kim-Anh Lê Cao For correspondence: kimanh.lecao{at}unimelb.edu.au Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract We introduce Φ-Space ST, a platform-agnostic method to identify continuous cell states in spatial transcriptomics (ST) data using multiple scRNA-seq references. For ST with supercellular resolution, Φ-Space ST achieves interpretable cell type deconvolution with significantly faster computation. For subcellular resolution, Φ-Space ST annotates cell states without cell segmentation, leading to highly insightful spatial niche identification. Φ-Space ST harmonises annotations derived from multiple scRNA-seq references, and provides interpretable characterisations of disease cell states by leveraging healthy references. We validate Φ-Space ST in three case studies involving CosMx, Visium and Stereo-seq platforms for various cancer tissues. Our method revealed niche-specific enriched cell types and distinct cell type co-presence patterns that distinguish tumour from non-tumour tissue regions. These findings highlight the potential of Φ-Space ST as a robust and scalable tool for ST data analysis for understanding complex tissues and pathologies. 1 Introduction The rapid advancement of spatial transcriptomics (ST) technologies has transformed our ability to explore the spatial organisation of gene expression within tissues, offering unprecedented insights into cellular architecture and tissue microenvironments [ 1 ]. 
Technologies such as 10x Genomics Visium [ 2 ], NanoString CosMx [ 3 ] and BGI’s Stereo-seq [ 4 ] have allowed researchers to map gene expression at various spatial resolutions, ranging from subcellular to supercellular levels. These advances have unlocked opportunities to understand tissue organisation and cellular interactions in both healthy and disease states. However, achieving biologically meaningful annotations of continuous cell states remains a major hurdle, particularly across platforms with varying resolutions and technical specifications. A common strategy for cell type annotation in ST data involves comparing expression profiles of query ST data to those in well-annotated scRNA-seq references [ 5 , 6 ]. However, existing ST platforms lack exact single-cell resolution since they do not directly measure single cells [ 1 , 7 ]. For supercellular resolution ST such as Visium [ 2 ], each measurement unit is a multi-cellular spot and hence may contain a mixture of cell identities. For subcellular resolution ST such as CosMx [ 3 ] and Stereo-seq [ 4 ], the minimal measurement unit is often much smaller than the size of a single cell. These subcellular measurement units can be aggregated into suitable sizes via simple spatial binning or sophisticated cell segmentation algorithms [ 8 , 9 ]. However, the resulting bins or segmented cells may still contain fractions of transcripts from multiple neighbouring cells [ 9 , 10 ]. To deal with mixed cell identities commonly seen in both supercellular and subcellular ST data, cell type deconvolution methods have been developed [ 11 – 16 ]. These deconvolution methods can estimate cell type abundances within each spatial measurement unit such as supercellular spots, segmented cells and spatial bins based on reference scRNA-seq datasets. In the remainder of this article, we will refer to these spatial measurements as cell-like objects . 
Existing cell type deconvolution methods have a high potential but face several limitations, including over-reliance on single references and restrictive parametric assumptions about the data-generating process [ 11 , 13 , 15 , 16 ]. These limitations are especially problematic for complex and dynamic tissue environments, such as cancer, where cells frequently exhibit transitional or hybrid states that are not represented in reference datasets. In addition, existing methods are often computationally inefficient and difficult to extend for spatial omics data beyond transcriptomics, such as spatial proteomics and epigenomics [ 17 , 18 ]. To address these challenges, we present Φ-Space ST, a novel computational framework designed for platform-agnostic annotation of cell states in ST data. Φ-Space ST builds on Φ-Space, previously developed for single-cell multiomics analysis [ 19 ] ( Fig 1A ). Φ-Space ST leverages partial least squares (PLS) regression to annotate spatial cell-like objects with continuous cell type scores. Unlike existing deconvolution methods, Φ-Space ST enables annotation using multiple scRNA-seq references, allowing the identification of both known and novel cell states. Its nonparametric and flexible framework avoids restrictive assumptions, offering greater adaptability. Additionally, Φ-Space ST is significantly faster than state-of-the-art methods like RCTD [ 11 ] and cell2location [ 13 ]. These features make Φ-Space ST highly versatile for a wide range of ST platforms and biological contexts. Download figure Open in new tab Fig 1: Schema of Φ-Space ST. A: Framework of the transcriptomic module of our previous Φ-Space method [ 19 ]. A1: Φ-Space enables continuous phenotyping of cells based on either bulk or single-cell RNA-seq references. A2: We first compute a partial least squares (PLS) regression coefficient matrix B to predict all K cell types on a continuous scale using P gene expression levels. 
A2: We then apply B to query gene expression matrix to obtain continuous cell type scores Ŷ query for each of the query cells. B: Framework of Φ-Space ST, a new platform-agnostic and computationally efficient method designed to identify continuous cell states of spatial cell-like objects (supercellular spots, segmented cells or spatial bins) using spatial transcriptomics (ST) data. B1: We first train PLS regression models from one or multiple scRNA-seq references to continuously predict reference cell types. B2: We then apply the PLS models to the query ST data. Φ-Space ST accurately identifies not only the within-reference cell states, but also out-of-reference, e.g. transitional and malignant, cell states. C: Analyses based on Φ-Space ST continuous annotations of query cell-like objects, which we refer to as their phenotype space embeddings . C1: We identify spatial niches by clustering the phenotype space embeddings. C2: Cell type enrichment analysis, where we identify differentially enriched cell types in each spatial niche. C3: Cell type co-presence analysis, where we quantify the spatial co-presence of cell types and then use discriminant analysis to infer how specific co-presence patterns are associated with disease conditions. In this study, we illustrate the application of Φ-Space ST to three cancer studies involving diverse ST platforms including 10x Genomics Visium [ 2 ], NanoString CosMx [ 3 ] and BGI’s Stereo-seq [ 4 ]. We demonstrate the ability of Φ-Space ST in identifying spatial niches, enriched cell types and cell type co-presence patterns that distinguish tumour from non-tumour tissue regions. By offering robust, scalable and biologically interpretable annotations, Φ-Space ST sets the stage for more comprehensive analyses of spatially resolved transcriptomics data. 
2 Results 2.1 Φ-Space ST: a platform-agnostic method for identifying continuous cell states from ST data Overview Φ-Space ST is a platform-agnostic method for annotating different types of cell-like objects in ST data. We define a cell-like object as the collection of transcripts observed in the proximity of a certain tissue location. Depending on the technical specifications of ST platforms, cell-like objects can be multi-cellular spots (e.g. 10x Visium [ 2 ]), segmented cells [ 8 ] or bins of aggregated transcripts (e.g. Stereo-seq [ 4 ]). Multi-reference learning of cell states Φ-Space ST transfers the rich knowledge about cell states from multiple reference scRNA-seq datasets to the query ST data, based on the assumption that all cell states in the query data can be characterised as mixtures of cell types defined in the reference, including out-of-reference cell states that may be present in the query. For example, some lung cancer cells may be jointly characterised by healthy lung epithelial and mesenchymal cell types [ 20 ]. Partial least squares as methodological backbone The core of Φ-Space ST is partial least squares (PLS) regression [ 21 , 22 ]. The first step of the Φ-Space ST workflow is to select genes that are useful for predicting cell types defined in the reference datasets. In the second step ( Fig 1B1 ), a PLS regression model is trained from each reference scRNA-seq dataset to predict the reference cell type on a continuous scale. In the third step ( Fig 1B2 ), the PLS models are applied to the query ST dataset. Each query cell-like object is characterised by its similarities with individual cell types defined in all references. We refer to this continuous annotation of cell-like objects as their phenotype space embeddings . 
Quantifying cell type divergence in complex tissue microenvironment Conventional cell type deconvolution methods characterise the cell state of a cell-like object as a composition of cell types in the reference, which requires the predicted cell type scores of each cell-like object to sum up to 1 [ 11 , 13 – 16 ]. While this is a reasonable assumption in some scenarios, it may become stringent in disease samples such as the tumour microenvironment, where tumour and tumour-related cells typically exhibit divergent cell states [ 23 ]. The restriction of cell type scores to sum up to 1 can introduce compositional bias, which may hinder biologically meaningful comparison of cell states across tissue regions and samples (e.g. the difference between transcriptionally active and inactive tissue regions may be masked) [ 13 ]. Considering the complex cell state landscape of disease-altered tissue microenvironment, Φ-Space ST removes the assumption that the query cell state can be characterised as a composition of reference cell types. As a result, we can measure the cell state divergence of a query cell-like object, defined as the 75% quantile of all predicted cell type scores. Higher cell state divergence implies that a cell-like object exhibits similarity to more reference cell types, flagging stronger transcriptional activity or transitional cell states. Phenotype space embeddings for multi-sample biological discovery The phenotype space embeddings of the cell-like objects from different tissue samples are in the same scale and hence provide a basis for multi-sample biological discoveries from ST data. We use phenotype space embeddings of cell-like objects to identify spatial niches, niche-specific enriched cell types and cell type co-presence patterns that separate disease from healthy samples ( Fig 1C ; details in Methods Section 4 ). 
Summary of case studies We apply Φ-Space ST to three cancer studies to showcase the biological insight provided by Φ-Space ST for identifying spatial phenotypic patterns in tumour microenvironments based on data from a diverse range of ST platforms. The case studies are summarised in Table 1 along with the annotation challenges faced for each of these platforms. View this table: View inline View popup Download powerpoint Table 1: Summary of case studies and associated analytical challenges. Challenge 1: Annotating tumour-associated cell states using healthy cell states; Challenge 2: Leveraging multiple scRNA-seq references; Challenge 3: Providing interpretable cell type deconvolution in tumour microenvironment; Challenge 4: Identifying spatial niches based on lineage tracing information. N: number of cells; NSCLC: non-small cell lung cancer; CITE-seq: cellular indexing of transcriptomes and epitopes by sequencing; AML: acute myeloid leukaemia. We explain in detail the different characteristics of ST data analysed in these case studies: 10x Visium [ 2 ] is a sequencing-based platform, which provides whole-transcriptome sequencing in spatial spots with diameter 55 µm. Each spot may contain multiple cells and hence can be viewed as a mini-bulk. The Visium dataset we analysed consists of 18 lung sections selected from 9 individuals, including 1 healthy donor and 8 non-small cell lung cancer (NSCLC) patients (that is, two sections from each patient) [ 24 ]. NanoString CosMx [ 3 ] is an imaging-based platform, which is capable of detecting transcripts with subcellular precision. The CosMx dataset we analysed consists of 8 tumorous lung tissue sections from 5 NSCLC patients [ 25 ]. The expression levels of 980 genes were measured on each tissue sample. We used the morphology-based cell segmentation results provided by He et al. [ 25 ] and analysed transcriptional profiles of segmented cells. 
BGI Stereo-seq [ 4 ] is a sequencing-based platform, which provides whole-transcriptome sequencing at subcellular resolution. The Stereo-seq dataset we analysed consists of one mouse spleen section containing acute myeloid leukaemia (AML) cells [ 26 ]. Single-cell profiling and lineage tracing (SPLINTR) was used to barcode the AML cells, so that descendants from the same ancestor AML cell (i.e. an AML clone) shared the same barcode. Due to a technical issue known as ‘spot bleeding’ [ 10 ], no reliable cell segmentation could be conducted to infer cell boundaries. Hence, following Holze et al. [ 26 ], we binned the transcripts into ‘bin50’, i.e. spatial bins of sidelengths ∼25 µm, and analysed these spatial bins. 2.2 Φ-Space ST provides highly interpretable cell type deconvolution for understanding cell type co-presence For supercellular spatial platforms such as 10x Visium, single-cell resolution is technically unattainable (see Section 2.1 ). As a result, to infer spatial distribution of cell types, deconvolution algorithms must be used to estimate the abundance of different cell types within each multicellular spot. In this case study, we first demonstrate that Φ-Space ST provides more interpretable cell type deconvolution compared to some state-of-the-art deconvolution methods and is very fast to compute. We then use the Φ-Space ST deconvolution results to infer cell type co-presence patterns. This analysis leads to an interpretable separation of samples from different subtypes of non-small cell lung cancer (NSCLC), revealing potential connections between cell type co-presence and NSCLC prognosis. Φ-Space ST provides more interpretable cell type deconvolution In this benchmark we applied Φ-Space ST, RCTD [ 11 ], cell2location [ 13 ] and TACCO [ 16 ] to the Visium NSCLC dataset [ 24 ]. These four methods produced discrepant estimates of the spatial distribution of cell types. 
For example, for a tumorous lung section P11 T3 ( Fig 2A ), the B cell abundance in spatial spots inferred by these methods might lead to very different biological interpretations on how B cells infiltrated the tumour region ( Fig 2B ). Given the important role of B cells in tumour microenvironment [ 33 , 34 ], these diverging estimates may result in very different cancer prognosis and treatment. Download figure Open in new tab Fig 2: Benchmarking of cell type deconvolution methods using Visium lung cancer samples. A: A 10x Visium non-small cell lung cancer (NSCLC) tissue P11 T3 coloured according to expression levels of NSCLC marker KRT19 and B cell marker CD79A, where each dot represents a 55 µm multicellular spot. B: Predicted B cell abundance in P11 T3 according to Φ-Space ST and three state-of-the-art cell type deconvolution methods. These four methods resulted in very different estimates of B cell spatial distribution. To evaluate the quality of B cell abundance predictions, we calculated the number of meaningful markers for B cell prediction by each method: in each Venn diagram, the blue circle represents differentially expressed genes in the spatial region predicted to have high B cell abundance; the red circle represents B cell marker genes learned from the reference. C: Boxplot comparing mean number of meaningful markers per tissue for all 18 tissues. Average run time of each method is also shown. D: We computed cell type co-presence matrices for 18 lung tissues and computed their first two principal components (PCs) with proportions of variance explained by these PCs. The PC plot shows a clear separation between non-tumorous (healthy and background) and tumorous (LUAD and LUSC) samples. Furthermore, LUSC, which tends to have worse prognosis than LUAD, tended to be separated from LUAD. (LUAD, lung adenocarcinoma; LUSC, lung squamous cell carcinoma; background, non-tumorous tissues from cancerous lungs.) 
E: To investigate if the heterogeneity of tumorous samples observed in D reflected differential prognoses, we computed the favourable prognosis scores for both LUAD and LUSC samples. P24 T1 had the least favourable predicted prognosis among the LUAD samples, and was located closer to LUSC samples in D ; P11 T3 had the most favourable predicted prognosis among the LUSC samples, and was located closer to LUAD samples. In general, tumorous samples tended to form two clusters (circled in D ) according to prognoses. F: Since different disease conditions were mainly separated along PC1 in D , we plotted the top 20 cell type co-presence patterns contributing to PC1: 9/20 involved fibroblasts (marked by ⋆). Evaluating the accuracy of cell type deconvolution is challenging due to the lack of available ground truth. Thus we defined meaningful markers of a target cell type in a given tissue sample as genes in the intersection of two gene sets: the differentially expressed marker genes learned from the reference data, and the spatially differentially expressed genes in the query tissue area with high predicted abundance of the target cell type (see Supplementary Methods Section S2). The number of meaningful markers measures how cell type deconvolution matched prior knowledge about cell types via marker gene identification. When predicting B cell abundance in the tissue section P11 T3, Φ-Space ST had the highest number of meaningful markers ( Fig 2B ). Then, to evaluate the performance of the deconvolution methods on all cell types for tissue P11 T3, we calculated the mean number of meaningful markers averaged across all 61 cell types defined in the reference (Supplementary Fig S1A). Φ-Space ST had the highest mean number of meaningful markers. Finally, across all 18 tissue samples ( Fig 2C ), Φ-Space ST and RCTD had significantly higher mean number of meaningful markers compared to cell2location and TACCO. 
In addition, Φ-Space ST only took less than 1 minute to compute each tissue sample, much faster than RCTD, which took hours to compute each tissue sample. Φ-Space ST reveals lung cancer subtype-specific cell type co-presence With high throughput and multicellular spots, Visium samples have been viewed as particularly suitable for investigating cell type co-presence [ 35 , 36 ]. A key to biologically meaningful co-presence analysis is reliable cell type deconvolution, a task that Φ-Space ST excels at ( Fig 2A–C ). Therefore, we computed the cell type co-presence matrices based on cell type abundance inferred by Φ-Space ST for the Visium samples. We computed one cell type co-presence matrix for each of the 18 Visium samples, then extracted the principal components (PCs) of the co-presence matrices (details in Methods Section 4 ). We observed a clear separation between LUAD, LUSC and non-tumorous samples ( Fig 2D ). Moreover, the LUAD and LUSC samples appeared to be more heterogeneous compared to the non-tumorous samples, with LUAD samples and LUSC samples separately grouped together. Since LUSC tends to have worse prognosis than LUAD [ 37 ], we investigated whether the observed separation might be due to the differential prognoses of cancer patients. As we lacked additional patient-level information from the original publication [ 24 ], we opted for a computational approach to predict prognosis based on markers identified in the Visium samples [ 37 ] (see Supplementary Methods Section S2). Our analysis identified LUAD (LUSC) samples with the least (most) favourable prognosis ( Fig 2E ). This was confirmed by the location of sample P24 T1 (least favourable prognosis) close to the LUSC samples and P11 T3 (most favourable prognosis) close to the LUAD samples ( Fig 2D ). Therefore we were able to attribute the heterogeneity of tumorous samples observed on Fig 2D to their differential prognoses. 
Since the disease conditions were mainly separated along the first principal component (PC1) on Fig 2D , we investigated how co-presence of specific pairs of cell types contributed to this separation by examining the top 20 PC1 cell type co-presence loadings ( Fig 2F ). Notably, adventitial and alveolar fibroblasts were featured in 9 of the top 20 loadings, highlighting the diverse roles of fibroblasts in lung tumour microenvironment [ 38 , 39 ]. To focus solely on immune cell types, we excluded non-immune cell types in the co-presence matrices and reran the analysis. We observed that the separation between LUAD, LUSC and non-tumorous tissues was largely retained (Supplementary Fig S1B), with plasmacytoid dendritic cell (pDC) playing a prominent role in explaining this separation (Supplementary Fig S1C) [ 40 ]. In particular, the co-presence of pDC and different types of fibroblasts all had positive loadings, suggesting that the pDC–fibroblast co-presence might be related to lung cancer prognosis [ 41 ]. Deconvolution results from other methods can also be used to conduct the cell type co-presence analysis featured in Fig 2D–F . However results based on alternative methods were less interpretable compared to Φ-Space ST. For example, although the first two PCs of co-presence matrices based on RCTD also showed a good separation of disease conditions, the PCs there lacked a correspondence to cancer prognosis as in the Φ-Space ST results above (Supplementary Fig S2). Summary Through the Visium case study we showed that when single-cell resolution was technically unattainable, Φ-Space ST provided biologically interpretable cell type deconvolution results. Compared to state-of-the-art methods specifically designed for cell type deconvolution, Φ-Space ST deconvolution either led to increased interpretability or faster computation. 
A multi-sample cell type co-presence analysis enabled us to identify differential cell type co-presence patterns in different cancer subtypes, suggesting some potential association between cell type co-presence and cancer prognosis. 2.3 Φ-Space ST characterises heterogeneity of lung tumour microenvironment using healthy single-cell reference atlas Φ-Space ST can uncover complex cell states in tumour microenvironment by combining multiple scRNA-seq references, as we shall demonstrate below using the CosMx dataset from NSCLC patients (detailed in Section 2.1 ). Since cell segmentation was available for these tissue sections [ 25 ], we treated segmented cells as cell-like objects. We obtained biologically meaningful identification of altered cell states by leveraging multiple scRNA-seq references from healthy and fibrotic lungs, highlighting the ability of Φ-Space ST in identifying divergent cell states. Φ-Space ST uncovers complex and heterogeneous cell state landscapes of tumour microenvironment We first focused on a particular lung section Lung5 Rep1 from a lung adenocarcinoma (LUAD) patient to demonstrate how Φ-Space ST can provide insights into the cell state heterogeneity of the tumour microenvironment. Nine spatial domains were identified in this tissue section by He et al. [ 25 ] ( Fig 3A ). According to our Φ-Space ST annotation, the tumour interior, tumour-stroma boundary and lymphoid structure domains had higher cell type divergence (Supplementary Fig S3; see also Methods Section 4 ). The lymphoid structures were highly divergent, potentially due to the dense population of various immune cell types, such as T, B and dendritic cells [ 42 ] as identified by Φ-Space ST ( Fig 3B ). The tumour domains were highly divergent, consistent with lung tumours tending to exhibit molecular features of multiple cell types [ 37 ]. 
We found that a combination of mesenchymal, epithelial and immune cell types were enriched in the tumour domains, including tumour interior and tumour-stroma boundary ( Fig 3B ). In particular, the secretory and transitional AT2 cell types reflected the glandular cell origin of LUAD [ 43 ]; the observed basal and KRT5-/KRT17+ epithelial cell types in LUAD were consistent with a previous study [ 44 ]; and the presence of mesothelial and activated myofibroblast cell types flagged the potential existence of epithelial-to-mesenchymal transition [ 45 ] and cancer-associated fibroblasts [ 46 ]. Download figure Open in new tab Fig 3: Exploring cell state heterogeneity in CosMx lung samples. A: CosMx lung sample (Lung5 Rep1) from a patient with lung adenocarcinoma (LUAD), with spatial domains identified by He et al. [ 25 ]. Each dot represents the location of the nucleus of a cell. B: Top 5 most enriched cell types of some spatial domains in the sample Lung5 Rep1 identified by Φ-Space ST. (SecretSCGB1A1+/MUC5B+: secretory cell with upregulated SCGB1A1 and MUC5B; SecretSCGB3A2+: secretory cell with upregulated SCGB3A2; AlveolarMacroph: alveolar macrophage; MyoFB Act: activated myofibroblast; TransAT2: transitional type-2 alveolar cell; ProlifImm: proliferating immune cell; CD4: CD4 T cell; cDC1: type-1 conventional dendritic cell.) C: Φ-Space ST niches, identified by clustering phenotype space embeddings of segmented cells. D: Cell type divergence of Φ-Space ST niches. D1: Cell proportions according to spatial domains ( A ) for each Φ-Space ST niche. Niches 5 and 9 contained large proportions of cells from tumour domains (tumour interior and tumour-stroma boundary). D2: Cell type divergence of Φ-Space ST niches. The two tumour niches 5 and 9 differ greatly in their divergence. D3: Φ-Space ST scores of the most enriched cell types in niches 5 and 9. 
While these two niches had similar enriched cell types, the scores in niche 9 were generally higher than in niche 5, leading to the difference in cell type divergence. E: Top 5 most enriched cell types in tumour interior domains of different lung samples. (LUAD: lung adenocarcinoma; LUSC: lung squamous cell carcinoma.) F: Cell type co-presence analysis. F1: First two principal components (PCs) of all the domain-specific co-presence matrices. Tumour domains (tumour interior and tumour-stroma boundary) and non-tumour domains were separated, reflecting distinct cell type co-presence patterns. F2: Discriminant analysis (DWD) of all domain-specific co-presence matrices shows clear separation between tumour and non-tumour domains. F3: DWD loadings highlighting most discriminant co-presence patterns, where two cell types having positive (negative) loading indicates if their co-presence contributes to the prediction of tumour (non-tumour) domains. (gCap: general capillary cell; FB: fibroblast; Secret: secretory cell; moDC: monocyte-derived dendritic cell.) Φ-Space ST identifies heterogeneous tumour niches with differential cell type divergence To compare Φ-Space ST spatial niches with the spatial domains identified by He et al. [ 25 ] ( Fig 3A ), we identified 9 spatial niches of Lung5 Rep1 based on the Φ-Space ST annotation ( Fig 3C ; see Methods Section 4 ). Overall, our Φ-Space ST niches corresponded well to the domains in Fig 3A . A notable difference was that we identified two tumour niches, niches 5 and 9, which both contained a large proportion of cells from the tumour interior and tumour-stroma boundary domains ( Fig 3D1 ), but had significantly different cell state divergence ( Fig 3D2 ). In particular, these two niches were enriched by the same cell types but niche 9 showed a much higher divergence compared to niche 5 ( Fig 3D2 & D3 ). This highlighted intra-tumour heterogeneity that was not captured in He et al. [ 25 ]. 
Φ-Space ST identifies differentially enriched cell types in different cancerous lung samples As we have previously demonstrated [ 19 ], the phenotype space embeddings of query datasets derived using PLS regression models are robust against batch effects. This property of PLS also makes Φ-Space ST annotations from different query ST samples directly comparable. For example, the enriched cell types in the tumour interior domain were reproducible across biological replicates, i.e. tissue sections from the same lungs (see replicates from Lung5 and Lung9 in Fig 3E ). In contrast, the enriched cell types in the tumour interior domain from different patients exhibited significant heterogeneity (compare Lung5, Lung6, Lung9, Lung12 and Lung13 in Fig 3E ). Specifically, mesothelial cell type was enriched in all lung adenocarcinoma (LUAD) tumours (Lung5, 9, 12 and 13) but not in lung squamous cell carcinoma (LUSC) sample (Lung6). Two myofibroblast cell types were enriched in the LUSC sample (Lung6), consistent with a recent finding that LUSC tumours tended to have higher level of myofibroblasts compared to LUAD [ 47 ]. Φ-Space ST reveals cancer-specific cell type co-presence patterns To investigate how cell type co-presence patterns distinguish spatial niches across samples, we calculated the cell type co-presence matrices for spatial domains in all 8 CosMx NSCLC samples, visualised using PCA (detailed in Methods Section 4 ). We observed a separation of tumour domains from non-tumour domains ( Fig 3F1 ). Furthermore, a discriminant analysis using DWD ( Fig 1C ) led to an improved separation between tumour and non-tumour domains ( Fig 3F2 ). The DWD loadings highlighted pairs of cell types whose co-presence in the same segmented cell contribute to the prediction of tumour or non-tumour domains ( Fig 3F3 ). 
The tumour domains were characterised by complex interactions between endothelial (gCap, lymphatic, venule), epithelial (ciliated, secretory) and mesenchymal (myoFB, alveolar FB, mesothelial) cell types, indicating possible epithelial-mesenchymal, mesenchymal-epithelial and endothelial-mesenchymal transitions as typically seen in malignant tumours [ 20 , 48 ]. In addition, the role of monocyte-derived dendritic cells (moDC) was also highlighted. The co-presence of moDC, secretory, venule and myofibroblast cell types in tumour domains was consistent with a previous observation that myeloid DCs (including moDC) were commonly observed in NSCLC specimens [ 49 ]; however, the co-presence of moDC and mesothelial tended to be observed in non-tumour domains, which may reflect the shared role of mesothelial cells and moDCs in antigen presentation [ 50 ]. Summary Through the CosMx case study, we demonstrated that Φ-Space ST could robustly identify cancerous cell states based on four scRNA-seq multi-reference datasets from healthy and fibrotic lungs. We identified domain-specific enriched cell types that were biologically interpretable and comparable across different samples and tissue sections. Our cell type co-presence analysis identified patterns that separated tumorous from non-tumorous domains, highlighting how complex interactions between epithelial, endothelial, mesenchymal and immune cells have jointly shaped the lung tumour microenvironment. 2.4 Φ-Space ST achieves segmentation-free annotation of subcellular ST data Clonally resolved ST data links spatial information with clonal identity. This technological advance promises to uncover transcriptional mechanisms that contribute to intratumour heterogeneity of cancer clones [ 26 , 51 ]. However, ST data combined with lineage tracing remain rare and under-explored, with no established workflow. 
To address this challenge, we developed a Φ-Space ST-based workflow to provide unique spatial insights by incorporating information from cancer lineage tracing ( Fig 4A ). We investigated the heterogeneity of acute myeloid leukaemia (AML) clones based on a Stereo-seq mouse spleen dataset [ 26 ] (details in Section 2.1 ). Liquid tumours such as AML tumours have less clear spatial structures compared to solid tumours [ 52 ], which adds to the challenges in analysing this dataset. Download figure Open in new tab Fig 4: Uncovering cancer clone-specific cell states in Stereo-seq AML mouse spleen data. A: Overview of the workflow for analysing clonally-resolved ST data based on Φ-Space ST. Stereo-seq AML mouse spleen data with lineage tracing information were obtained from an AML mouse with barcoded cancer cells. (Created in https://BioRender.com .) Using gene expression and barcode information as input, Φ-Space ST identifies AML ‘meta-clones’ with differentially enriched cell types based on multiple reference datasets. B: Φ-Space ST identifies more nuanced spatial niches compared to conventional gene expression-based niche identification. B1: Spatial distribution of morphological gene markers Cd74 (white pulp), Marco (marginal zone) and Elane (neutrophil). Each dot represents a spatial bin of sidelengths ∼25 µm where at least one transcript was detected. B2: Density of all AML barcodes in the mouse spleen sample. B3: Eight clusters of spatial bins were identified based on either Φ-Space ST phenotype space embeddings or gene expressions of the bins. The Φ-Space ST clusters better delineated marginal zone and the high barcode density regions shown in B2 compared to the gene expression clusters. C: A DWD discriminant analysis revealed differences between bins that contained AML barcodes (‘barcoded’) and bins that did not contain any barcodes (‘non-barcoded’). Barcoded bins tended to have larger DWD scores. 
Top 10 DWD loadings (ranked by absolute value) show most important cell types for distinguishing barcoded and non-barcoded bins. (CITE, Spleen, BM, Neutro: four reference datasets; Treg: regulatory T cell; Neutro: neutrophil; HPC: hematopoietic progenitor cell; T1: tumour-associated neutrophil; Mat 2, 3: mature neutrophil; Imm B: immature B cell.) D: AML meta-clones and their enriched cell types. D1: Eight meta-clones were identified based on their barcode compositions. Bins with similar barcode (clonal) compositions were grouped into the same meta-clone. D2: Proportion of 5 most abundant barcodes in each meta-clone (with the exception of meta-clone 9 that is too rare). The meta-clones had a diverse composition of individual AML clones, where all meta-clones, except 5, had a dominating AML clone. D3: Enriched cell types within individual meta-clones. Compared to F , neighbouring meta-clones (i.e. 2&7, 6&10 and 3&8) tended to have similar enriched cell types, whereas non-neighbouring meta-clones tended to have dissimilar enriched cell types (Granulo: granulocyte, including neutrophil; IMM NK: immature natural killer; Trans B: transitional B cell; RBC: red blood cell; (Pro)ErythBla: (pro)erythroblast; Imm 1, 2: immature neutrophil; Pre-B (cycl): (cycling) pre-B cell). This Stereo-seq dataset lacks reliable cell segmentation, so we binned the whole tissue slide into bins of sidelengths ∼25 µm (as in Holze et al. [ 26 ]). Therefore cell-like objects in this case study were spatial bins. Since a comprehensive mouse spleen cell atlas is not available, we used Φ-Space ST to leverage multiple scRNA-seq reference datasets without the need for prior integration (details in Methods Section 4 ). Since we wished to make use of a scRNA-seq dataset generated from the same mouse spleen as the Stereo-seq sample [ 51 ], we used a ‘bridging’ strategy for continuous annotation transfer with Φ-Space ST. 
Our approach is very different from other deconvolution methods which cannot transfer continuous annotations. We first annotated the intermediate scRNA-seq spleen sample, then used the scRNA-seq spleen sample (with continuous Φ-Space ST annotations) to annotate the Stereo-seq sample. Φ-Space ST multi-reference annotation provides a comprehensive characterisation of AML spleen The mouse spleen has a distinctive morphology, where T and B lymphocytes in the white pulp coordinate adaptive immune responses. Surrounding the white pulp is the marginal zone, a region enriched with macrophages, dendritic cells and marginal zone B cells that capture antigens and facilitate their delivery to lymphocytes in the white pulp [ 53 ] ( Figure 4B1 ). Specific to this spleen sample was the prevalence of Elane expression (a neutrophil marker). As lineage tracing information was available we were able to locate the AML cells ( Fig 4B2 ). The four reference datasets we used contained immune cell types from different mouse tissue types, including mouse spleen, bone marrow (origin of the myeloid lineages of immune cells) and tumour (details in Section 2.1 ). These references jointly provide a comprehensive characterisation of the immune landscape in AML mouse spleen. We first clustered the spatial bins based on their multi-reference phenotype space embeddings, which resulted in more subtle spatial regions compared to the clusters based on gene expression ( Figs 4B3 ; see Supplementary Methods Section S2). Thus our Φ-Space ST approach successfully captured biologically meaningful spatial variations across morphological structures in the spleen. We further evaluated whether the Φ-Space ST cell type scores could reveal the differences between bins that contained AML barcodes and non-barcoded bins. 
Our DWD analysis (detailed in Methods Section 4 ) showed that barcoded bins tended to have stronger ICOS+ regulatory T cell (ICOS+ Treg), red blood cell (RBC), neutrophil (Neutro, T1), hematopoietic progenitor cell (HPC) and CD4 T cell identities, compared to non-barcoded bins ( Fig 4C ). The strong ICOS+ Treg identity of barcoded bins likely reflects the ability of AML cells to promote the expansion of Tregs by expressing ICOS ligand [ 54 ]. The neutrophil identity of the barcoded region may be explained by the high expression of the neutrophil marker Elane in that region ( Fig 4B1 ). Notably, the barcoded and non-barcoded bins were enriched by different types of neutrophils, with barcoded bins enriched by tumour-associated T1 neutrophils and non-barcoded bins enriched by mature neutrophils (MAT2, MAT3). AML clones form phenotypically distinct meta-clones In this clonally resolved Stereo-seq dataset, we observed that individual AML clones in mouse spleen tended to be concentrated in specific spatial domains, which motivated us to define ‘meta-clones’, i.e. spatial niches of bins with similar composition of AML clones (Supplementary Fig S4). We aggregated the spatial bins into meta-clones according to their clonal compositions and identified 8 meta-clones with significantly different compositions of individual AML clones ( Fig 4D1 & D2 ; details in Supplementary Methods Section S2). The AML meta-clones exhibited differential cell states, characterised by their most enriched cell types compared to non-barcoded bins ( Fig 4D3 ; details in Supplementary Methods Section S2). We observed that meta-clone 7 formed the ‘periphery’ of meta-clone 2. Both meta-clones had strong neutrophil identities. The neighbouring meta-clones 6 and 10 both had strong erythroid identities while the neighbouring meta-clones 3 and 8 both had strong lymphoid identities ( Figs 4D2 & D3 ). In addition, non-neighbouring meta-clones tended to have enriched cell types from different lineages. 
These observations provided unique insights into the spatial organisation of AML tumours and their heterogeneity in terms of cell states, which remain poorly understood. Summary We showed how Φ-Space ST can facilitate biological discoveries in Stereo-seq data in a case where cell segmentation was not attainable, and where a suitable reference atlas was lacking. This case study focusing on liquid tumours also highlighted the challenge of tumour niches that are difficult to define. We used four scRNA-seq references to derive the Φ-Space ST phenotype space embeddings of Stereo-seq bins, which retained the complex morphological information of a cancerous spleen, and highlighted the cell states of AML bins. Our novel ways of defining meta-clones and identifying meta-clone-specific enriched cell types provide a generic approach for investigating cancer clonal heterogeneity using clonally resolved ST data. 3 Discussion Φ-Space ST addresses key challenges in annotating cell states in complex tissues and disease environments. By leveraging the power of partial least squares (PLS) regression to annotate cell-like objects on a continuous scale using multiple references, Φ-Space ST provides a unified, platform-agnostic and computationally efficient framework for analysing ST data at multiple resolutions. The continuous cell state annotation enables the characterisation of both known and novel cell types, overcoming limitations of traditional methods that rely on a single reference and are computationally costly. Through three diverse case studies, we demonstrated the versatility and effectiveness of Φ-Space ST in unravelling the cellular and spatial complexity of tumour microenvironments. In the Visium case study, Φ-Space ST provided fast and interpretable deconvolution results, revealing cell type co-presence patterns associated with different cancer subtypes and prognostic outcomes. 
In the CosMx case study, Φ-Space ST’s continuous annotation strategy uncovered intra- and inter-tumour heterogeneity, highlighting distinct spatial niches and niche-specific enriched cell types. Finally, in the Stereo-seq case study, Φ-Space ST successfully characterised AML clone heterogeneity without requiring cell segmentation, showcasing its robustness in cases where traditional approaches fail. Φ-Space ST’s innovative continuous annotation approach goes beyond static classification to offer rich insights into transitional and hybrid cell states, particularly in disease contexts such as cancer. Φ-Space is a highly flexible and computationally efficient tool for large-scale and high-resolution spatial studies that provides a scalable solution to the increasing demands of modern spatial omics data. Future work will focus on extending Φ-Space ST to other pathological conditions and integrating additional omics assays, such as spatial proteomics and epigenomics, to further expand its applicability. Validating its performance in larger and even more diverse datasets will also enhance its generalisability and utility across a wider range of biological contexts. 4 Methods We denote the R reference datasets by ( X ref ,r , Y ref ,r ), r = 1 , …, R , where each X ref ,r is a gene by cell scRNA-seq gene expression matrix of normalised values ( Fig 1A ). The phenotype matrix Y ref ,r is a dummy matrix that represents the K r cell type labels of cells in X ref ,r . That is, each row of Y ref ,r represents a cell type and a cell is assigned the value 1 if it belongs to that cell type or −1 otherwise ( Fig 1A ). We denote the query ST dataset by ( X query , S query ), where X query is the query gene expression matrix with rows representing genes and columns representing spatial cell-like objects (segmented cells, multicellular spots or transcript bins), and where S query contains the coordinates of the cell-like objects ( x, y ). 
4.1 Φ-Space ST multi-reference continuous phenotyping The main steps for deriving the Φ-Space ST cell type scores based on multiple references are as follows: Gene selection . For each reference dataset ( X ref ,r , Y ref ,r ), we use the variable selection method based on partial least squares (PLS) regression, as described in Mao et al. [ 19 ], to select the most useful genes G r for predicting the cell type Y ref ,r . That is, each G r contains the genes with the largest absolute values of PLS regression coefficients for predicting Y ref ,r . PLS model training ( Fig 1B1 ). For the r th reference, we train a PLS regression model [ 21 , 22 ] using only genes shared by G r , the selected genes for reference r , and G , all genes sequenced in the query. We estimate a low-rank regression coefficient matrix B r of size (|G r | × K r ) to fit the regression model Y ref ,r = X̃ ref ,r B r , where K r denotes the number of cell types in the r th reference and X̃ ref ,r denotes the r th gene expression matrix using only selected genes. The rank of B r is equal to the number of PLS components, by default set to K r . Prediction ( Fig 1B2 ). We compute the continuous predicted cell type scores Ŷ query ,r as a rescaled version of X̃ query B r , where X̃ query denotes the query gene expression matrix using only selected genes; see Mao et al. [ 19 ] for details of the rescaling. The final predicted cell type scores Ŷ query is the concatenation of all Ŷ query ,r and has size $N \times \sum_{r=1}^{R} K_r$, where N is the number of cell-like objects in the query. That is, the number of columns of Ŷ query is equal to the sum of cell types defined in all R references. We call the predicted cell type score matrix Ŷ query the phenotype space embeddings of the query cell-like objects. 
Compared to hard cell type classification, which assigns a unique cell type label to each query cell-like object, the phenotype space embedding contains much richer information regarding the spatial distribution of cell states and can be used for various downstream analyses described below. 4.2 Multi-sample spatial biological discovery Φ-Space ST is a novel method that uses the phenotype space embeddings Ŷ query to facilitate multi-sample biological discoveries in ST data. Spatial niche identification ( Fig 1C1 ) Φ-Space ST provides a simple approach for spatial niche identification, a major analytical task in ST data analysis to partition the whole spatial domain into cell communities [ 9 , 55 ]. We conduct k-means clustering based on the PCs of the Φ-Space ST cell type scores, where the number of PCs is selected via scree plot. Using PCs rather than the original cell type scores allows us to denoise some cell type scores that may not be spatially variable enough to contribute towards niche identification. Niche-specific enriched cell types ( Fig 1C2 ) Once spatial niches have been identified, we further the analysis to identify niche-specific enriched cell types. We perform discriminant analysis using one of the following two methods: Distance-weighted discrimination (DWD) for two niches [ 56 ]. DWD is a powerful method for binary classification. We use DWD to identify a linear combination of Φ-Space cell type scores such that cell-like objects from the two niches can be best separated. We implemented DWD using the kerndwd package [ 57 , 58 ]. Partial least squares discriminant analysis (PLS-DA) for multiple niches [ 22 ]. PLS-DA is a flexible method for multi-class classification. We use PLS-DA to identify linear combinations of Φ-Space cell type scores such that cell-like objects from multiple niches can be best separated. We implemented PLS-DA using the PhiSpace package [ 19 ]. Note that PLS-DA can also handle the case involving two niches. 
However, we found that the DWD loadings seemed to provide clearer biological interpretation in our case studies. Hence we opted for DWD for the two-niche case. We then rank the cell types according to their contribution towards predicting a given spatial niche, based on either the DWD or PLS-DA loadings. We define spatially enriched cell types as those that contribute most positively to predicting a specific niche. Cell type co-presence ( Fig 1C3 ) To characterise the co-presence of different cell types at the same spatial location, we compute the co-presence matrix, defined as the correlation matrix of Φ-Space ST cell type scores. A positive correlation between two cell types indicates they tend to co-occur in the same cell-like object. Tissue samples from donors with different disease conditions may exhibit very different cell type co-presence patterns. To facilitate a multi-sample analysis of these patterns, we apply PCA to reduce the dimensionality of cell type co-presence matrices, enabling visualisation and comparison across samples. We can also perform discriminant analysis using DWD or PLS-DA to identify cell type pairs whose co-presence distinguishes between disease conditions. Declarations Code availability The Φ-Space R package is available on GitHub ( https://github.com/jiadongm/PhiSpace ), along with the R code for processing the data and reproducing our results. Data availability The Human Lung Cell Atlas data (‘core’) [ 27 ] can be downloaded from CZ CELLxGENE ( https://cellxgene.cziscience.com/collections/6f6d381a-7701-4781-935c-db10d30de293 ). The 10x Visium NSCLC dataset [ 24 ] is available at BioStudies ( https://www.ebi.ac.uk/biostudies/ ) with accession number E-MTAB-13530. The four scRNA-seq datasets from healthy and fibrotic lungs (immune, endothelial, epithelial and mesenchymal RDS objects) [ 28 ] are available at GEO with accession GSE227136. 
The CosMx NSCLC dataset (‘Processed Giotto Object’) [ 25 ] can be downloaded from https://nanostring.com/products/cosmx-spatial-molecular-imager/ffpe-dataset/nsclc-ffpe-dataset/ . The mouse spleen data from [ 29 ] is available at CNSA (CNGB Sequence Archive) of CNGBdb ( https://db.cngb.org/cnsa/ ) under the accession number CNP0003930. The mouse bone marrow data from [ 30 ] is available at the Mouse HSC Atlas website ( https://gillisweb.cshl.edu/HSC_atlas/ ). The mouse spleen CITE-seq data from [ 32 ] is available on GitHub ( https://github.com/YosefLab/totalVI_reproducibility ). The mouse neutrophil scRNA-seq data [ 31 ] is available at GEO under accession number GSE243466. The AML mouse spleen stereo-seq data [ 26 ] can be downloaded from Zenodo ( https://zenodo.org/records/10685805 ) and the scRNA-seq data from the same spleen (‘Mouse 2’) [ 51 ] is available at GEO under accession number GSE161676. Competing interests The authors declare they have no competing interests. Funding JM and KALC were supported in part by the National Health and Medical Research Council (NHMRC) Investigator Grant (GNT2025648). Acknowledgements. We would like to thank Prof Mark Dawson, Dr Dane Vassiliadis and Ms Henrietta Holze (Sir Peter MacCallum Cancer Centre) for providing the processed AML mouse spleen Stereo-seq data and their helpful suggestions for writing the Stereo-seq case study. We would also like to thank Mr Yidi Deng (University of Melbourne) for helpful discussions. Footnotes https://github.com/jiadongm/PhiSpace References [1]. ↵ Mengnan Cheng , Yujia Jiang , Jiangshan Xu , Alexios-Fotios A Mentis , Shuai Wang , Huiwen Zheng , Sunil Kumar Sahu , Longqi Liu , and Xun Xu . Spatially resolved transcriptomics: a comprehensive review of their technological advances, applications, and challenges . J. Genet. Genomics , 50 ( 9 ): 625 – 640 , 2023 . OpenUrl CrossRef PubMed [2]. ↵ Visium spatial gene expression: Map the whole transcriptome within the tissue context . 
URL https://www.10xgenomics.com/products/spatial-gene-expression . Accessed: 20 Sep 2024 . [3]. ↵ CosMx smi for single-cell imaging . URL https://nanostring.com/products/cosmx-spatial-molecular-imager/single-cell-imaging-overview/ . Accessed: 20 Sep 2024 . [4]. ↵ Spatial transcriptome Stereo-seq . URL https://www.bgi.com/global/service/spatial-transcriptome-stereo-seq . Accessed: 21 Sep 2024 . [5]. ↵ Emma Dann , Ana-Maria Cujba , Amanda J Oliver , Kerstin B Meyer , Sarah A Teichmann , and John C Marioni . Precise identification of cell states altered in disease using healthy single-cell references . Nat. Genet ., 55 ( 11 ): 1998 – 2008 , 2023 . OpenUrl CrossRef PubMed [6]. ↵ Mohammad Lotfollahi , Yuhan Hao , Fabian J Theis , and Rahul Satija . The future of rapid and automated single-cell data analysis using reference mapping . Cell , 187 ( 10 ): 2343 – 2358 , 2024 . OpenUrl CrossRef PubMed [7]. ↵ Luyi Tian , Fei Chen , and Evan Z Macosko . The expanding vistas of spatial transcriptomics . Nat. Biotechnol ., 41 ( 6 ): 773 – 782 , 2023 . OpenUrl CrossRef PubMed [8]. ↵ Viktor Petukhov , Rosalind J Xu , Ruslan A Soldatov , Paolo Cadinu , Konstantin Khodosevich , Jeffrey R Moffitt , and Peter V Kharchenko . Cell segmentation in imaging-based spatial transcriptomics . Nat. Biotechnol ., 40 ( 3 ): 345 – 354 , 2022 . OpenUrl CrossRef PubMed [9]. ↵ Ying Ma and Xiang Zhou . Accurate and efficient integrative reference-informed spatial domain detection for spatial transcriptomics . Nat. Methods , 21 ( 7 ): 1231 – 1244 , 2024 . OpenUrl CrossRef PubMed [10]. ↵ Haoran Zhang , Miranda V Hunter , Jacqueline Chou , Jeffrey F Quinn , Mingyuan Zhou , Richard M White , and Wesley Tansey . BayesTME: An end-to-end method for multiscale spatial transcriptional profiling of the tissue microenvironment . Cell Syst ., 14 ( 7 ): 605 – 619 .e7, 2023 . OpenUrl CrossRef PubMed [11]. 
↵ Dylan M Cable , Evan Murray , Luli S Zou , Aleksandrina Goeva , Evan Z Macosko , Fei Chen , and Rafael A Irizarry . Robust decomposition of cell type mixtures in spatial transcriptomics . Nat. Biotechnol ., 40 ( 4 ): 517 – 526 , 2022 . OpenUrl CrossRef PubMed [12]. Jiawen Chen , Weifang Liu , Tianyou Luo , Zhentao Yu , Minzhi Jiang , Jia Wen , Gaorav P Gupta , Paola Giusti , Hongtu Zhu , Yuchen Yang , and Yun Li . A comprehensive comparison on cell-type composition inference for spatial transcriptomics data . Brief. Bioinform ., 23 ( 4 ), 2022 . [13]. ↵ Vitalii Kleshchevnikov , Artem Shmatko , Emma Dann , Alexander Aivazidis , Hamish W King , Tong Li , Rasa Elmentaite , Artem Lomakin , Veronika Kedlian , Adam Gayoso , Mika Sarkin Jain , Jun Sung Park , Lauma Ramona , Elizabeth Tuck , Anna Arutyunyan , Roser Vento-Tormo , Moritz Gerstung , Louisa James , Oliver Stegle , and Omer Ali Bayraktar . Cell2location maps fine-grained cell types in spatial transcriptomics . Nat. Biotechnol ., 40 ( 5 ): 661 – 671 , 2022 . OpenUrl CrossRef PubMed [14]. Bin Li , Wen Zhang , Chuang Guo , Hao Xu , Longfei Li , Minghao Fang , Yinlei Hu , Xinye Zhang , Xinfeng Yao , Meifang Tang , Ke Liu , Xuetong Zhao , Jun Lin , Linzhao Cheng , Falai Chen , Tian Xue , and Kun Qu . Benchmarking spatial and single-cell transcriptomics integration methods for transcript distribution prediction and cell type deconvolution . Nat. Methods , 19 ( 6 ): 662 – 670 , 2022 . OpenUrl CrossRef PubMed [15]. ↵ Haoyang Li , Juexiao Zhou , Zhongxiao Li , Siyuan Chen , Xingyu Liao , Bin Zhang , Ruochi Zhang , Yu Wang , Shiwei Sun , and Xin Gao . A comprehensive benchmarking with practical guidelines for cellular deconvolution of spatial transcriptomics . Nat. Commun ., 14 ( 1 ): 1548 , 2023 . OpenUrl [16]. ↵ Simon Mages , Noa Moriel , Inbal Avraham-Davidi , Evan Murray , Jan Watter , Fei Chen , Orit Rozenblatt-Rosen , Johanna Klughammer , Aviv Regev , and Mor Nitzan . 
TACCO unifies annotation transfer and decomposition of cell identities for single-cell and spatial omics . Nat. Biotechnol ., 41 ( 10 ): 1465 – 1473 , 2023 . OpenUrl CrossRef PubMed [17]. ↵ Yanxiang Deng , Marek Bartosovic , Sai Ma , Di Zhang , Petra Kukanja , Yang Xiao , Graham Su , Yang Liu , Xiaoyu Qin , Gorazd B Rosoklija , Andrew J Dwork , J John Mann , Mina L Xu , Stephanie Halene , Joseph E Craft , Kam W Leong , Maura Boldrini , Gonçalo Castelo-Branco , and Rong Fan . Spatial profiling of chromatin accessibility in mouse and human tissues . Nature , 609 ( 7926 ): 375 – 383 , 2022 . OpenUrl CrossRef PubMed [18]. ↵ Yang Liu , Marcello DiStasio , Graham Su , Hiromitsu Asashima , Archibald Enninful , Xiaoyu Qin , Yanxiang Deng , Jungmin Nam , Fu Gao , Pino Bordignon , Marco Cassano , Mary Tomayko , Mina Xu , Stephanie Halene , Joseph E Craft , David Hafler , and Rong Fan . High-plex protein and whole transcriptome co-mapping at cellular resolution with spatial CITE-seq . Nat. Biotechnol ., 41 ( 10 ): 1405 – 1409 , 2023 . OpenUrl CrossRef PubMed [19]. ↵ Jiadong Mao , Yidi Deng , and Kim-Anh Lê Cao . ϕ-space: Continuous phenotyping of single-cell multi-omics data . bioRxiv , page 2024.06.19.599787, 2024 . [20]. ↵ Dakai Xiao and Jianxing He . Epithelial mesenchymal transition and lung cancer . J. Thorac. Dis ., 2 ( 3 ): 154 – 159 , 2010 . OpenUrl CrossRef PubMed [21]. ↵ H Wold . Estimation of principal components and related models by iterative least squares . Multivariate Analysis , pages 391 – 420 , 1966 . [22]. ↵ Kim-Anh Lê Cao and Zoe Marie Welham . Multivariate Data Integration Using R . Chapman and Hall/CRC , 1st edition, 2021 . [23]. ↵ Cong Liang , FANTOM Consortium , Alistair R R Forrest , and Günter P Wagner . The statistical geometry of transcriptome divergence in cell-type evolution and cancer . Nat. Commun ., 6 ( 1 ): 6066 , 2015 . OpenUrl CrossRef PubMed [24]. 
↵ Marco De Zuani , Haoliang Xue , Jun Sung Park , Stefan C Dentro , Zaira Seferbekova , Julien Tessier , Sandra Curras-Alonso , Angela Hadjipanayis , Emmanouil I Athanasiadis , Moritz Gerstung , Omer Bayraktar , and Ana Cvejic . Single-cell and spatial transcriptomics analysis of non-small cell lung cancer . Nat. Commun ., 15 ( 1 ): 4388 , 2024 . OpenUrl CrossRef PubMed [25]. ↵ Shanshan He , Ruchir Bhatt , Carl Brown , Emily A Brown , Derek L Buhr , Kan Chantranuvatana , Patrick Danaher , Dwayne Dunaway , Ryan G Garrison , Gary Geiss , Mark T Gregory , Margaret L Hoang , Rustem Khafizov , Emily E Killingbeck , Dae Kim , Tae Kyung Kim , Youngmi Kim , Andrew Klock , Mithra Korukonda , Alecksandr Kutchma , Zachary R Lewis , Yan Liang , Jeffrey S Nelson , Giang T Ong , Evan P Perillo , Joseph C Phan , Tien Phan-Everson , Erin Piazza , Tushar Rane , Zachary Reitz , Michael Rhodes , Alyssa Rosenbloom , David Ross , Hiromi Sato , Aster W Wardhani , Corey A Williams-Wietzikoski , Lidan Wu , and Joseph M Beechem . High-plex imaging of RNA and proteins at subcellular resolution in fixed tissue by spatial molecular imaging . Nat. Biotechnol ., 40 ( 12 ): 1794 – 1806 , 2022 . OpenUrl CrossRef PubMed [26]. ↵ Henrietta Holze , Laure Talarmain , Katie A Fennell , Enid Y Lam , Mark A Dawson , and Dane Vassiliadis . Analysis of synthetic cellular barcodes in the genome and transcriptome with BARtab and bartools . Cell Rep Methods , page 100763 , 2024 . [27]. 
↵ Lisa Sikkema , Ciro Ramírez-Suástegui , Daniel C Strobl , Tessa E Gillett , Luke Zappia , Elo Madissoon , Nikolay S Markov , Laure-Emmanuelle Zaragosi , Yuge Ji , Meshal Ansari , Marie-Jeanne Arguel , Leonie Apperloo , Martin Banchero , Christophe Bécavin , Marijn Berg , Evgeny Chichelnitskiy , Mei-I Chung , Antoine Collin , Aurore C A Gay , Janine Gote-Schniering , Baharak Hooshiar Kashani , Kemal Inecik , Manu Jain , Theodore S Kapellos , Tessa M Kole , Sylvie Leroy , Christoph H Mayr , Amanda J Oliver , Michael von Papen , Lance Peter , Chase J Taylor , Thomas Walzthoeni , Chuan Xu , Linh T Bui , Carlo De Donno , Leander Dony , Alen Faiz , Minzhe Guo , Austin J Gutierrez , Lukas Heumos , Ni Huang , Ignacio L Ibarra , Nathan D Jackson , Preetish Kadur Lakshminarasimha Murthy , Mohammad Lotfollahi , Tracy Tabib , Carlos Talavera-López , Kyle J Travaglini , Anna Wilbrey-Clark , Kaylee B Worlock , Masahiro Yoshida , Lung Biological Network Consortium , Maarten van den Berge , Yohan Bossé , Tushar J Desai , Oliver Eickelberg , Naftali Kaminski , Mark A Krasnow , Robert Lafyatis , Marko Z Nikolic , Joseph E Powell , Jayaraj Rajagopal , Mauricio Rojas , Orit Rozenblatt-Rosen , Max A Seibold , Dean Sheppard , Douglas P Shepherd , Don D Sin , Wim Timens , Alexander M Tsankov , Jeffrey Whitsett , Yan Xu , Nicholas E Banovich , Pascal Barbry , Thu Elizabeth Duong , Christine S Falk , Kerstin B Meyer , Jonathan A Kropski , Dana Pe’er , Herbert B Schiller , Purushothama Rao Tata , Joachim L Schultze , Sara A Teichmann , Alexander V Misharin , Martijn C Nawijn , Malte D Luecken , and Fabian J Theis . An integrated cell atlas of the lung in health and disease . Nat. Med ., 29 ( 6 ): 1563 – 1577 , 2023 . OpenUrl CrossRef PubMed [28]. 
↵ Heini M Natri , Christina B Del Azodi , Lance Peter , Chase J Taylor , Sagrika Chugh , Robert Kendle , Mei-I Chung , David K Flaherty , Brittany K Matlock , Carla L Calvi , Timothy S Blackwell , Lorraine B Ware , Matthew Bacchetta , Rajat Walia , Ciara M Shaver , Jonathan A Kropski , Davis J McCarthy , and Nicholas E Banovich . Cell-type-specific and disease-associated expression quantitative trait loci in the human lung . Nat. Genet ., 56 ( 4 ): 595 – 604 , 2024 . OpenUrl CrossRef PubMed [29]. ↵ Yin Zhang , Juan Shen , Wei Cheng , Bhaskar Roy , Ruizhen Zhao , Tailiang Chai , Yifei Sheng , Zhao Zhang , Xueting Chen , Weiming Liang , Weining Hu , Qijun Liao , Shanshan Pan , Wen Zhuang , Yangrui Zhang , Rouxi Chen , Junpu Mei , Hong Wei , and Xiaodong Fang . Microbiota-mediated shaping of mouse spleen structure and immune function characterized by scRNA-seq and stereo-seq . J. Genet. Genomics , 50 ( 9 ): 688 – 701 , 2023 . OpenUrl CrossRef PubMed [30]. ↵ Benjamin D Harris , John Lee , and Jesse Gillis . A meta-analytic single-cell atlas of mouse bone marrow hematopoietic development . bioRxiv , page 2021.08.12.456098, 2021 . [31]. ↵ Melissa S F Ng , Immanuel Kwok , Leonard Tan , Changming Shi , Daniela Cerezo-Wallis , Yingrou Tan , Keith Leong , Gabriel F Calvo , Katharine Yang , Yuning Zhang , Jingsi Jin , Ka Hang Liong , Dandan Wu , Rui He , Dehua Liu , Ye Chean Teh , Camille Bleriot , Nicoletta Caronni , Zhaoyuan Liu , Kaibo Duan , Vipin Narang , Iván Ballesteros , Federica Moalli , Mengwei Li , Jinmiao Chen , Yao Liu , Lianxin Liu , Jingjing Qi , Yingbin Liu , Lingxi Jiang , Baiyong Shen , Hui Cheng , Tao Cheng , Veronique Angeli , Ankur Sharma , Yuin-Han Loh , Hong Liang Tey , Shu Zhen Chong , Matteo Iannacone , Renato Ostuni , Andrés Hidalgo , Florent Ginhoux , and Lai Guan Ng . Deterministic reprogramming of neutrophils within tumors . Science , 383 ( 6679 ): eadf6493 , 2024 . OpenUrl CrossRef PubMed [32]. 
↵ Adam Gayoso , Zoë Steier , Romain Lopez , Jeffrey Regier , Kristopher L Nazor , Aaron Streets , and Nir Yosef . Joint probabilistic modeling of single-cell multi-omic data with totalVI . Nat. Methods , 18 ( 3 ): 272 – 282 , 2021 . OpenUrl CrossRef PubMed [33]. ↵ Tracy L Leong and Vanessa L Bryant . B cells in lung cancer-not just a bystander cell: a literature review . Transl. Lung Cancer Res ., 10 ( 6 ): 2830 – 2841 , 2021 . OpenUrl CrossRef PubMed [34]. ↵ Céline M Laumont and Brad H Nelson . B cells in the tumor microenvironment: Multi-faceted organizers, regulators, and effectors of anti-tumor immunity . Cancer Cell , 41 ( 3 ): 466 – 489 , 2023 . OpenUrl CrossRef PubMed [35]. ↵ Qi Liu , Chih-Yuan Hsu , and Yu Shyr . Scalable and model-free detection of spatial patterns and colocalization . Genome Res ., 32 ( 9 ): 1736 – 1745 , 2022 . OpenUrl Abstract / FREE Full Text [36]. ↵ Yasuhiro Kojima , Shinji Mii , Shuto Hayashi , Haruka Hirose , Masato Ishikawa , Masashi Akiyama , Atsushi Enomoto , and Teppei Shimamura . Single-cell colocalization analysis using a deep generative model . Cell Syst ., 15 ( 2 ): 180 – 192 .e7, 2024 . OpenUrl CrossRef PubMed [37]. ↵ Joe W Chen and Joseph Dhahbi . Lung adenocarcinoma and lung squamous cell carcinoma cancer classification, biomarker identification, and gene expression analysis using overlapping feature selection methods . Sci. Rep. , 11 ( 1 ): 13323 , 2021 . OpenUrl CrossRef PubMed [38]. ↵ Kit Yee Wong , Alvin Ho-Kwan Cheung , Bonan Chen , Wai Nok Chan , Jun Yu , Kwok Wai Lo , Wei Kang , and Ka Fai To . Cancer-associated fibroblasts in nonsmall cell lung cancer: From molecular mechanisms to clinical implications . Int. J. Cancer , 151 ( 8 ): 1195 – 1215 , 2022 . OpenUrl CrossRef PubMed [39]. ↵ Lena Cords , Stefanie Engler , Martina Haberecker , Jan Hendrik Rüschoff , Holger Moch , Natalie de Souza , and Bernd Bodenmiller . 
Cancer-associated fibroblast phenotypes are associated with patient outcome in non-small cell lung cancer . Cancer Cell , 42 ( 3 ): 396 – 412 .e5, 2024 . OpenUrl CrossRef PubMed [40]. ↵ Binhui Zhou , Toby Lawrence , and Yinming Liang . The role of plasmacytoid dendritic cells in cancers . Front. Immunol ., 12 : 749190 , 2021 . OpenUrl CrossRef PubMed [41]. ↵ Aldo Pinto , Alessia Rega , Timothy R Crother , and Rosalinda Sorrentino . Plasmacytoid dendritic cells and their therapeutic activity in cancer . Oncoimmunology , 1 ( 5 ): 726 – 734 , 2012 . OpenUrl CrossRef PubMed [42]. ↵ Yiming Weng , Jingping Yuan , Xue Cui , Jinsong Wang , Honglei Chen , Li Xu , Xinyi Chen , Min Peng , and Qibin Song . The impact of tertiary lymphoid structures on tumor prognosis and the immune microenvironment in non-small cell lung cancer . Sci. Rep ., 14 ( 1 ): 16246 , 2024 . OpenUrl CrossRef PubMed [43]. ↵ J Sainz de Aja , A F M Dost , and C F Kim . Alveolar progenitor cells and the origin of lung cancer . J. Intern. Med ., 289 ( 5 ): 629 – 635 , 2021 . OpenUrl CrossRef PubMed [44]. ↵ Tomoya Fukui , Renat Shaykhiev , Francisco Agosto-Perez , Jason G Mezey , Robert J Downey , William D Travis , and Ronald G Crystal . Lung adenocarcinoma subtypes based on expression of human airway basal cell genes . Eur. Respir. J ., 42 ( 5 ): 1332 – 1344 , 2013 . OpenUrl Abstract / FREE Full Text [45]. ↵ Feng Li , Qing-Zhen Song , Yi-Fan Zhang , Xing-Ru Wang , Li-Min Cao , Nan Li , Ling-Xia Zhao , Sheng-Xiao Zhang , and Xiao-Fei Zhuang . Identifying the EMT-related signature to stratify prognosis and evaluate the tumor microenvironment in lung adenocarcinoma . Front. Genet ., 13 : 1008416 , 2022 . OpenUrl CrossRef PubMed [46]. ↵ Yuxuan Xiao , Ziyu Wang , Meng Gu , Panjian Wei , Xiaojue Wang , and Weiying Li . Cancer-associated fibroblasts: heterogeneity and their role in the tumor immune response . Clin. Exp. Med ., 24 ( 1 ): 126 , 2024 . OpenUrl CrossRef PubMed [47]. 
↵ Christopher J Hanley , Sara Waise , Matthew J Ellis , Maria A Lopez , Wai Y Pun , Julian Taylor , Rachel Parker , Lucy M Kimbley , Serena J Chee , Emily C Shaw , Jonathan West , Aiman Alzetani , Edwin Woo , Christian H Ottensmeier , Matthew J J Rose-Zerilli , and Gareth J Thomas . Single-cell analysis reveals prognostic fibroblast subpopulations linked to molecular and immunological subtypes of lung cancer . Nat. Commun ., 14 ( 1 ): 387 , 2023 . OpenUrl CrossRef PubMed [48]. ↵ Simona Gurzu , Sabin Turdean , Attila Kovecsi , Anca Otilia Contac , and Ioan Jung . Epithelial-mesenchymal, mesenchymal-epithelial, and endothelial-mesenchymal transitions in malignant tumors: An update . World J. Clin. Cases , 3 ( 5 ): 393 – 404 , 2015 . OpenUrl CrossRef PubMed [49]. ↵ A Bergeron , F El-Hage , M Kambouchner , D Lecossier , and A Tazi . Characterisation of dendritic cell subsets in lung cancer micro-environments . Eur. Respir. J ., 28 ( 6 ): 1170 – 1177 , 2006 . OpenUrl Abstract / FREE Full Text [50]. ↵ Hitesh Batra and Veena B Antony . Pleural mesothelial cells in pleural and lung diseases . J. Thorac. Dis ., 7 ( 6 ): 964 – 980 , 2015 . OpenUrl CrossRef PubMed [51]. ↵ Katie A Fennell , Dane Vassiliadis , Enid Y N Lam , Luciano G Martelotto , Jesse J Balic , Sebastian Hollizeck , Tom S Weber , Timothy Semple , Qing Wang , Denise C Miles , Laura MacPherson , Yih-Chih Chan , Andrew A Guirguis , Lev M Kats , Emily S Wong , Sarah-Jane Dawson , Shalin H Naik , and Mark A Dawson . Non-genetic determinants of malignant clonal fitness at single-cell resolution . Nature , 601 ( 7891 ): 125 – 131 , 2022 . OpenUrl CrossRef PubMed [52]. ↵ David J Reiss , Yumi Nakayama , Andrew P Weng , Matthew E Stokes , Laurie Sehn , Christian Steidl , David W Scott , C Chris Huang , and Anita K Gandhi . High-plex imaging and cellular neighborhood spatial analysis reveals multiple immune escape and suppression patterns in diffuse large B-cell lymphoma . Leukemia , 38 ( 5 ): 1164 – 1168 , 2024 . 
OpenUrl CrossRef PubMed [53]. ↵ Joke M den Haan , Reina E Mebius , and Georg Kraal . Stromal cells of the mouse spleen . Front. Immunol ., 3 : 201 , 2012 . OpenUrl PubMed [54]. ↵ Yixiang Han , Yuqing Dong , Qianqian Yang , Wanling Xu , Songfu Jiang , Zhijie Yu , Kang Yu , and Shenghui Zhang . Acute myeloid leukemia cells express ICOS ligand to promote the expansion of regulatory T cells . Front. Immunol ., 9 : 2227 , 2018 . OpenUrl CrossRef PubMed [55]. ↵ Sebastian Birk , Irene Bonafonte-Pardàs , Adib Miraki Feriz , Adam Boxall , Eneritz Agirre , Fani Memi , Anna Maguza , Rong Fan , Gonçalo Castelo-Branco , Fabian J Theis , Omer Ali Bayraktar , Carlos Talavera-López , and Mohammad Lotfollahi . Quantitative characterization of cell niches in spatial atlases . bioRxiv , page 2024.02.21.581428, 2024 . [56]. ↵ J S Marron , Michael J Todd , and Jeongyoun Ahn . Distance-weighted discrimination . J. Am. Stat. Assoc. , 102 ( 480 ): 1267 – 1271 , 2007 . OpenUrl CrossRef Web of Science [57]. ↵ Boxiang Wang and Hui Zou . Another look at distance-weighted discrimination . J. R. Stat. Soc. Series B Stat. Methodol ., 80 ( 1 ): 177 – 198 , 2018 . OpenUrl CrossRef [58]. ↵ Boxiang Wang and Hui Zou . kerndwd: Distance Weighted Discrimination (DWD) and Kernel Methods , 2020 . URL https://CRAN.R-project.org/package=kerndwd . R package version 2.0.3. View the discussion thread. Back to top Previous Next Posted February 08, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. 
You are going to email the following Φ-Space ST: a platform-agnostic method to identify cell states in spatial transcriptomics studies Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Φ-Space ST: a platform-agnostic method to identify cell states in spatial transcriptomics studies Jiadong Mao , Jarny Choi , Kim-Anh Lê Cao bioRxiv 2025.02.05.636735; doi: https://doi.org/10.1101/2025.02.05.636735 Share This Article: Copy Citation Tools Φ-Space ST: a platform-agnostic method to identify cell states in spatial transcriptomics studies Jiadong Mao , Jarny Choi , Kim-Anh Lê Cao bioRxiv 2025.02.05.636735; doi: https://doi.org/10.1101/2025.02.05.636735 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Bioinformatics Subject Areas All Articles Animal Behavior and Cognition (7625) Biochemistry (17652) Bioengineering (13874) Bioinformatics (41890) Biophysics (21429) Cancer Biology (18567) Cell Biology (25467) Clinical Trials (138) Developmental Biology (13365) Ecology (19874) Epidemiology (2067) Evolutionary Biology (24294) Genetics (15591) Genomics (22478) Immunology (17717) Microbiology (40331) Molecular Biology (17153) Neuroscience (88496) Paleontology (666) Pathology (2828) Pharmacology and Toxicology (4817) Physiology (7635) Plant Biology (15114) Scientific Communication and Education (2044) Synthetic Biology (4286) Systems Biology (9817) Zoology (2268)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall: last seen: 2026-05-23T02:00:01.238055+00:00

License: CC-BY-NC-ND-4.0