Full text
92,785 characters
· extracted from
preprint-html
· click to expand
Image-based profiling of healthy donor immune cells with Blood Cell Painting reveals novel genotype-phenotype associations | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Image-based profiling of healthy donor immune cells with Blood Cell Painting reveals novel genotype-phenotype associations View ORCID Profile Caroline Högel-Starck , View ORCID Profile Veera A. Timonen , View ORCID Profile Gantugs Atarsaikhan , View ORCID Profile Isabel Mogollon , View ORCID Profile Minttu Polso , View ORCID Profile Antti Hassinen , View ORCID Profile Jarno Honkanen , View ORCID Profile Cindy David Sarmento , View ORCID Profile Jessica Koski , Julius Soini , View ORCID Profile Lea Urpa , View ORCID Profile Tanja Ruokoranta , Toveann Ahlnäs , Julianna Juvila , View ORCID Profile Juho J. Miettinen , View ORCID Profile Rodosthenis S. Rodosthenous , FinnGen , View ORCID Profile Outi Kilpivaara , View ORCID Profile Mikko Arvas , View ORCID Profile Caroline A. Heckman , View ORCID Profile Jukka Partanen , View ORCID Profile Mark Daly , View ORCID Profile Aarno Palotie , View ORCID Profile Hanna M. Ollila , View ORCID Profile Lassi Paavolainen , View ORCID Profile Vilja Pietiäinen , View ORCID Profile Esa Pitkänen doi: https://doi.org/10.1101/2024.05.17.594648 Caroline Högel-Starck 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland 2 iCAN Digital Precision Cancer Medicine Flagship , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Caroline Högel-Starck Veera A. Timonen 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland 3 Applied Tumor Genomics Research Program, Faculty of Medicine, University of Helsinki , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Veera A. Timonen Gantugs Atarsaikhan 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland 2 iCAN Digital Precision Cancer Medicine Flagship , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Gantugs Atarsaikhan Isabel Mogollon 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Isabel Mogollon Minttu Polso 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland 2 iCAN Digital Precision Cancer Medicine Flagship , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Minttu Polso Antti Hassinen 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Antti Hassinen Jarno Honkanen 4 Finnish Red Cross Blood Service Biobank , Vantaa, Finland 6 Translational Immunology Program, Research Programs Unit, University of Helsinki , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Jarno Honkanen Cindy David Sarmento 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Cindy David Sarmento Jessica Koski 2 iCAN Digital Precision Cancer Medicine Flagship , Helsinki, Finland 3 Applied Tumor Genomics Research Program, Faculty of Medicine, University of Helsinki , Helsinki, Finland 9 D epartment of Medical and Clinical Genetics, Medicum, Faculty of Medicine, University of Helsinki , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Jessica Koski Julius Soini 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site Lea Urpa 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Lea Urpa Tanja Ruokoranta 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland 5 Helsinki University Hospital Comprehensive Cancer Center , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Tanja Ruokoranta Toveann Ahlnäs 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site Julianna Juvila 4 Finnish Red Cross Blood Service Biobank , Vantaa, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site Juho J. Miettinen 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Juho J. Miettinen Rodosthenis S. Rodosthenous 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Rodosthenis S. Rodosthenous Outi Kilpivaara 2 iCAN Digital Precision Cancer Medicine Flagship , Helsinki, Finland 3 Applied Tumor Genomics Research Program, Faculty of Medicine, University of Helsinki , Helsinki, Finland 9 D epartment of Medical and Clinical Genetics, Medicum, Faculty of Medicine, University of Helsinki , Helsinki, Finland 10 HUSLAB Laboratory of Genetics, HUS Diagnostic Center, Helsinki University Hospital , Helsinki, Finland 11 K. Albin Johansson Cancer Research Fellow, Foundation for the Finnish Cancer Institute , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Outi Kilpivaara Mikko Arvas 8 Finnish Red Cross Blood Service, Research and Development , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Mikko Arvas Caroline A. Heckman 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland 2 iCAN Digital Precision Cancer Medicine Flagship , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Caroline A. Heckman Jukka Partanen 8 Finnish Red Cross Blood Service, Research and Development , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Jukka Partanen Mark Daly 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland 7 Broad Institute of MIT and Harvard , Cambridge, MA, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Mark Daly Aarno Palotie 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland 7 Broad Institute of MIT and Harvard , Cambridge, MA, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Aarno Palotie Hanna M. Ollila 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland 12 Department o f Anesthesia, Critical Care and Pain Medicine, Massachusetts General Hospital and Harvard Medical School , Boston, MA, USA 7 Broad Institute of MIT and Harvard , Cambridge, MA, USA 13 Center for Genomic Medicine, Massachusetts General Hospital and Harvard Medical School , Boston, MA, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Hanna M. Ollila Lassi Paavolainen 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland 2 iCAN Digital Precision Cancer Medicine Flagship , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Lassi Paavolainen For correspondence: lassi.paavolainen{at}helsinki.fi vilja.pietiainen{at}helsinki.fi esa.pitkanen{at}helsinki.fi Vilja Pietiäinen 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland 2 iCAN Digital Precision Cancer Medicine Flagship , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Vilja Pietiäinen For correspondence: lassi.paavolainen{at}helsinki.fi vilja.pietiainen{at}helsinki.fi esa.pitkanen{at}helsinki.fi Esa Pitkänen 1 Institute for Molecular Medicine Finland (FIMM), Helsinki Institute of Life Science (HiLIFE), University of Helsinki , Helsinki, Finland 2 iCAN Digital Precision Cancer Medicine Flagship , Helsinki, Finland 3 Applied Tumor Genomics Research Program, Faculty of Medicine, University of Helsinki , Helsinki, Finland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Esa Pitkänen For correspondence: lassi.paavolainen{at}helsinki.fi vilja.pietiainen{at}helsinki.fi esa.pitkanen{at}helsinki.fi Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract The morphological diversity of blood immune cells of healthy individuals, critical for recognizing disease-related phenotypes, remains largely uncharacterized. To address this gap, we developed Blood Cell Painting (BCP): a high content, high throughput fluorescence imaging assay for peripheral blood mononuclear cells. We generated a BCP Atlas with images of 50 million cells from 390 healthy blood donors, identifying 18 distinct immune cell morphology clusters. A genome-wide association study of BCP-derived imaging-based cellular features revealed 93 significant associations across 30 genetic loci. These loci include genes linked to mast cell function, inflammation, immune signaling, mitochondrial maintenance and circadian immune modulation. We also observed correlations between immune cell morphological features and clinical traits, such as respiratory conditions and healthcare visits related to contraceptive management, potentially reflecting hormonal influences on immune cell phenotypes. As a proof of concept for clinical application, acute myeloid leukemia subtypes were distinguished by BCP. Our study establishes BCP as a versatile method for immune cell profiling to uncover genetic, phenotypic and clinical determinants of immune cell morphology in health and disease. Background Despite the success of population-scale genome-wide (GWAS) and phenome-wide association studies (PheWAS) ( 1 ), the biological mechanisms linking germline variants to phenotypes remain poorly understood. A crucial intermediate between genotypes and disease phenotypes lies at the level of cellular phenotypes, which can be interrogated at the single-cell level, for example, with single-cell RNA-sequencing (scRNA-seq) and high content imaging (HCI). Single-cell profiling has revealed an unprecedented cellular heterogeneity in healthy and diseased tissues, with implications for the diagnosis and treatment of diseases through an improved understanding of immunity ( 2 ). Sequencing-based approaches allow the identification of cell types and subtypes, and mapping of their evolutionary trajectories ( 3 ), but these methods are costly and do not capture rich cellular morphology or spatial architecture. By contrast, HCI allows millions of cells to be routinely profiled and quantified in a single experiment, providing cellular context and morphological details at a lower cost ( 4 – 6 ). Consequently, HCI has been used to reveal how immune cell phenotypes reflect molecular and personal health information and how leukemic cancer cells respond, at single-cell level, to different drugs in clinical trials ( 7 , 8 ). Cell Painting is a widely adopted HCI assay for morphological and functional profiling of single cells and cell organelles via fluorescence microscopy ( 4 , 5 ). Cellular phenotypes derived with Cell Painting have been associated with somatic variants in cancer, transcriptomics, as well as genetic and chemical perturbations ( 9 – 11 ). For example, recent large-scale studies have combined Cell Painting with transcriptomics for >28,000 perturbations ( 12 ) and performed >20,000 CRISPR perturbation experiments in >30 million cells, resulting in an atlas of biological pathways and interactions ( 13 ). To date, Cell Painting has primarily been applied to study the adherent cancer cell lines and human fibroblasts ( 4 , 14 ), with less focus on human immune cells playing a central role in health and disease. In this study, we developed the Blood Cell Painting (BCP) workflow ( Fig. 1 ) for high content fluorescence microscopy imaging of peripheral blood mononuclear cells (PBMCs), modified from the original Cell Painting assay ( 4 , 5 ). Using BCP, we profiled PBMC samples from 390 healthy blood donors, yielding 50 million imaged cells. We optimized and benchmarked a popular batch effect correction method Harmony for large-scale BCP data. Finally, we associated BCP profiles to genotypes and health registry phenotypes, revealing novel links to immune cell morphology and function. Download figure Open in new tab Figure 1. Blood Cell Painting — study design and the BCP assay. A) Overview of the workflow and study results. Created with Biorender.com. B) Example images of PBMCs stained using the BCP assay. C) Example of merged image of four channels containing stains Hoechst 33342, MitoTracker Deep Red, Wheat-germ agglutinin/Alexa Fluor 555 (WGA), Phalloidin/Alexa Fluor 568, Concanavalin A/Alexa Fluor 488 and SYTO14 green fluorescent nucleic acid. D) Visualization of nucleus and cell segmentation. Scale bars: white 20 μm and blue 10 μm. Results Morphological profiling and cell typing of 50 million PBMCs from 390 healthy blood donors with Blood Cell Painting We developed a modified Cell Painting protocol for PBMCs, termed Blood Cell Painting (BCP; Fig. 1 A ; Methods ). Using the BCP protocol, we profiled PBMCs in 400 samples from 390 healthy blood donors. For each sample, we aimed to image at least 100,000 cells distributed across five wells on the same plate. Altogether, 41 plates were imaged, yielding a total of 50 million cells in 4.74 million images after excluding control samples. We acquired confocal images with four fluorescent channels and widefield images with five fluorescent channels using six fluorescent dyes ( Fig. 1 A ; Methods ) to label different components of the cell. In addition, brightfield images were collected in both imaging modalities ( Fig. 1 B-D ). A total of 186 features were extracted from images for downstream analyses. To identify major PBMC cell types in our BCP dataset, we clustered single-cell morphologies from 20 donors and performed supervised cell type annotation where two experts labeled a subset of the cells to train a neural network classifier ( Methods ). Cells were assigned into four classes: 1) monocytes, 2) macrophages, 3) B and T cells, and 4) uncategorised ( Fig. 2 A ). We then evaluated our annotated training set with ten-fold cross-validation ( Methods ). This procedure resulted in cells classified as B and T cells (38% of all cells), monocytes (16%), macrophages (14%) and uncategorised cells or debris (32%) ( Fig. 2 B, C ; Suppl. Fig. 3 B ; Suppl. Fig. 2 ). Download figure Open in new tab Figure 2. Cell classes based on morphology by expert annotations. A) Examples of cell classes annotated for the training set. Cells were manually annotated into four classes: monocytes (i), macrophages (ii), B & T cells (iii), and uncategorised (iv). B) Single-cell predictions from a representative field-of-view. Classification of cells into four classes is highlighted with the predicted class color: monocytes (red), macrophages (blue), B & T cells (green), uncategorised (magenta). C) Cross-validation confusion matrix obtained for the cell type classifier trained in BIAS software after 10-fold cross-validation. Correct predictions are shown in the diagonal and in green color. Scale bars: 50 µm. To obtain independent estimates of cell type frequencies, we performed flow cytometry-based immunophenotyping on the same 20 samples ( Methods ; Suppl. Table 5 ). In contrast to the BCP-based typing, flow cytometry indicated B and T cells to be two-fold as frequent (87%; 76% CD3+, 11% CD19+), and five-fold fewer monocytes (3%) ( Suppl. Fig. 3 B, D ; Suppl. Fig. 4 ). Among T cells (CD3+), 23% were CD8+ cytotoxic T cells. NK and dendritic cells were rare (1% and 0.004%, respectively). Despite these differences, both BCP and flow cytometry data showed clear clustering in UMAP embeddings ( Suppl. Fig. 3 A, C ). Notably, many of the cell types that remained uncategorized in BCP formed distinct clusters, suggesting they correspond to specific cell types, dead cells or debris ( Suppl. Fig. 5 ). In general, the cell type fractions observed in flow cytometry corresponded to proportions reported in healthy individuals with the same methodology ( 15 ). Cell size estimates derived from BCP and flow cytometry ( Suppl. Fig. 3E–F ) reflected known size differences among PBMC subtypes ( 16 , 17 ). These observations across platforms further support the validity of our cell type assignments using BCP. Finally, we found that cell type proportions in BCP were moderately correlated with flow cytometry for both B & T cells and monocyte/macrophage populations ( r =0.31; Suppl. Fig. 3G,H ), indicating general concordance between the two methods despite biology- or platform-specific biases. Benchmarking batch effect correction methods for Blood Cell Painting profiling data We next examined the quality and batch effects in the full BCP dataset of 50 million cells. Each donor contributed a median of 119,008 cells, and each well contained a median of 23,682 cells ( Fig. 3 A, B ). Cellular features extracted from the BCP confocal images for the whole dataset of 390 donors revealed a degree of clustering by plate ( Fig. 3 D ), even after normalizing features for controls ( Methods ). This prompted us to quantify batch effects as the degree of unexpected co-occurrence of cells from the same plate (batch effect score; Methods ). We evaluated the data for batch effects before and after correction using Harmony ( 18 ), ComBat ( 19 , 20 ) and linear regression. As batch factors to be corrected in the data, we used plate, well and field-of-view (FOV) separately as well as combinations of these three factors. Download figure Open in new tab Figure 3. Quality control, and batch effect quantification and correction for BCP data. Cell count distributions of A) 390 donors and B) 2000 wells (4,870,934 cells in total). C) Quantification of batch effect in uncorrected data, and in data corrected with linear regression (LinearR), ComBat, and Harmony for combinations of three batch factors (Plate, Well, FOV). 95% confidence intervals indicated with bars. D) Two-dimensional UMAP representations of cellular features before and after correction with the three methods. Colors indicate the source plate of each cell (27 plates in total). We evaluated the performance of each method with a subset of the whole dataset containing 2.69 million cells from 269 donors in 27 plates (10,000 cells from each donor). Harmony outperformed the other methods when both plate and well were used as the correcting factors, decreasing the batch effect score by 65.5% compared to 59.1% of ComBat and 8.4% of linear regression ( Fig. 3 C ; Suppl. Table 6 ). Consistently, two-dimensional UMAP representations of cellular features showed minimal clustering by plate in data corrected with Harmony ( Fig. 3 D ). Although we saw improvement when using both plate and well as factors in Harmony and ComBat, we could not evaluate these methods with all three factors (plate+well+FOV) due to excessive memory requirements. Harmony batch-corrected data was used for all subsequent analyses. Blood Cell Painting Atlas of peripheral blood mononuclear cells from healthy donors We combined all 390 donor samples after batch correction to create, to our knowledge, the largest morphological atlas of PBMCs. Cell clustering by morphological profiles yielded 18 distinct clusters encompassing a total of 42.5 million cells (clusters C3-C20; Fig. 4 A ; Suppl. Table 8 ; Methods ). Applying our morphology-based cell type classifier to the BCP Atlas revealed the two largest cell clusters to be primarily composed of lymphocyte cells (C15, 58% of all cells), and monocytes and macrophages (C9, 29%), respectively ( Fig. 4 B ). Remaining smaller clusters consisted mostly of uncategorized cells (13%). Download figure Open in new tab Figure 4. GWAS reveals distinct cell phenotypes are significantly associated with variants. UMAP of the BCP Atlas colored by A) cell clusters C3-C20 and B) cell type identified by a supervised classification procedure. Cell image examples from clusters C) C3, D) C5 and C) C13. F) A combination Manhattan plot of all 93 genome-wide significant associations (-log 10 (p)), where all significant associations for BCP features and clusters are highlighted. G) Genotype-phenotype associations for phenotype F7 in cell cluster C5 (-log 10 (p)), H) Association between lead variant rs3993974 and phenotype F7 in cell cluster C5. I) A locus zoom plot at rs3993974. Visual examination of BCP images of cells from each cluster confirmed marked morphological differences between clusters ( Fig. 4 C , Suppl. Fig. 5 ). Several clusters were enriched for cells with C-shaped or otherwise non-spherical nuclei (C3–6, C9, C18, C19). Cluster C11 consisted of cells with elongated shapes, potentially due to interacting cells or active cell division. Intriguingly, cells in cluster C13 showed a striking semicircular pattern on the mitochondrial channel wrapping around a large portion of the nucleus. This pattern may reflect perinuclear mitochondrial aggregation, a localized accumulation of mitochondria around the nucleus ( 21 ). To further delineate the composition of BCP clusters, we correlated their donor frequencies with cell type counts obtained from snRNA-seq for 315 donors ( 22 ) ( Suppl. Fig. 6A, Suppl. Table 9 ) and with complete blood counts (CBC) for 321 donors ( Suppl. Fig. 6B, Suppl. Table 9; Methods ). The strongest correlations were observed between clusters C9 and monocytes (CD14+, r =0.43; CD16+, r =0.22), and C15 and lymphoid cells (CD8 naive T, r =0.25; B naive, r =0.23; CD4 naive T, r =0.27), consistent with their morphology and supervised classification ( Fig. 4B , Suppl. Fig. 3G,H ). Based on cell morphology and snRNA-seq data, we hypothesize that C18 may contain non-polarized naive T cells with deep nuclear envelope invaginations (NEIs, “stripy” phenotype; Suppl. Fig. 5 C18 ; CD8 naive r =0.13) as recently described ( 23 ). Cluster C17 correlated with lymphocytes (B-lymf r =0.22, L-lymf r =0.24), and memory B cells ( r =0.15), CD8 naive ( r =0.14) and CD8 proliferating cells ( r =0.14), suggesting that this cluster may consist of B and T cells. In cluster C12, we observed larger, possibly damaged or dying cells with strong actin staining ( Suppl. Fig. 5 C12 ), with highest correlation to snRNA-seq and CBC monocytes. We next examined whether cell-cell interactions could be observed in BCP. For each cell, we quantified the relative enrichment (RE) of neighboring cells of each type within a 22 µm radius ( Methods ). We found that each cell type was significantly enriched in neighbors of the same type (RE>1; p <1x10 -15 , one-way ANOVA; Suppl. Fig. 7 ). In contrast, other cell types were less frequent within the interaction radius (RE<1). We also quantified the RE in each of the 18 cell clusters and observed that monocytes had a RE slightly above 1 for cluster C9 cells ( Suppl. Fig. 5 ), which were earlier classified mostly as monocytes and macrophages ( Fig. 4 ). Similarly suggestive of self-enrichment, B/T cell interactions were found to be slightly more frequent in cluster C15 ( Suppl. Fig. 5 ). Genome-wide association study of Blood Cell Painting features reveals 30 loci influencing immune cell morphology To discover germline genetic variants influencing immune cell morphology, we performed a GWAS on BCP image-derived features in healthy blood donors. As quantitative traits, we used twenty principal components of donor-averaged BCP features (F1-F20; Methods ) in 17 cell clusters, capturing major axes of morphological variation, to discover associations of cellular characteristics with germline genetic variants. We analyzed ∼10 million variants (BCP donor minor allele frequency, MAF>1.25%, at least ten carriers in donors) in 368 genotyped donors (FinnGen R12) ( 1 ). This yielded 106 genome-wide significant associations ( p <5x10 -8 ) ( Suppl. Fig. 8,9 ), of which 93 passed quality control ( Methods ), spanning 30 genomic loci ( Fig. 4 f , Suppl. Table 10). Fine-mapping with SuSiE ( 24 ) implicated high-confidence variants in genes related to transcriptional regulation ( C1orf21, ZMYM2 ), inflammatory signaling and tissue remodeling ( CHI3L1 ), cell cycle and circadian regulation ( CSNK1E ), vesicle trafficking and secretion ( PTPRN2, NCALD ), and extracellular matrix interactions ( PDGFRL ) ( Suppl. Table 13; Methods ). A prominent association was found in cluster C5 at a locus containing tryptase-encoding genes TPSB2 , TPSAB1 and TPSD1 . The lead variant (rs3993974, GWAS p =5.13x10 -9 ; SuSiE PIP=0.11; Suppl. Table 11 , Suppl. Table 13, Fig. 4 h, i ) is strongly associated with increased tryptase levels in plasma (tryptase µg/l, β =0.23, p =4.63x10 -11 ; Methods ; Suppl. Table 12 ). This region had a strong expression and splicing quantitative trait locus (eQTL, sQTL) signal for tryptase genes ( Suppl. Table 14 ). In addition, this region was marked by direct transcription factor binding by CTCF and nine additional transcription factors, as assessed by ChIPseq ( Suppl. Table 15 ). Tryptases are involved in asthma and other allergic and inflammatory disorders, and are contained in mast cells ( 25 ). The associated BCP feature (F7) reflected cell length and nuclear stain intensity ( Fig. 4 g , Suppl. Fig. 9 a, e, i; Suppl. Fig. 10). Cluster C5 also showed associations for nuclear morphology (F17) with rs71330739 ( p =4.32×10⁻⁸) near cell adhesion and migration related PARVG and PARVB , and rs62486739 ( p =3.07×10⁻⁸; PIP=0.44) in SSBP1 , a housekeeping gene involved in mitochondrial biogenesis ( Suppl. Fig. 9 b, f, j; Suppl. Fig. 10) . These variants further support the notion that C5 includes rare or immature myeloid populations with distinct nuclear morphologies. While mature mast cells are not generally present in peripheral blood, we speculate that this cluster may be composed of mast or granulocyte cell precursors, or neutrophils (CBC B-neut r =0.2; Suppl. Fig. 6 ). In cell cluster C3, nucleus solidity, cavity and textural patterns (F14) were associated with rs965618 ( p =2.28x10 -8 ; PIP=0.35) ( Suppl. Fig. 9 c, g, k; Suppl. Fig. 10) . The lead variant is an expression quantitative trait locus (eQTL) across several tissues for SCO2 , CPT1B and CHKB that are central regulators of immunity and lipid metabolism across multiple tissues ( Suppl. Table 14 ). The locus was also strongly associated with increased mean corpuscular volume (Kanta β =0.02, p =4.0x10 -27 ) and monocyte counts (OpenTargets β =0.01, p =3.99x10 -8 ; Suppl. Table 12 ). In cell cluster C13, which harbored a striking phenotype possibly due to perinuclear mitochondrial aggregation discussed above ( Fig. 4e ), nuclear, mitochondrial and actin characteristics (F8) were associated with rs13251546 with a clear additive effect ( Suppl. Fig. 9 d, h, l; Suppl. Fig. 10) . The region has previously been associated with visual disorders, varicose veins and smoking status, as well as vision issues ( 26 ). As an example of variants previously implicated in immune-related conditions and highlighted by the BCP GWAS, we found psoriasis-linked variants (OpenTargets β =-3.6, p =5.00x10⁻¹⁵; Suppl. Table 12 ) at an enhancer site near CD28 to associate with BCP features (F20; rs115029131, p =3.21x10⁻⁸). Many cells in the associating cluster C4 had a non-spherical nucleus, and might thus be monocytes or macrophages ( Suppl. Fig. 5 ). Normally CD28 is not expressed in monocytes and macrophages, but can be induced under chronic inflammation ( 27 ). Finally, we performed GWAS for all BCP phenotypes without cell clustering, but no genome-wide significant associations were found. A comparison of our results to previous GWASs ( 28 – 30 ) revealed positive correlations in association strengths ( r =0.06–0.18, p <0.005) ( Suppl. Fig. 11 , Suppl. Table 16, Suppl. Table 20 ). Association of BCP cell characteristics to donor age, sex and health registry endpoints We examined how demographic factors and health registry phenotypes relate to BCP morphological characteristics. Donor age and sex were found to associate (FDR<5%; Methods ) with several features such as nucleus, mitochondria and RNA intensity and texture as well as cell shape (F1, F2, F7, F13, F16, F17, F20; Suppl. Table 18 ) in cell clusters C9 and C11 ( Suppl. Table 17 ). C9 is composed mostly of monocytes and macrophages with strong actin intensity ( Suppl. Fig. 5 ). In C11 consisting of elongated cells, sex was associated with cell shape, texture and length as well as RNA dye intensity (FDR=3%; F2). Morphological features of cells in C19 were associated (FDR<10%; F5, F9, F17) with inflammatory and allergic endpoints such as asthma, sinusitis and pneumonia ( Suppl. Table 19 ). These cells were also associated with abnormalities of breathing, septum deviation and vocal larynx issues. Nuclei in C19 exhibit a lobular structure, suggesting they may be granulocytes or their precursors that survived PBMC isolation. Morphological characteristics of cells in C8, potentially composed of T cells, were linked to common rhinitis (F13). Interestingly, healthcare visits related to contraceptive management (ICD-10 Z30) were associated with elongated cell shapes (F16) in C11 ( Suppl. Fig. 5 ). BCP profiling of acute myeloid leukemia PBMC patient samples As a proof-of-concept study to test the generalization of the pipeline developed for healthy PBMCs, we performed the BCP protocol on PBMC samples of six acute myeloid leukemia (AML) patients and an AML cell line (MOLM-13) ( Methods , Suppl. Table 7 ). PBMCs from AML patients displayed distinct morphological profiles ( Fig. 5 ). In AMLs with minimal maturation (FAB M1, AML 2-3) and acute monocytic leukemias (M5, AML 6), we observed a cell cluster not found in healthy cells nor the other AML samples. AML samples 4 (M1) and 5 (M5) had low levels of clinically malignant cells in the blood, indicated by most of their cells clustering among the healthy cells. Finally, the AML cell line (MOLM-13) forms distinct clusters within a supercluster composed of monocytes. Download figure Open in new tab Figure 5. AML samples show a distinct distribution of BCP features compared to healthy donors. A) UMAP of BCP cellular features from AML patient and cell line samples with health PBMCs. Example images of each patient and cell line samples, as well as images of healthy B and T cells and monocytes. A cell cluster not found in healthy cells is indicated with an arrow. B-G) AML patient samples 1-6 and (H) the MOLM-13 sample compared to (I) healthy PBMCs. Discussion In this study, we aimed to characterize the morphological variability of mononuclear cells in healthy blood donors. To achieve this, we developed a modified Cell Painting ( 4 ) protocol termed Blood Cell Painting (BCP), specifically for PBMCs, optimizing it for robustness and throughput. With BCP, we created the largest Cell Painting dataset of PBMCs to date, a BCP Atlas encompassing 50 million imaged cells from 390 healthy individuals. The large number of cells profiled allowed us to capture rare morphological phenotypes, such as perinuclear aggregation of mitochondria ( 31 ) in immune cells. This work adds a novel dimension to the study of the human immune system through blood profiling ( 32 ). HCI has been shown to exhibit technical variation stemming from experimental conditions such as plate effects and cell handling ( 33 , 34 ). In line with earlier studies ( 33 , 35 ), batch correction with Harmony outperformed alternatives, and we adapted it to scale across tens of millions of cells. Additionally, we observed biases in cell type representation, where monocytes and macrophages appeared more common than expected. The observed difference in cell frequency between flow cytometry and the BCP protocol likely stems from two related factors: higher concentration of B/T cells at the edges of the well and the non-adherent nature of these cell types ( 36 ), making them more susceptible to loss during washing compared to monocytes. Further optimization of Poly-L-lysine coating of the wells to improve cell adhesion can mitigate this issue. Our supervised cell type assignment was able to differentiate between lymphoid and myeloid populations. Marker-based sorting could improve cell typing accuracy for rare populations such as NK and dendritic cells. Correlating donor-level BCP cluster frequencies with cell type counts from snRNA-seq and complete blood counts provided independent support for our morphology-based cell type classification. Concordant patterns observed for myeloid and lymphoid populations indicate that variation captured by BCP reflects true biological differences in circulating immune cell composition rather than technical artefacts. These cross-platform correlations further demonstrate BCP’s capacity to capture physiologically meaningful immune cell heterogeneity. Driven by the genotyping and health registry data available in FinnGen ( 1 ) for our study cohort, we were able to examine the determinants and correlates of immune cell morphological phenotypes. We discovered 30 novel genomic loci associated with morphological cell characteristics. The genetic architecture of immune cell morphology reflected variation in immune cell activation and differentiation, subcellular structural organization, and susceptibility to allergic and inflammatory conditions. As an example, we uncovered genetic variation at tryptase-encoding genes to strongly influence morphology of a distinct cluster of cells. Tryptases, the most abundant serine proteases stored in mast cell granules, are vital for mast cell function and activation, with a key role in allergic reactions and asthma ( 25 ). While mature mast cells are not typically found in peripheral blood, immature mast cells can be present. We also observed associations between BCP features and genetic variants previously implicated in psoriasis. For instance, a psoriasis-linked variant near CD28 was associated with cells characterized by non-spherical nuclei. This morphology may reflect, for example, activated or differentiating monocytes and macrophages. These cells are known to undergo nuclear deformation in response to environmental stimuli and immune activation ( 39 ). Systemic inflammation in psoriasis has been associated with elevated levels of low-density granulocytes (LDGs), a neutrophil subset with segmented or irregular nuclei that co-fractionate with PBMCs ( 40 ). These findings suggest that inflammatory skin disorders may leave a morphological footprint in the peripheral immune system, linking genotype-associated immune dysregulation with altered nuclear architecture. Previous studies have identified numerous germline variants associated with immune cell traits measured by flow cytometry ( 28 , 29 , 41 – 44 ) and imaging ( 30 ), and immunologic endpoints ( 45 ). Although the genome-wide significant variants found in this study were novel, we found variants with p <10 -5 in our study that had been previously associated with blood indices or morphological traits. The correlation of our GWAS results with reported variant associations from flow cytometry, bulk blood traits and high content imaging studies provides orthogonal validation for the ability of BCP to capture meaningful aspects of immune cell biology ( 28 – 30 ). Compatible with our genetic findings, BCP morphological features were associated with inflammatory endpoints such as asthma, allergies and sinusitis. We also observed morphological associations in cells with elongated morphology to leukocyte counts and healthcare visits related to contraceptive management. However, a more careful examination of this association is warranted as the endpoint does not distinguish between use of specific contraceptives, and includes any contraceptive-related visits to healthcare. Similarly to previously reported age-related decline of mitochondrial activity ( 7 ), we found mitochondrial variability in these cells to correlate with donor age. We anticipate that our extensive dataset will serve as a valuable resource for future research to delineate disease phenotypes by capturing the range of normal morphological variability, and representing a reference for comparative analyses. Our and similar future datasets could establish a baseline for healthy individuals in Cell Painting-based drug screens of pathologies of the blood ( 46 ), such as leukemias. Towards this goal, our proof-of-concept application of BCP on AML patient PBMC samples differentiated between leukemia FAB subtypes. The results revealed distinct morphological and cell type-specific differences within AML samples, demonstrating the potential of BCP for profiling leukemic samples. Nevertheless, comprehensive benchmarking with a larger number of samples is essential for establishing the BCP as a reliable tool for AML classification and profiling towards diagnostics. We foresee the training of label-free models with large BCP datasets as a promising direction for inexpensive morphological profiling ( 38 , 47 ). Our publicly available BCP Atlas offers a foundation for label-free models ( 48 – 50 ) and large-scale biological discovery. Methods Healthy blood donor sample collection The healthy blood donor samples profiled in this study originate from a FinnGen project in collaboration with the Finnish Red Cross Blood Service Biobank. The Blood Service Biobank contributed DNA samples from 58,000 blood donors to FinnGen. For a subset of these donors, live-frozen PBMCs, plasma, and serum samples were collected and stored, along with genotype data generated earlier in FinnGen 1 . Full blood count and clinical chemistry analyses were also performed from collected whole blood and serum. All biobank samples from Finnish Red Cross Blood Service Biobank were collected along with normal blood donation from donors who met the blood donation health requirements and who had given biobanking consent ( 51 ). For blood donation, blood donors must be between 18 and 70 years of age, and feeling healthy and well. If a medical condition has been diagnosed, it must be well-controlled and medicated. Certain medications and medical conditions may disqualify potential donors from donating blood either temporarily or permanently. Donated blood is collected in a standard blood bag system with Citrate Phosphate Dextrose (CPD) as anticoagulant (CompoFlow®, Fresenius Kabi, Cat.No. CQ32250). After blood donation, donated blood was transported overnight to the Blood Service’s production facility and processed within 24 hours. The red blood cells and plasma were separated from the donated whole blood by centrifugation and used for preparation of blood products. The remaining Buffy Coat fraction (∼55 ml) was passed for isolation of PBMCs to the Blood Service Biobank. PBMCs were isolated from the Buffy Coat with Ficoll isogradient centrifugation ( 52 , 53 ). After the isolation, PBMCs were stored in a freezing medium (5% filtered heat-inactivated human AB serum (Valley Biomedical), 2 mM L-glutamine (Gibco), and 1% penicillin/streptomycin (10,000 units/mL and 10,000 µg/mL respectively) (Gibco) in RPMI 1640 (Gibco) containing 10% DMSO (WAK-chemie medical GMBH)) in cryotubes (1.9 ml Tri-coded Tube, FluidX 65-7641, Azenta) and transferred into the automated gas phase liquid nitrogen freezer for long-term storing at -180 C until release and transported to the research laboratory. Blood Cell Painting protocol ‒ overview of the procedure Steps involved in the modified Cell Painting protocol for PBMC samples are described below, with a more detailed protocol of the methods found in the Supplementary Text . Cell culture, staining and fixation of PBMC samples The media used for thawing and culturing the cells was a 5% filtered heat-inactivated human AB serum (Valley Biomedical), 2 mM L-glutamine (Gibco), and 1% penicillin/streptomycin (10,000 units/mL and 10,000 µg/mL respectively) (Gibco) in RPMI 1640 (Gibco). Thawing of the samples was completed according to standard protocols. The cells were washed twice to remove cytotoxic DMSO and resuspended in culture media to contain approximately 50,000 cells/ml. Prior to the seeding of the cells, the wells of 384-well plates (CellCarrier-384 Ultra/PhenoPlate 384-well, Revvity) were coated with Poly-L-lysine hydrobromide (MP Biomedicals) to enhance electrostatic interactions between the negatively charged ions on the cell membrane to the positively charged coated well ( 54 ). Each imaged plate contained ten donor samples and a control sample. As control samples, we used sister samples from a large cohort of PBMCs collected from donors during a singular blood donation. Samples collected from a singular donor were used on 11–17 plates as controls. With the aim to image at least 100,000 cells per donor, approximately 50,000 cells per well were added in parallel to five wells on 384-well imaging plates. One control sample was added on each plate to five wells, aiming for at least 100,000 imaged cells per control. The cells were incubated at 37°C for 1.5 hours prior to adding Mitotracker (see below). After a complete two-hour incubation time at 37°C and 5% CO 2 , the plate was fixed with 8% paraformaldehyde. Fluorescence staining of healthy donor PBMCs The staining pipeline used was based on an optimized Cell Painting assay ( 4 , 5 ). The mitochondria of the living PBMCs were stained with Mitotracker Deep Red (Invitrogen) before fixation of the cells. Wheat-germ agglutinin/Alexa Fluor 555 (WGA) conjugate stock (Invitrogen), Concanavalin A/Alexa Fluor 488 conjugate stock (Invitrogen), Phalloidin/Alexa Fluor 568 conjugate stock (Invitrogen), SYTO14 green fluorescent nucleic acid stain stock (Invitrogen) and Hoechst 33342 stock (Invitrogen) were added after fixation and permeabilization of the cells, described in detail in Supplementary Text . High content imaging with Opera Phenix microscope The plates were imaged with Opera Phenix High Content Screening System (Revvity, Waltham, MA, USA) using 40x water immersion objective (NA 1.1) and four lasers (405 nm, 488 nm, 561 nm and 640 nm). A total of 64 (8x8) fields-of-view (FOV) with 5% overlap were imaged per well using five predetermined Z focus planes (1.5 µm distance between planes) with laser-based autofocusing. The images were captured with two Andor Zyla sCMOS cameras (16-bit, field of view 320x320 μm 2 , effective xy resolution 0.33 µm). Both confocal and widefield images were acquired. Detailed description of excitation and emission sources are described in Supplementary Table 3 . The experimental workflow was optimized and designed so that a single person could prepare up to four plates during a week (one plate per day), and perform sample staining during the last day of the work week. Plates were then imaged by automated microscopy over the weekend, with one plate taking approximately 10 hours to image. Approximately 35 TB of images were generated during data collection (530 GB/confocal plate, 320 GB/widefield plate). Image analysis Biology Image Analysis Software (BIAS) ( https://www.sct.bio/the-bias ; Single-Cell Technologies) was used for primary image processing, segmentation, and feature extraction ( 55 ). Both confocal and widefield images were processed using the same analysis workflow with the exception that widefield images had one extra channel used in feature extraction ( Supplementary Text ). 3D image stacks were first projected into 2D images using maximum intensity projection for fluorescence images and average intensity projection for brightfield images. Non-uniform illumination was corrected on these images using the CIDRE method ( 56 ). Next, nuclear and cellular regions were segmented using two pre-trained deep learning models. Nuclei were segmented using the nucleAIzer ( 57 ) model and the cellular regions using the nucleAIzer extension for cytoplasm segmentation (available at: https://zenodo.org/records/6790845 ). These two segmented regions were linked as cell objects including one segmented region from both models. Classical intensity, shape, and texture features were extracted from all channels on cell object regions to present 186 BCP cellular features. To ensure that cellular features from different plates are comparable, features were standardized plate-wise with respect to cellular features of the control sample on the plate. First, for each feature, we calculated mean μ and standard deviation 𝜎 for control cells. Then, the donor cellular feature values 𝑥 were standardized as . Outlier and edge removal Out of ∼55 million cells imaged, approximately 5 million were from control samples and were excluded from analysis after being used for feature scaling (Methods). Outlier removal was done based on features “NUCLEUS INTENSITY-MEAN Alexa 568” and “NUCLEUS INTENSITY-MEAN Hoechst 33342”, where all cells with scaled features with values over 40 were removed from the dataset. These were mostly falsely segmented high-intensity artefacts. In addition, edge cell removal was done based on values of features “centroid_x”, “centroid_y” and “CELL ENCLOSING CIRCLE RADIUS”, where cells were removed if they were touching the edge of the well to ensure that all analyzed cells fit completely in the field-of-view. These steps resulted in 44.8 million cells for downstream analysis and batch correction. Batch correction of BCP cellular features Three methods were employed for the batch correction of cellular features: Harmony ( 18 ), pyComBat ( 20 ) and least-squares linear regression. Harmony clusters data points into temporary clusters, computes correction factors based on the cluster centroids, and repeats until satisfactory entropy and diversity in the clusters have been reached. PyComBat is a Python implementation of the ComBat ( 19 ) batch correction method, which uses parametric and non-parametric empirical Bayes approaches to correct batch effects. We evaluated three potential sources of batch effect: plate, well, and field-of-view (FOV), and their combinations. For linear regression, corrected features were derived by subtracting the observed feature value from the feature value predicted by the correction model. We used a batch effect score to evaluate the effectiveness of the above methods by measuring whether cells from the same plate are more clustered together than expected, indicative of batch effect. The score is derived by computing, for each cell 𝑖 in the data, the fraction of cells from the same plate as cell 𝑖 amongst 𝑘 nearest cells, and normalizing by the expected fraction. To find the nearest cells, Euclidean distance in the UMAP space of cellular features was used. For each batch correction experiment, let 𝑁 be the number of cells in the whole dataset, 𝑛 𝑝 be the number of cells from the plate 𝑝, and the number of cells from the same plate in the nearest 𝑘 neighbors be 𝑥 𝑖 where 𝑖 is the cell id. We define the batch effect score as or the average of the logarithm of observed to expected fractions taken over all cells. The batch effect score for an individual cell is zero if the two ratios match, and increases when there are more cells from the same plate than expected, suggesting the presence of a batch effect. The ability of the score to detect batch effects depends on the choice of 𝑘, such that larger values of 𝑘 both allow the detection of smaller batch effects and accommodate larger between-plate differences in cell amounts. The value of k used for this study was 200. We were not able to perform batch correction on the quality-controlled set of 44.8 million cells due to insufficient memory (1,490 GB RAM) to run Harmony. Therefore, we first ran Harmony on 35 million cells in a single batch, and then corrected the remaining cells as follows: for each remaining cell, feature value was assigned as the average of three Harmony-corrected cells closest with respect to Euclidean distance to the uncorrected cell in the feature space. Clustering of cells by BCP cellular features Clustering of cells by BCP features was done by first performing two-dimensional UMAP (n_neighbors=100, min_dist=0.01) and then applying DBSCAN clustering ( 58 ) on the UMAP coordinates. After clustering cells with DBSCAN, all cells not assigned to any cluster were removed as outliers, leaving eight initial clusters. After initial clustering, further subclustering was done based on visual inspection of major clusters that could be clustered further (two largest clusters C1 and C2) ( Fig. 4 ). Parameters for subclusters were assessed by testing multiple different values for maximum distance between two points to be considered neighbours (ε) and minimum number of points within ε (minPts). The parameters for initial clustering were ε=0.08 and 35 minimum samples. The parameters for subclustering of cluster C1 were ε=0.1 and 65 minimum samples, and for cluster C2 ε=0.09 and 60 minimum samples. Cell typing To classify single cells into immune subtypes, we used a supervised machine learning pipeline in the BIAS software. We manually annotated ∼200 cells per class to train a Support Vector Machine (SVM) classifier, which was refined using an active learning loop. K-means clustering (iterations = 100, max deviance = 0) was applied to assist in stratified annotation and visualization of the feature space. Cells were annotated to four categories: monocytes, macrophages, B & T cells, and uncategorised cells. The aim was to maintain class balance during annotation to support robust training and quantification. Annotation criteria were based on established morphologies in multiplexed confocal fluorescence images. Cells were assigned into the four categories as follows ( Fig. 2 A ): 1) monocytes, large cells characterized by a kidney-shaped nucleus (bi-lobed structure). These cells exhibited a bright signal in the ER/Golgi channel (green) and the mitochondrial marker (red). The actin marker (phalloidin) formed a substantial mesh around the nucleus (orange), 2) macrophages, similar to monocytes but with a more rounded nucleus that have differentiated from monocytes in wells, 3) B and T cells, small cells with a rounded nucleus showing low signal intensity in the ER/Golgi (green), mitochondrial (red) and actin channels (orange), and 4) uncategorised, including segmented objects that did not fit the morphologies described above, for instance cell debris, dead cells, and cells exhibiting only nuclear signals. All extracted intensity, texture, and morphology features were used as inputs without prior feature selection, enabling the model to determine optimal feature weighting. The classifier was evaluated with ten-fold cross-validation: the dataset was partitioned into ten subsets, each in turn used as a test set while training on the remaining data. Classification performance was assessed using a confusion matrix that confirmed high accuracy for B & T cells and moderate separation between monocytes and macrophages. The final classifier model was then trained with the complete training dataset. Correlation of cell counts between BCP clusters, and snRNA-seq cell types and blood counts We compared the proportion of cells in BCP clusters to both snRNA-seq cell type proportions and blood counts with Pearson correlation. For each cell type available in snRNA-seq data ( 59 ), we aggregated counts per cell type (“pseudobulk”) and computed the proportion of each cell type for each donor. The snRNA-seq data was released to the FinnGen sandbox in 2023 along with other multiome data ( https://docs.finngen.fi/finngen-data-specifics/red-library-data-individual-level-data/omics-data/single-cell-transcriptomics-and-immune-profiling ). Complete blood counts included both L- (percentage) and B-values (count per liter). CBC measures the number and size of red blood cells, white blood cells, and platelets in blood, with hemoglobin and hematocrit levels. Flow cytometry analysis Cell populations were profiled using high-throughput flow cytometry (HTFC; FIMM High Throughput Biomedicine unit, HiLIFE, University of Helsinki) ( Suppl. Table 4 ). The cell type markers used were CD45 (leukocyte), CD11c (dendritic cell), CD3 (T cell), CD8 (cytotoxic T cell), CD19 (B cell), CD56 (NK cell) and CD14 (monocyte/macrophage), as well as non-viable cell exclusion dye DRAQ7. Individual cell types for comparison to Cell Painting features were gated following the protocol described in Supplementary Figure 1 . Visualization of BCP cellular features Cellular features were visualized by reducing feature dimensionality to two with Uniform Manifold Approximation and Projection (UMAP) ( 60 ). UMAP is a non-linear dimensionality reduction algorithm that aims to preserve the similarities and dissimilarities between data points while reducing the feature space dimensionality. Input cellular features to UMAP were normalized to zero mean and standard deviation of one. The used UMAP parameters were n_neighbors=100 and min_dist=0.01. In order to plot millions of data points, we used Datashader (Datashader v0.16.1., 2024, April 19, https://datashader.org ) library to accurately represent the data distributions by aggregating local data points to avoid overplotting. In UMAP plots, local regions with multiple colors (labels) appear darker than regions with fewer colors. CMplot version 4.5.1 was used to visualize multiple GWAS in the same plot. Quantification of cell-cell interactions To detect and quantify cell-cell interactions, we used the subset of 2,090,581 cells from 20 donors, for which cell typing and clustering data were available. The number of proximal cells, measured as the number of cells present within the interaction radius from the center cell, was computed using the KDTree nearest neighbor algorithm (scikit-learn v.1.1.1). The co-localization of immune cells within a 22-25 µm radius has been associated with specific immune processes and clinical variables, indicating biologically significant interactions between cells ( 61 , 62 ). Therefore, given the average cell enclosing circle radius (36.33 pixels), we set the interaction distance to 146 pixels, equivalent to 22 µm or 2 cell diameters (0.15 µm/pixel image resolution). We also computed a measure of relative enrichment (RE) to determine if certain cell types were more prevalent in the set of proximal cells than expected. Let 𝑅 be the total number of cells within the interaction radius 𝑟, let be the number of cells of type 𝐶 within the interaction radius 𝑟, let 𝑁 be the total number of cells in the dataset, and 𝑛 𝐶 be the total number of cells of type 𝐶. We defined RE as: Principal component analysis of BCP cellular features Principal component analysis (PCA) was performed for 186 BCP cellular features in order to reduce data complexity and computational burden for subsequent analyses. PCA was done with 20 principal components (PCs) denoted F1–F20 which explained >95% of variance in the dataset. To obtain donor-level features, the average of each PC in each cell cluster was computed for each donor. Genome-wide association study for cellular BCP features Genome-wide association study (GWAS) was performed to find associations between BCP cell features and genotypes in FinnGen (R12). We utilized the FinnGen DF12 dataset with 500,348 donors, 2,502 disease phenotypes and over 21 million genotyped variants ( 1 ). We considered 186 BCP features of the four fluorescent channels transformed to 20 PCs ( Suppl. Fig. 10 ). GWAS was run for all combinations of the 17 cell clusters and 20 PCs. Cell cluster C7 was not included in the analysis as it contained cells from only 67 donors. The donor-level average value of each PC in each cell cluster was treated as phenotype in GWAS. Altogether 340 GWAS were run (20 phenotypes x 17 clusters). Out of 390 donors imaged, 22 did not have covariate data available or were otherwise excluded from analysis in earlier data collection of FinnGen due to quality control or ancestry ( 1 ). The remaining 368 donors had 10.4 million germline variants present with minor allele frequency (MAF) > 0.0125 in FinnGen, and were tested against altogether 22 million germline variants available in FinnGen. Rank inverse normalization transformation (RINT) was applied to features with inflation (λ>1.05) or deflation of lambda values (λ<0.98). Regenie model ( 63 ) was used to run GWAS and the model was trained with a high-quality LD-pruned genetic relationship matrix (GRM) available in FinnGen ( 1 ). This GRM contains no population outliers or genetic duplicates, and was further pruned to only contain variants for which BCP donors had MAF>0.0125. As GWAS covariates, age, sex and the first ten genetic ancestry principal components were used. A base model for associations was also investigated with cellular feature values as independent variable and age, sex and ancestry principal components as covariates. Fine-mapping of associated variants in GWAS Fine-mapping was done for all 30 genomic regions highlighted as significant in GWAS utilizing SuSIE ( 24 ) with the FinnGen R12 pipeline and default parameters (max_region_width=6,000,000; p_threshold=5x10⁻⁸; n_causal_variants=10; window_shrink_ratio=0.9; good_cred_r2=0.25). Comparing BCP GWAS results to previous studies We combined summary statistics from previous GWASs with our BCP GWAS by variant rsIDs. For each previous study, the Pearson correlation coefficient r was computed between -log 10 ( p )-values reported in the study and obtained from the BCP GWAS for variant associations ( Suppl. Fig. 11 ). Confidence intervals for r were estimated using bootstrapping with 1,000 samples. Acute myeloid leukemia (AML) patient samples and MOLM-13 cell line sample To test BCP on PBMCs from leukemia, we used six patient-derived AML (AML1-AML6) samples from five different patients ( Suppl. Table 7 ). Two of the AML samples were collected from the same patient, with a ten-month interval between collections. The AML samples were previously clinically subtyped as acute myeloid leukemia with minimal maturation (M1, n =3), acute myeloid leukemia with maturation (M2, n =1) or acute monocytic leukemia (M5, n =2) in the FAB (French-American-British) classification system ( 64 ). The two AML M5 samples are from the same patient at diagnosis (AML5) and refractory (AML6). In addition, a MOLM-13 cell line (ACC 554) acquired from the FIMM HTB unit, originally established from the peripheral blood of a patient at relapse of AML ( 65 ) (FAB M5a) was used in the study. All AML patient samples and the MOLM-13 sample were thawed, plated, fixed, stained, imaged and analyzed using the same BCP protocol as for the healthy donor PBMC samples. All AML samples were plated together with healthy PBMC samples, aiming at least 100,000 single cells dispersed over five wells, with the standard control sample and imaged with both confocal and widefield microscopy. Code availability The code used to analyze the BCP dataset, and dataset details will be available at https://github.com/bioimage-profiling/blood-cell-painting-paper . Data availability BCP image data generated in this study is publicly available in BioImage Archive (10.6019/S-BIAD2344). Instructions on how to access FinnGen genotype and health registry data are available at https://www.finngen.fi/en/access_results . Ethical approval The Coordinating Ethics Committee of the Hospital District of Helsinki and Uusimaa have approved the FinnGen study protocol Nr HUS/990/2017. A formal biobank decision for the research project has been granted by the Finnish Red Cross Blood Service Biobank. Blood was collected from volunteering blood donors that previously have partaken in a FinnGen study and have signed a biobanking consent form with the Blood Service Biobank (The Finnish Biobank Act 688/2012). The primary cells used in this project were human PBMCs, isolated from venous whole blood, and frozen according to the Blood Service Biobank guidelines and sent to FIMM for thawing, cell seeding, fixation, staining and imaging. AML samples were collected in a study approved by an ethics committee of the Helsinki University Hospital (Ethics Committee Statement 303/13/03/01/201, latest amendment 7 dated 15 June 2016; latest HUS study permit HUS/395/2018 dated 13 February 2018; Permit numbers 239/13/03/00/2010, 303/13/03/01/2011). Author contributions Blood Cell Painting Assay development: CHS, MP, VP Blood Cell Painting Assay data modeling: GA, VT, LP, EP Methodology: CHS, VT, IM, MP, GA, AH, LP, VP, EP Formal analysis: CHS, VT, GA, CDS, IM Investigation: CHS, VT, GA, IM, MP, JS, JK, CDS, LU, HMO, LP, VP, EP Visualization: MP, VT, GA, IM, CDS, CHS Wetlab: CHS, JH, JS, TR, TA Data curation: VT, GA, CHS, IM, MP Software: GA, VT, IM Resources: JP, AH, JJ, JJM, MA, CAH, RR, MD, AP, LP, VP, EP Imaging development: AH, MP, CHS, IM Flow cytometry: TR, TA Genetic analyses: VT, LU, OK, HMO, EP Registry data analyses: VT, JK, HMO, EP Conceptualization, Supervision, Funding acquisition: LP, VP, EP Acknowledgements This study was supported by funding from the Research Council of Finland (322675 and 328890 to EP; 340273 and 346604 to LP), the Research Fund of the Finnish Red Cross Blood Service, FinnGen and iCAN Flagship. The Finnish Red Cross Blood Service Biobank personnel are acknowledged for organizing research project-specific sample collection in blood donation activities. The authors wish to acknowledge CSC – IT Center for Science, Finland, for generous computational resources. HC imaging and analysis were performed at the FIMM High Content Imaging and Analysis HCA unit, and flow cytometry at the FIMM High Throughput Biomedicine HTB unit, both supported by HiLIFE, University of Helsinki, Biocenter Finland, and Euro-Bioimaging. Prof. Peter Horvath is acknowledged for his support in image analysis and for providing BIAS software (Single Cell Technologies Ltd.) for our use. We would like to thank Prof. Matti Pirinen, Pietro Della Briotta Parolo, Vincent Llorens, Dr. Markus Vähä-Koskela, Anna Nylund, and the FinnGen helpdesk for their assistance. Prof. Olli Kallioniemi is acknowledged for scientific discussions. BioRender.com was used in creating figures. We thank all the donors and patients who have participated in this project by donating their samples. We want to acknowledge the participants and investigators of the FinnGen study. The FinnGen project is funded by two grants from Business Finland (HUS 4685/31/2016 and UH 4386/31/2016) and the following industry partners: AbbVie Inc., AstraZeneca UK Ltd, Biogen MA Inc., Bristol Myers Squibb Inc. (and Celgene Corporation & Celgene International II Sàrl), Genentech Inc., Merck Sharp & Dohme LCC, Pfizer Inc., GlaxoSmithKline Intellectual Property Development Ltd., Sanofi US Services Inc., Maze Therapeutics Inc., Johnson&Johnson Innovative Medicine Inc., Novartis AG, Boehringer Ingelheim International GmbH and Bayer AG. Following biobanks are acknowledged for delivering biobank samples to FinnGen: Auria Biobank ( www.auria.fi/biopankki ), THL Biobank ( www.thl.fi/biobank ), Helsinki Biobank ( www.helsinginbiopankki.fi ), Biobank Borealis of Northern Finland ( https://www.ppshp.fi/Tutkimus-ja-opetus/Biopankki/Pages/Biobank-Borealis-briefly-in-English.aspx ), Finnish Clinical Biobank Tampere ( www.tays.fi/en-US/Research_and_development/Finnish_Clinical_Biobank_Tampere ), Biobank of Eastern Finland ( www.ita-suomenbiopankki.fi/en ), Central Finland Biobank ( www.ksshp.fi/fi-FI/Potilaalle/Biopankki ), Finnish Red Cross Blood Service Biobank ( www.veripalvelu.fi/verenluovutus/biopankkitoiminta ), Terveystalo Biobank ( www.terveystalo.com/fi/Yritystietoa/Terveystalo-Biopankki/Biopankki/ ) and Arctic Biobank ( https://www.oulu.fi/en/university/faculties-and-units/faculty-medicine/northern-finland-birth-cohorts-and-arctic-biobank ). All Finnish Biobanks are members of BBMRI.fi infrastructure ( https://www.bbmri-eric.eu/national-nodes/finland/ ). Finnish Biobank Cooperative -FINBB ( https://finbb.fi/ ) is the coordinator of BBMRI-ERIC operations in Finland. The Finnish biobank data can be accessed through the Fingenious® services ( https://site.fingenious.fi/en/ ) managed by FINBB. Footnotes We have added results of an analysis where we correlated cell counts obtained from single-nucleus RNA-seq from the same donors. https://github.com/bioimage-profiling/blood-cell-painting-paper References 1. ↵ Kurki MI , Karjalainen J , Palta P , Sipilä TP , Kristiansson K , Donner KM , et al. FinnGen provides genetic insights from a well-phenotyped isolated population . Nature [Internet] . 2023 Jan 19 [cited 2025 Sept 29]; 613 ( 7944 ): 508 – 18 . Available from: https://www.nature.com/articles/s41586-022-05473-8 OpenUrl 2. ↵ Stubbington MJT , Rozenblatt-Rosen O , Regev A , Teichmann SA . Single-cell transcriptomics to explore the immune system in health and disease . Science [Internet] . 2017 Oct 6 [cited 2024 May 20]; 358 ( 6359 ): 58 – 63 . Available from: https://www.science.org/doi/10.1126/science.aan6828 OpenUrl 3. ↵ La Manno G , Soldatov R , Zeisel A , Braun E , Hochgerner H , Petukhov V , et al. RNA velocity of single cells . Nature [Internet] . 2018 Aug [cited 2024 May 20]; 560 ( 7719 ): 494 – 8 . Available from: https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6130801/ OpenUrl 4. ↵ Bray MA , Singh S , Han H , Davis CT , Borgeson B , Hartland C , et al. Cell Painting, a high-content image-based assay for morphological profiling using multiplexed fluorescent dyes . Nat Protoc [Internet] . 2016 Sept [cited 2024 May 20]; 11 ( 9 ): 1757 – 74 . Available from: https://www.nature.com/articles/nprot.2016.105 OpenUrl 5. ↵ Cimini BA , Chandrasekaran SN , Kost-Alimova M , Miller L , Goodale A , Fritchman B , et al. Optimizing the Cell Painting assay for image-based profiling . Nat Protoc [Internet] . 2023 July [cited 2024 May 20]; 18 ( 7 ): 1981 – 2013 . Available from: https://www.nature.com/articles/s41596-023-00840-9 OpenUrl 6. ↵ Piccinini F , Balassa T , Szkalisity A , Molnar C , Paavolainen L , Kujala K , et al. Advanced Cell Classifier: User-Friendly Machine-Learning-Based Software for Discovering Phenotypes in High-Content Imaging Data . Cell Syst [Internet] . 2017 June 28 [cited 2024 May 20]; 4 ( 6 ): 651 - 655 .e5. Available from: https://www.sciencedirect.com/science/article/pii/S2405471217302272 OpenUrl 7. ↵ Severin Y , Hale BD , Mena J , Goslings D , Frey BM , Snijder B . Multiplexed high-throughput immune cell imaging reveals molecular health-associated phenotypes . Sci Adv [Internet] . 2022 Nov 4 [cited 2024 May 20]; 8 ( 44 ): eabn5631 . Available from: https://www.science.org/doi/10.1126/sciadv.abn5631 OpenUrl 8. ↵ Snijder B , Vladimer GI , Krall N , Miura K , Schmolke AS , Kornauth C , et al. Image-based ex-vivo drug screening for patients with aggressive haematological malignancies: interim results from a single-arm, open-label, pilot study . Lancet Haematol [Internet] . 2017 Dec [cited 2024 May 20]; 4 ( 12 ):e595–606. Available from: https://linkinghub.elsevier.com/retrieve/pii/S2352302617302089 9. ↵ Caicedo JC , Arevalo J , Piccioni F , Bray MA , Hartland CL , Wu X , et al. C ell Painting predicts impact of lung cancer variants . Lippincott-Schwartz J , editor. Mol Biol Cell [Internet] . 2022 May 15 [cited 2024 May 20]; 33 ( 6 ):ar49. Available from: https://www.molbiolcell.org/doi/10.1091/mbc.E21-11-0538 10. Rohban MH , Singh S , Wu X , Berthet JB , Bray MA , Shrestha Y , et al. Systematic morphological profiling of human gene and allele function via Cell Painting . Settleman J , editor. eLife [Internet] . 2017 Mar 18 [cited 2024 May 20]; 6 : e24060 . Available from : doi: 10.7554/eLife.24060 OpenUrl CrossRef PubMed 11. ↵ Sundaresh A , Meistermann D , Lampela R , Yang Z , Woldegebriel R , Ganna A , et al. Characterization of cortical neurodevelopment in vitro using gene expression and morphology profiles from single cells [Internet] . 2023 [cited 2024 May 20]. Available from: http://biorxiv.org/lookup/doi/10.1101/2023.12.03.569583 12. ↵ Haghighi M , Caicedo JC , Cimini BA , Carpenter AE , Singh S . High-dimensional gene expression and morphology profiles of cells across 28,000 genetic and chemical perturbations . Nat Methods [Internet] . 2022 Dec [cited 2024 May 20]; 19 ( 12 ): 1550 – 7 . Available from: https://www.nature.com/articles/s41592-022-01667-0 OpenUrl 13. ↵ Ramezani M , Bauman J , Singh A , Weisbart E , Yong J , Lozada M , et al. A genome-wide atlas of human cell morphology . bioRxiv [Internet] . 2023 Aug 7 [cited 2024 May 20];2023.08.06.552164. Available from: https://www.ncbi.nlm.nih.gov/pmc/articles/PMC10441312/ 14. ↵ Willis C , Nyffeler J , Harrill J . Phenotypic Profiling of Reference Chemicals across Biologically Diverse Cell Types Using the Cell Painting Assay . SLAS Discov [Internet] . 2020 Aug [cited 2024 May 20]; 25 ( 7 ): 755 – 69 . Available from: https://linkinghub.elsevier.com/retrieve/pii/S247255522206614X OpenUrl 15. ↵ Sender R , Weiss Y , Navon Y , Milo I , Azulay N , Keren L , et al. The total mass, number, and distribution of immune cells in the human body . Proc Natl Acad Sci [Internet] . 2023 Oct 31 [cited 2024 May 20]; 120 ( 44 ):e2308511120. Available from: https://pnas.org/doi/10.1073/pnas.2308511120 16. ↵ Abbas AK , Lichtman AH , Pillai S . Cellular and molecular immunology . 2023 ; 17. ↵ Palmer L , Briggs C , McFadden S , Zini G , Burthem J , Rozenberg G , et al. ICSH recommendations for the standardization of nomenclature and grading of peripheral blood cell morphological features . Int J Lab Hematol [Internet] . 2015 June [cited 2025 Sept 29]; 37 ( 3 ): 287 – 303 . Available from: https://onlinelibrary.wiley.com/doi/10.1111/ijlh.12327 OpenUrl 18. ↵ Korsunsky I , Millard N , Fan J , Slowikowski K , Zhang F , Wei K , et al. Fast, sensitive and accurate integration of single-cell data with Harmony . Nat Methods [Internet] . 2019 Dec [cited 2024 May 20]; 16 ( 12 ): 1289 – 96 . Available from: https://www.nature.com/articles/s41592-019-0619-0 OpenUrl 19. ↵ Johnson WE , Li C , Rabinovic A . Adjusting batch effects in microarray expression data using empirical Bayes methods . Biostatistics [Internet] . 2007 Jan 1 [cited 2024 May 20]; 8 ( 1 ): 118 – 27 . Available from: https://academic.oup.com/biostatistics/article/8/1/118/252073 OpenUrl 20. ↵ Behdenna A , Colange M , Haziza J , Gema A , Appé G , Azencott CA , et al. pyComBat, a Python tool for batch effects correction in high-throughput molecular data using empirical Bayes methods . BMC Bioinformatics [Internet] . 2023 Dec 7 [cited 2024 May 20]; 24 ( 1 ):459. Available from : doi: 10.1186/s12859-023-05578-5 OpenUrl CrossRef PubMed 21. ↵ Al-Mehdi AB , Pastukh VM , Swiger BM , Reed DJ , Patel MR , Bardwell GC , et al. Perinuclear Mitochondrial Clustering Creates an Oxidant-Rich Nuclear Domain Required for Hypoxia-Induced Transcription . Sci Signal [Internet] . 2012 July 3 [cited 2025 Sept 29]; 5 ( 231 ). Available from: https://www.science.org/doi/10.1126/scisignal.2002712 22. ↵ Honkanen J , Timonen VA , Koski JR , Juvila J , Arvas M , Biobank BS , et al. Blood donor biobank pipeline to collect genome-based samples for research . bioRxiv [Internet] . 2025 ; Available from: https://www.biorxiv.org/content/early/2025/10/02/2025.09.30.679473 23. ↵ Hale BD , Severin Y , Graebnitz F , Stark D , Guignard D , Mena J , et al. Cellular architecture shapes the naïve T cell response . Science [Internet] . 2024 June 7 [cited 2025 Sept 29]; 384 ( 6700 ): eadh8697 . Available from: https://www.science.org/doi/10.1126/science.adh8967 OpenUrl 24. ↵ Wang G , Sarkar A , Carbonetto P , Stephens M . A Simple New Approach to Variable Selection in Regression, with Application to Genetic Fine Mapping . J R Stat Soc Ser B Stat Methodol [Internet] . 2020 Dec 1 [cited 2025 Sept 29]; 82 ( 5 ): 1273 – 300 . Available from: https://academic.oup.com/jrsssb/article/82/5/1273/7056114 OpenUrl 25. ↵ Payne V , Kam PCA . Mast cell tryptase: a review of its physiology and clinical significance . Anaesthesia [Internet] . 2004 July [cited 2025 Sept 29]; 59 ( 7 ): 695 – 703 . Available from: https://associationofanaesthetists-publications.onlinelibrary.wiley.com/doi/10.1111/j.1365-2044.2004.03757.x OpenUrl 26. ↵ Khan NW , Wissinger B , Kohl S , Sieving PA . CNGB3 achromatopsia with progressive loss of residual cone function and impaired rod-mediated function . Invest Ophthalmol Vis Sci . 2007 ; 27. ↵ Estrada-Capetillo L , Aragoneses-Fenoll L , Domínguez-Soto Á , Fuentelsaz-Romero S , Nieto C , Simón-Fuentes M , et al. CD28 is expressed by macrophages with anti-inflammatory potential and limits their T-cell activating capacity . Eur J Immunol [Internet] . 2021 Apr [cited 2025 Sept 29]; 51 ( 4 ): 824 – 34 . Available from: https://onlinelibrary.wiley.com/doi/10.1002/eji.202048806 OpenUrl 28. ↵ Akbari P , Vuckovic D , Stefanucci L , Jiang T , Kundu K , Kreuzhuber R , et al. A genome-wide association study of blood cell morphology identifies cellular proteins implicated in disease aetiology . Nat Commun [Internet] . 2023 Aug 18 [cited 2025 Sept 29]; 14 ( 1 ):5023. Available from: https://www.nature.com/articles/s41467-023-40679-y 29. ↵ Deecke L , Homann J , Goldeck D , Luessi F , Vandebergh M , Ohlei O , et al. Genome-wide association study reveals different T cell distributions in peripheral blood of healthy individuals at high genetic risk of type 1 diabetes and long COVID [Internet] . 2024 [cited 2025 Sept 29]. Available from: http://medrxiv.org/lookup/doi/10.1101/2024.02.08.24302520 30. ↵ Tegtmeyer M , Arora J , Asgari S , Cimini BA , Nadig A , Peirent E , et al. High-dimensional phenotyping to define the genetic basis of cellular morphology . Nat Commun [Internet] . 2024 Jan 6 [cited 2025 Sept 29]; 15 ( 1 ):347. Available from: https://www.nature.com/articles/s41467-023-44045-w 31. ↵ Lee P , Chandel NS , Simon MC . Cellular adaptation to hypoxia through hypoxia inducible factors and beyond . Nat Rev Mol Cell Biol [Internet] . 2020 May [cited 2025 Sept 29]; 21 ( 5 ): 268 – 83 . Available from: https://www.nature.com/articles/s41580-020-0227-y OpenUrl 32. ↵ Brodin P , Davis MM . Human immune system variation . Nat Rev Immunol [Internet] . 2017 Jan [cited 2024 May 20]; 17 ( 1 ): 21 – 9 . Available from: https://www.nature.com/articles/nri.2016.125 OpenUrl 33. ↵ Arevalo J , Su E , van Dijk R , Carpenter AE , Singh S . Evaluating batch correction methods for image-based cell profiling . bioRxiv [Internet] . 2024 Feb 28 [cited 2024 May 20];2023.09.15.558001. Available from: https://www.ncbi.nlm.nih.gov/pmc/articles/PMC10516049/ 34. ↵ Way GP , Sailem H , Shave S , Kasprowicz R , Carragher NO . Evolution and impact of high content imaging . SLAS Discov [Internet] . 2023 Oct 1 [cited 2024 May 20]; 28 ( 7 ): 292 – 305 . Available from: https://www.sciencedirect.com/science/article/pii/S2472555223000667 OpenUrl 35. ↵ Tran HTN , Ang KS , Chevrier M , Zhang X , Lee NYS , Goh M , et al. A benchmark of batch-effect correction methods for single-cell RNA sequencing data . Genome Biol [Internet] . 2020 Jan 16 [cited 2024 May 20]; 21 ( 1 ):12. Available from : doi: 10.1186/s13059-019-1850-9 OpenUrl CrossRef PubMed 36. ↵ Rajaraman R , Fox RA , Vethamany VG , Fernandez LA , MacSween JM . Adhesion and spreading behaviour of human peripheral blood mononuclear cells (PBMC) in vitro . Exp Cell Res [Internet] . 1977 June 1 [cited 2024 May 20]; 107 ( 1 ): 179 – 90 . Available from: https://www.sciencedirect.com/science/article/pii/0014482777903998 OpenUrl 37. Ziegler-Heitbrock L . The CD14+ CD16+ blood monocytes: their role in infection and inflammation . J Leucoc Biol [Internet] . 2007 [cited 2025 Oct 2]; 81 ( 3 ): 584 – 92 . Available from: https://academic.oup.com/jleukbio/article-abstract/81/3/584/6975555 OpenUrl 38. ↵ Timonen VA , Kerkelä E , Impola U , Penna L , Partanen J , Kilpivaara O , et al. DeepIFC: Virtual fluorescent labeling of blood cells in imaging flow cytometry data with deep learning . Cytometry A . 2023 ; 103 ( 10 ): 807 – 17 . OpenUrl PubMed 39. ↵ Trescos Y , Tessier E , Rougeaux C , Goossens PL , Tournier JN . Micropatterned Macrophage Analysis Reveals Global Cytoskeleton Constraints Induced by Bacillus anthracis Edema Toxin . Blanke SR , editor. Infect Immun [Internet] . 2015 Aug [cited 2025 Sept 29]; 83 ( 8 ): 3114 – 25 . Available from: https://journals.asm.org/doi/10.1128/IAI.00479-15 OpenUrl 40. ↵ Czerwińska J , Owczarczyk-Saczonek A . The Role of the Neutrophilic Network in the Pathogenesis of Psoriasis . Int J Mol Sci [Internet] . 2022 Feb 6 [cited 2025 Sept 29]; 23 ( 3 ):1840. Available from: https://www.mdpi.com/1422-0067/23/3/1840 41. ↵ Astle WJ , Elding H , Jiang T , Allen D , Ruklisa D , Mann AL , et al. The Allelic Landscape of Human Blood Cell Trait Variation and Links to Common Complex Disease . Cell [Internet] . 2016 Nov [cited 2025 Sept 29]; 167 ( 5 ): 1415 - 1429 .e19. Available from: https://linkinghub.elsevier.com/retrieve/pii/S0092867416314635 OpenUrl 42. Chen MH , Raffield LM , Mousas A , Sakaue S , Huffman JE , Moscati A , et al. Trans-ethnic and Ancestry-Specific Blood-Cell Genetics in 746,667 Individuals from 5 Global Populations . Cell [Internet] . 2020 Sept [cited 2025 Sept 29]; 182 ( 5 ): 1198 - 1213 .e14. Available from: https://linkinghub.elsevier.com/retrieve/pii/S0092867420308229 OpenUrl 43. Nalls MA , Couper DJ , Tanaka T , Van Rooij FJA , Chen MH , Smith AV , et al. Multiple Loci Are Associated with White Blood Cell Phenotypes . Visscher PM , editor. PLoS Genet [Internet] . 2011 June 30 [cited 2025 Sept 29]; 7 ( 6 ):e1002113. Available from: https://dx.plos.org/10.1371/journal.pgen.1002113 44. ↵ Vuckovic D , Bao EL , Akbari P , Lareau CA , Mousas A , Jiang T , et al. The Polygenic and Monogenic Basis of Blood Traits and Diseases . Cell [Internet] . 2020 Sept [cited 2025 Sept 29]; 182 ( 5 ): 1214 - 1231 .e11. Available from: https://linkinghub.elsevier.com/retrieve/pii/S0092867420309995 OpenUrl 45. ↵ Kundu K , Tardaguila M , Mann AL , Watt S , Ponstingl H , Vasquez L , et al. Genetic associations at regulatory phenotypes improve fine-mapping of causal variants for 12 immune-mediated diseases . Nat Genet [Internet] . 2022 Mar [cited 2025 Sept 29]; 54 ( 3 ): 251 – 62 . Available from: https://www.nature.com/articles/s41588-022-01025-y OpenUrl 46. ↵ Chandrasekaran SN , Cimini BA , Goodale A , Miller L , Kost-Alimova M , Jamali N , et al. Three million images and morphological profiles of cells treated with matched chemical and genetic perturbations . Nat Methods [Internet] . 2024 June [cited 2025 Sept 29]; 21 ( 6 ): 1114 – 21 . Available from: https://www.nature.com/articles/s41592-024-02241-6 OpenUrl 47. ↵ Cross-Zamirski JO , Mouchet E , Williams G , Schönlieb CB , Turkki R , Wang Y . Label-free prediction of cell painting from brightfield images . Sci Rep [Internet] . 2022 June 15 [cited 2024 May 20]; 12 ( 1 ):10001. Available from: https://www.nature.com/articles/s41598-022-12914-x 48. ↵ Atarsaikhan G , Mogollon I , Välimäki K , iCAN , Mirtti T , Pellinen T , et al. Self-supervised learning enables unbiased patient characterization from multiplexed cancer tissue microscopy images [Internet] . 2025 [cited 2025 Sept 29]. Available from: http://biorxiv.org/lookup/doi/10.1101/2025.03.05.640729 49. Bommasani R , Hudson DA , Adeli E , Altman R , Arora S , von Arx S , et al. On the Opportunities and Risks of Foundation Models . 2021 [cited 2024 May 20]; Available from: https://arxiv.org/abs/2108.07258 50. ↵ Pfaendler R , Hanimann J , Lee S , Snijder B. Self-supervised vision transformers accurately decode cellular state heterogeneity [Internet] . 2023 [cited 2024 May 20]. Available from: http://biorxiv.org/lookup/doi/10.1101/2023.01.16.524226 51. ↵ Clancy J , Ritari J , Vaittinen E , Arvas M , Tammi S , Koskela S , et al. Blood donor biobank as a resource in personalised biomedical genetic research . Eur J Hum Genet [Internet] . 2024 Jan 12 [cited 2024 May 20];1–9. Available from: https://www.nature.com/articles/s41431-023-01528-0 52. ↵ Boyum A . Isolation of mononuclear cells and granulocytes from human blood . Scand J Clin Lab Invest [Internet] . 1968 [cited 2025 Sept 29]; 21 : 77 – 89 . Available from: https://cir.nii.ac.jp/crid/1573387449149116928 OpenUrl 53. ↵ Noble PB , Cutts JH . Separation of blood leukocytes by Ficoll gradient . Can Vet J [Internet] . 1967 May [cited 2025 Sept 29]; 8 ( 5 ): 110 – 1 . Available from: https://www.ncbi.nlm.nih.gov/pmc/articles/PMC1696854/ OpenUrl 54. ↵ Jacobson BS , Branton D . Plasma Membrane: Rapid Isolation and Exposure of the Cytoplasmic Surface by Use of Positively Charged Beads . Science [Internet] . 1977 Jan 21 [cited 2024 May 20]; 195 ( 4275 ): 302 – 4 . Available from: https://www.science.org/doi/10.1126/science.831278 OpenUrl 55. ↵ Mund A , Coscia F , Kriston A , Hollandi R , Kovács F , Brunner AD , et al. Deep Visual Proteomics defines single-cell identity and heterogeneity . Nat Biotechnol [Internet] . 2022 Aug [cited 2025 Sept 29]; 40 ( 8 ): 1231 – 40 . Available from: https://www.nature.com/articles/s41587-022-01302-5 OpenUrl 56. ↵ Smith K , Li Y , Piccinini F , Csucs G , Balazs C , Bevilacqua A , et al. CIDRE: an illumination-correction method for optical microscopy . Nat Methods [Internet] . 2015 May [cited 2024 May 20]; 12 ( 5 ): 404 – 6 . Available from: https://www.nature.com/articles/nmeth.3323 OpenUrl 57. ↵ Hollandi R , Szkalisity A , Toth T , Tasnadi E , Molnar C , Mathe B , et al. nucleAIzer: A Parameter-free Deep Learning Framework for Nucleus Segmentation Using Image Style Transfer . Cell Syst [Internet] . 2020 May 20 [cited 2024 May 20]; 10 ( 5 ): 453 - 458 .e6. Available from: https://www.sciencedirect.com/science/article/pii/S2405471220301174 OpenUrl 58. ↵ Hahsler M , Piekenbrock M, dbscan DD. Fast density-based clustering with R . J Stat Softw . 2019 ; 91 : 1 – 30 . OpenUrl CrossRef 59. ↵ Jarno Honkanen , Veera A. Timonen , Jessica Koski , Julianna Juvila , Mikko Arvas , Blood Service Biobank , et al. Blood donor biobank pipeline to collect genome-based samples for research . bioRxiv . 2025 Oct; 60. ↵ McInnes L , Healy J , Melville J . UMAP: Uniform Manifold Approximation and Projection for Dimension Reduction . 2018 [cited 2024 May 20]; Available from: https://arxiv.org/abs/1802.03426 61. ↵ Brück O , Lee MH , Turkki R , Uski I , Penttilä P , Paavolainen L , et al. Spatial immunoprofiling of the intratumoral and peritumoral tissue of renal cell carcinoma patients . Mod Pathol [Internet] . 2021 Dec [cited 2025 Sept 29]; 34 ( 12 ): 2229 – 41 . Available from: https://linkinghub.elsevier.com/retrieve/pii/S0893395222003842 OpenUrl 62. ↵ Liarski VM , Sibley A , Van Panhuys N , Ai J , Chang A , Kennedy D , et al. Quantifying in situ adaptive immune cell cognate interactions in humans . Nat Immunol [Internet] . 2019 Apr [cited 2025 Sept 29]; 20 ( 4 ): 503 – 13 . Available from: https://www.nature.com/articles/s41590-019-0315-3 OpenUrl 63. ↵ Mbatchou J , Barnard L , Backman J , Marcketta A , Kosmicki JA , Ziyatdinov A , et al. Computationally efficient whole-genome regression for quantitative and binary traits . Nat Genet [Internet] . 2021 July [cited 2025 Sept 29]; 53 ( 7 ): 1097 – 103 . Available from: https://www.nature.com/articles/s41588-021-00870-7 OpenUrl 64. ↵ Bennett JM , Catovsky D , Daniel M , Flandrin G , Galton DAG , Gralnick HR , et al. Proposals for the Classification of the Acute Leukaemias F RENCH -A MERICAN -B RITISH (FAB) C O-OPERATIVE G ROUP . Br J Haematol [Internet] . 1976 Aug [cited 2024 May 20]; 33 ( 4 ): 451 – 8 . Available from: https://onlinelibrary.wiley.com/doi/10.1111/j.1365-2141.1976.tb03563.x OpenUrl 65. ↵ Matsuo Y , MacLeod R a. F , Uphoff CC , Drexler HG , Nishizaki C , Katayama Y , et al. Two acute monocytic leukemia (AML-M5a) cell lines (MOLM-13 and MOLM-14) with interclonal phenotypic heterogeneity showing MLL-AF9 fusion resulting from an occult chromosome insertion, ins(11;9)(q23;p22p23) . Leukemia [Internet] . 1997 Sept [cited 2024 May 20]; 11 ( 9 ): 1469 – 77 . Available from: https://www.nature.com/articles/2400768 OpenUrl View the discussion thread. Back to top Previous Next Posted November 16, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Image-based profiling of healthy donor immune cells with Blood Cell Painting reveals novel genotype-phenotype associations Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Image-based profiling of healthy donor immune cells with Blood Cell Painting reveals novel genotype-phenotype associations Caroline Högel-Starck , Veera A. Timonen , Gantugs Atarsaikhan , Isabel Mogollon , Minttu Polso , Antti Hassinen , Jarno Honkanen , Cindy David Sarmento , Jessica Koski , Julius Soini , Lea Urpa , Tanja Ruokoranta , Toveann Ahlnäs , Julianna Juvila , Juho J. Miettinen , Rodosthenis S. Rodosthenous , FinnGen , Outi Kilpivaara , Mikko Arvas , Caroline A. Heckman , Jukka Partanen , Mark Daly , Aarno Palotie , Hanna M. Ollila , Lassi Paavolainen , Vilja Pietiäinen , Esa Pitkänen bioRxiv 2024.05.17.594648; doi: https://doi.org/10.1101/2024.05.17.594648 Share This Article: Copy Citation Tools Image-based profiling of healthy donor immune cells with Blood Cell Painting reveals novel genotype-phenotype associations Caroline Högel-Starck , Veera A. Timonen , Gantugs Atarsaikhan , Isabel Mogollon , Minttu Polso , Antti Hassinen , Jarno Honkanen , Cindy David Sarmento , Jessica Koski , Julius Soini , Lea Urpa , Tanja Ruokoranta , Toveann Ahlnäs , Julianna Juvila , Juho J. Miettinen , Rodosthenis S. Rodosthenous , FinnGen , Outi Kilpivaara , Mikko Arvas , Caroline A. Heckman , Jukka Partanen , Mark Daly , Aarno Palotie , Hanna M. Ollila , Lassi Paavolainen , Vilja Pietiäinen , Esa Pitkänen bioRxiv 2024.05.17.594648; doi: https://doi.org/10.1101/2024.05.17.594648 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Cell Biology Subject Areas All Articles Animal Behavior and Cognition (7649) Biochemistry (17737) Bioengineering (13925) Bioinformatics (42059) Biophysics (21495) Cancer Biology (18643) Cell Biology (25576) Clinical Trials (138) Developmental Biology (13405) Ecology (19946) Epidemiology (2067) Evolutionary Biology (24370) Genetics (15626) Genomics (22551) Immunology (17769) Microbiology (40480) Molecular Biology (17209) Neuroscience (88782) Paleontology (667) Pathology (2843) Pharmacology and Toxicology (4835) Physiology (7662) Plant Biology (15177) Scientific Communication and Education (2047) Synthetic Biology (4304) Systems Biology (9838) Zoology (2272)
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.