Cell-type specific inference from bulk RNA-sequencing data by integrating single cell reference profiles via EPIC-unmix | Research Square window.SnipcartSettings = { analytics: { enabled: false } }; (function() { var accessVector = localStorage.getItem('access_vector') || ''; window.dataLayer = window.dataLayer || []; if (accessVector) { window.dataLayer.push({ user: { profile: { profileInfo: { snid: accessVector } } } }); } })(); (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0],j=d.createElement(s),dl=l!='dataLayer'?'&l='+l:'';j.async=true;j.src='https://www.googletagmanager.com/gtm.js?id='+i+dl;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-K279D39R'); Browse Preprints In Review Journals COVID-19 Preprints AJE Video Bytes Research Tools Research Promotion AJE Professional Editing AJE Rubriq About Preprint Platform In Review Editorial Policies Our Team Advisory Board Help Center Sign In Submit a Preprint Cite Share Download PDF Method Article Cell-type specific inference from bulk RNA-sequencing data by integrating single cell reference profiles via EPIC-unmix Chenwei Tang, Quan Sun, Xinyue Zeng, Gang Li, Xiaoyu Yang, Fei Liu, and 5 more This is a preprint; it has not been peer reviewed by a journal. https://doi.org/ 10.21203/rs.3.rs-4979032/v1 This work is licensed under a CC BY 4.0 License Status: Published Journal Publication published 20 Nov, 2025 Read the published version in Genome Biology → Version 1 posted 14 You are reading this latest preprint version Abstract Cell type-specific (CTS) analysis is crucial for uncovering biological insights hidden in bulk tissue data, yet single-cell (sc) or single-nuclei (sn) approaches are often cost-prohibitive for large samples. We introduce EPIC-unmix, a novel two-step empirical Bayesian method combining reference sc/sn and bulk RNA-seq data to improve CTS inference, accounting for the difference between reference and target datasets. Under comprehensive simulations, EPIC-unmix outperformed alternative methods in accuracy. Applied to Alzheimer's disease (AD) brain RNA-seq data, EPIC-unmix identified multiple differentially expressed genes in a CTS manner, and empowered CTS eQTL analysis. Full Text Additional Declarations No competing interests reported. Supplementary Files SupplementalFigures.pdf SupplementalTablefinal.xlsx Cite Share Download PDF Status: Published Journal Publication published 20 Nov, 2025 Read the published version in Genome Biology → Version 1 posted Editorial decision: Revision requested 24 Mar, 2025 Reviews received at journal 14 Mar, 2025 Reviews received at journal 09 Mar, 2025 Reviews received at journal 06 Mar, 2025 Reviewers agreed at journal 23 Feb, 2025 Reviewers agreed at journal 23 Feb, 2025 Reviewers agreed at journal 18 Feb, 2025 Reviewers agreed at journal 17 Sep, 2024 Reviewers agreed at journal 16 Sep, 2024 Reviewers invited by journal 12 Sep, 2024 Editor invited by journal 02 Sep, 2024 Editor assigned by journal 30 Aug, 2024 Submission checks completed at journal 27 Aug, 2024 First submitted to journal 26 Aug, 2024 You are reading this latest preprint version Research Square lets you share your work early, gain feedback from the community, and start making changes to your manuscript prior to peer review in a journal. As a division of Research Square Company, we’re committed to making research communication faster, fairer, and more useful. We do this by developing innovative software and high quality services for the global research community. Our growing team is made up of researchers and industry professionals working together to solve the most critical problems facing scientific publishing. Also discoverable on Platform About Our Team In Review Editorial Policies Advisory Board Help Center Resources Author Services Accessibility API Access RSS feed Manage Cookie Preferences © Research Square 2026 | ISSN 2693-5015 (online) Privacy Policy Terms of Service Do Not Sell My Personal Information {"props":{"pageProps":{"initialData":{"identity":"rs-4979032","acceptedTermsAndConditions":true,"allowDirectSubmit":false,"archivedVersions":[],"articleType":"Method Article","associatedPublications":[],"authors":[{"id":357490519,"identity":"8031fe74-34de-4dee-8df9-7b13fea82284","order_by":0,"name":"Chenwei Tang","email":"","orcid":"","institution":"University of North Carolina at Chapel Hill","correspondingAuthor":false,"prefix":"","firstName":"Chenwei","middleName":"","lastName":"Tang","suffix":""},{"id":357490524,"identity":"48f9c66e-d40c-4ec3-b444-f871ce417088","order_by":1,"name":"Quan Sun","email":"","orcid":"","institution":"University of North Carolina at Chapel Hill","correspondingAuthor":false,"prefix":"","firstName":"Quan","middleName":"","lastName":"Sun","suffix":""},{"id":357490527,"identity":"acb9be3f-9d30-4ad1-8df3-3f4d0151ac06","order_by":2,"name":"Xinyue Zeng","email":"","orcid":"","institution":"University of North Carolina at Chapel Hill","correspondingAuthor":false,"prefix":"","firstName":"Xinyue","middleName":"","lastName":"Zeng","suffix":""},{"id":357490528,"identity":"0247ae6b-9f9a-4741-bdb5-4afdc301f5f0","order_by":3,"name":"Gang Li","email":"","orcid":"","institution":"University of Washington","correspondingAuthor":false,"prefix":"","firstName":"Gang","middleName":"","lastName":"Li","suffix":""},{"id":357490529,"identity":"67dd9ebd-8ca5-4d2b-a807-3c3aabc3a0cf","order_by":4,"name":"Xiaoyu Yang","email":"","orcid":"","institution":"University of California, San Francisco","correspondingAuthor":false,"prefix":"","firstName":"Xiaoyu","middleName":"","lastName":"Yang","suffix":""},{"id":357490530,"identity":"223c530c-5f1d-4a42-a2c6-926aebbf28f9","order_by":5,"name":"Fei Liu","email":"","orcid":"","institution":"National University of Singapore","correspondingAuthor":false,"prefix":"","firstName":"Fei","middleName":"","lastName":"Liu","suffix":""},{"id":357490532,"identity":"aaab86ef-da5f-4817-a05c-5a4ebaf15e23","order_by":6,"name":"Jinying Zhao","email":"","orcid":"","institution":"University of Florida","correspondingAuthor":false,"prefix":"","firstName":"Jinying","middleName":"","lastName":"Zhao","suffix":""},{"id":357490534,"identity":"d2bf4adf-d753-4510-903f-35150fb9ef67","order_by":7,"name":"Yin Shen","email":"","orcid":"","institution":"University of California, San Francisco","correspondingAuthor":false,"prefix":"","firstName":"Yin","middleName":"","lastName":"Shen","suffix":""},{"id":357490535,"identity":"c34321ae-0efb-42e9-8c7b-038defbf3ae7","order_by":8,"name":"Boxiang Liu","email":"","orcid":"","institution":"National University of Singapore","correspondingAuthor":false,"prefix":"","firstName":"Boxiang","middleName":"","lastName":"Liu","suffix":""},{"id":357490536,"identity":"b7eba42c-193a-4921-ad85-cf790b8a1cc2","order_by":9,"name":"Jia Wen","email":"","orcid":"","institution":"University of North Carolina at Chapel Hill","correspondingAuthor":false,"prefix":"","firstName":"Jia","middleName":"","lastName":"Wen","suffix":""},{"id":357490538,"identity":"cfa796d2-3446-43be-ad60-4e23c79108fe","order_by":10,"name":"Yun Li","email":"data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAZAAAAAyAQMAAABI0h/eAAAABlBMVEX///8AAABVwtN+AAAACXBIWXMAAA7EAAAOxAGVKw4bAAAAu0lEQVRIiWNgGAWjYLCCBwY2QDIByjtAjJYEgzSStTAcJkGLwY3cAwwJBeej+dkT2KQLahjk+G4kENKSlwB02O3cmT0P2KRnHGMwliSsJccArGXDDaAtvA0MiRuI1HIudz9USz2xWg7kbpCAaEkwIKRF8swbkJbk3BlnHjZb8xyTMJx55gF+LXzHgbZ8+GOX29+efPA2T42NPN9xArYoHGBg/wFhMjYACQn8ykFAvoGwmlEwCkbBKBjpAACKpUR3AdaE4gAAAABJRU5ErkJggg==","orcid":"","institution":"University of North Carolina at Chapel Hill","correspondingAuthor":true,"prefix":"","firstName":"Yun","middleName":"","lastName":"Li","suffix":""}],"badges":[],"createdAt":"2024-08-26 15:28:04","currentVersionCode":1,"declarations":"","doi":"10.21203/rs.3.rs-4979032/v1","doiUrl":"https://doi.org/10.21203/rs.3.rs-4979032/v1","draftVersion":[],"editorialEvents":[{"content":"https://doi.org/10.1186/s13059-025-03847-5","type":"published","date":"2025-11-20T15:58:29+00:00"}],"editorialNote":"","failedWorkflow":false,"files":[{"id":96650200,"identity":"56741692-8b76-46d9-aa52-787d82175fba","added_by":"auto","created_at":"2025-11-24 16:09:39","extension":"pdf","order_by":1,"title":"","display":"","copyAsset":false,"role":"manuscript-pdf","size":1066616,"visible":true,"origin":"","legend":"","description":"","filename":"finalcleanedGBEPICunmixmanuscriptcoauthoerreviewed.pdf","url":"https://assets-eu.researchsquare.com/files/rs-4979032/v1_covered_8cce57d7-98ad-4ce9-a950-c462b309f0aa.pdf"},{"id":65337946,"identity":"3f0a497d-9f7e-4221-aa1d-8f990b55183e","added_by":"auto","created_at":"2024-09-26 08:33:15","extension":"pdf","order_by":1,"title":"","display":"","copyAsset":false,"role":"supplement","size":675054,"visible":true,"origin":"","legend":"","description":"","filename":"SupplementalFigures.pdf","url":"https://assets-eu.researchsquare.com/files/rs-4979032/v1/9f1e99a7659a23fc9d0c4a74.pdf"},{"id":65339469,"identity":"46a0e7b4-2cfc-4f71-ae6f-91419094f0ba","added_by":"auto","created_at":"2024-09-26 08:41:15","extension":"xlsx","order_by":2,"title":"","display":"","copyAsset":false,"role":"supplement","size":230965,"visible":true,"origin":"","legend":"","description":"","filename":"SupplementalTablefinal.xlsx","url":"https://assets-eu.researchsquare.com/files/rs-4979032/v1/cbf068a37862013ed87492c0.xlsx"}],"financialInterests":"No competing interests reported.","formattedTitle":"Cell-type specific inference from bulk RNA-sequencing data by integrating single cell reference profiles via EPIC-unmix","fulltext":[],"fulltextSource":"","fullText":"","funders":[],"hasAdminPriorityOnWorkflow":false,"hasManuscriptDocX":false,"hasOptedInToPreprint":true,"hasPassedJournalQc":"","hasAnyPriority":false,"hideJournal":false,"highlight":"","institution":"","isAcceptedByJournal":true,"isAuthorSuppliedPdf":true,"isDeskRejected":"","isHiddenFromSearch":false,"isInQc":false,"isInWorkflow":false,"isPdf":true,"isPdfUpToDate":true,"isWithdrawnOrRetracted":false,"journal":{"display":true,"email":"
[email protected]","identity":"genome-biology","isNatureJournal":false,"hasQc":true,"allowDirectSubmit":false,"externalIdentity":"gbio","sideBox":"Learn more about [Genome Biology](https://genomebiology.biomedcentral.com/)","snPcode":"13059","submissionUrl":"https://submission.springernature.com/new-submission/13059/3","title":"Genome Biology","twitterHandle":"","acdcEnabled":true,"dfaEnabled":true,"editorialSystem":"stoa","reportingPortfolio":"BMC/SO AJ","inReviewEnabled":true,"inReviewRevisionsEnabled":true},"keywords":"","lastPublishedDoi":"10.21203/rs.3.rs-4979032/v1","lastPublishedDoiUrl":"https://doi.org/10.21203/rs.3.rs-4979032/v1","license":{"name":"CC BY 4.0","url":"https://creativecommons.org/licenses/by/4.0/"},"manuscriptAbstract":"\u003cp\u003eCell type-specific (CTS) analysis is crucial for uncovering biological insights hidden in bulk tissue data, yet single-cell (sc) or single-nuclei (sn) approaches are often cost-prohibitive for large samples. We introduce EPIC-unmix, a novel two-step empirical Bayesian method combining reference sc/sn and bulk RNA-seq data to improve CTS inference, accounting for the difference between reference and target datasets. Under comprehensive simulations, EPIC-unmix outperformed alternative methods in accuracy. Applied to Alzheimer's disease (AD) brain RNA-seq data, EPIC-unmix identified multiple differentially expressed genes in a CTS manner, and empowered CTS eQTL analysis.\u003c/p\u003e","manuscriptTitle":"Cell-type specific inference from bulk RNA-sequencing data by integrating single cell reference profiles via EPIC-unmix","msid":"","msnumber":"","nonDraftVersions":[{"code":1,"date":"2024-09-26 08:33:10","doi":"10.21203/rs.3.rs-4979032/v1","editorialEvents":[{"type":"communityComments","content":0},{"type":"decision","content":"Revision requested","date":"2025-03-24T06:27:21+00:00","index":"","fulltext":""},{"type":"editorInvitedReview","content":"","date":"2025-03-14T04:18:59+00:00","index":"hide","fulltext":""},{"type":"editorInvitedReview","content":"","date":"2025-03-10T02:12:57+00:00","index":"hide","fulltext":""},{"type":"editorInvitedReview","content":"","date":"2025-03-06T23:30:46+00:00","index":"hide","fulltext":""},{"type":"reviewerAgreed","content":"160253346831729292111913178806361229656","date":"2025-02-24T03:24:00+00:00","index":"hide","fulltext":""},{"type":"reviewerAgreed","content":"82208486400123330069543991329053358324","date":"2025-02-23T21:14:31+00:00","index":"hide","fulltext":""},{"type":"reviewerAgreed","content":"28250551483355518387538240839630486373","date":"2025-02-18T14:25:21+00:00","index":"hide","fulltext":""},{"type":"reviewerAgreed","content":"187918661905222279349928949757800493102","date":"2024-09-17T15:26:42+00:00","index":"hide","fulltext":""},{"type":"reviewerAgreed","content":"185687190905621548851363932374311268001","date":"2024-09-16T14:51:04+00:00","index":"hide","fulltext":""},{"type":"reviewersInvited","content":"","date":"2024-09-12T04:44:20+00:00","index":"","fulltext":""},{"type":"editorInvited","content":"","date":"2024-09-02T07:13:04+00:00","index":"","fulltext":""},{"type":"editorAssigned","content":"","date":"2024-08-30T12:37:50+00:00","index":"","fulltext":""},{"type":"checksComplete","content":"","date":"2024-08-27T08:37:08+00:00","index":"","fulltext":""},{"type":"submitted","content":"Genome Biology","date":"2024-08-26T15:26:53+00:00","index":"","fulltext":""}],"status":"published","journal":{"display":true,"email":"
[email protected]","identity":"genome-biology","isNatureJournal":false,"hasQc":true,"allowDirectSubmit":false,"externalIdentity":"gbio","sideBox":"Learn more about [Genome Biology](https://genomebiology.biomedcentral.com/)","snPcode":"13059","submissionUrl":"https://submission.springernature.com/new-submission/13059/3","title":"Genome Biology","twitterHandle":"","acdcEnabled":true,"dfaEnabled":true,"editorialSystem":"stoa","reportingPortfolio":"BMC/SO AJ","inReviewEnabled":true,"inReviewRevisionsEnabled":true}}],"origin":"","ownerIdentity":"7295f935-6097-49c4-a908-a5421836053c","owner":[],"postedDate":"September 26th, 2024","published":true,"recentEditorialEvents":[],"rejectedJournal":[],"revision":"","amendment":"","status":"published-in-journal","subjectAreas":[],"tags":[],"updatedAt":"2025-11-24T16:03:20+00:00","versionOfRecord":{"articleIdentity":"rs-4979032","link":"https://doi.org/10.1186/s13059-025-03847-5","journal":{"identity":"genome-biology","isVorOnly":false,"title":"Genome Biology"},"publishedOn":"2025-11-20 15:58:29","publishedOnDateReadable":"November 20th, 2025"},"versionCreatedAt":"2024-09-26 08:33:10","video":"","vorDoi":"10.1186/s13059-025-03847-5","vorDoiUrl":"https://doi.org/10.1186/s13059-025-03847-5","workflowStages":[]},"version":"v1","identity":"rs-4979032","journalConfig":"researchsquare"},"__N_SSP":true},"page":"/article/[identity]/[[...version]]","query":{"redirect":"/article/rs-4979032","identity":"rs-4979032","version":["v1"]},"buildId":"qtupq5eGEP_6zYnWcrvyt","isFallback":false,"isExperimentalCompile":false,"dynamicIds":[84888],"gssp":true,"scriptLoader":[]}
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.