scDock: Streamlining drug discovery targeting cell-cell communication via scRNA-seq analysis and molecular docking

doi:10.1101/2025.11.20.689638

scDock: Streamlining drug discovery targeting cell-cell communication via scRNA-seq analysis and molecular docking

2025 · doi:10.1101/2025.11.20.689638

preprint OA: closed

📄 Open PDF Full text JSON View at publisher

Full text 29,323 characters · extracted from preprint-html · click to expand

scDock: Streamlining drug discovery targeting cell-cell communication via scRNA-seq analysis and molecular docking | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results scDock: Streamlining drug discovery targeting cell-cell communication via scRNA-seq analysis and molecular docking Chen-Hao Huang , Yen-Jen Oyang , Hsuan-Cheng Huang , Hsueh-Fen Juan doi: https://doi.org/10.1101/2025.11.20.689638 Chen-Hao Huang 1 Graduate Institute of Biomedical Electronics and Bioinformatics, National Taiwan University , Taipei 106, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site Yen-Jen Oyang 1 Graduate Institute of Biomedical Electronics and Bioinformatics, National Taiwan University , Taipei 106, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site Hsuan-Cheng Huang 2 Institute of Biomedical Informatics, National Yang Ming Chiao Tung University , Taipei 112, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: yukijuan{at}ntu.edu.tw hsuancheng{at}nycu.edu.tw Hsueh-Fen Juan 1 Graduate Institute of Biomedical Electronics and Bioinformatics, National Taiwan University , Taipei 106, Taiwan 3 Department of Life Science, National Taiwan University , Taipei 106, Taiwan 4 Center for Computational and Systems Biology, National Taiwan University , Taipei 106, Taiwan Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: yukijuan{at}ntu.edu.tw hsuancheng{at}nycu.edu.tw Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract Summary Identifying drugs that target intercellular communication networks represents a promising therapeutic strategy, yet linking single-cell RNA sequencing (scRNA-seq) analysis to structure-based drug screening remains technically challenging and requires substantial bioinformatics expertise. We present scDock, an integrated and user-friendly pipeline that seamlessly connects scRNA-seq data processing, cell–cell communication inference, and molecular docking-based drug discovery. Through a single configuration file, users can execute the complete workflow, from raw scRNA-seq data to ranked drug candidates, without programming skills. scDock automates the identification of disease-relevant ligand–receptor interactions from scRNA-seq data and perfoms structure-based virtual screening against these communication targets using Protein Data Bank (PDB) or AlphaFold-predicted protein structures. The pipeline generates comprehensive outputs at each stage, enabling users to explore intercellular signaling alterations and discover therapeutic compounds targeting specific cell–cell communications. scDock addresses a critical gap by providing an accessible end-to-end solution for communication-targeted drug discovery from single-cell data. Availability and Implementation scDock is freely available at https://github.com/Andrewneteye4343/scDock . It is implemented in R, Python, shell scripts, and supports Linux systems, including Ubuntu and Debian. 1 Introduction Single-cell RNA sequencing (scRNA-seq) provides high-resolution gene expression profiling at the level of individual cells, offering insights into cellular heterogeneity and complex biological processes that cannot be captured by bulk RNA sequencing ( Cao et al., 2017 ). Recent methodological advances, including cell–cell communication inference ( Jin et al., 2025 ), transcription factor prediction ( Aibar et al., 2017 ), and transcriptional dynamics modeling ( Bergen et al., 2020 ), have further expanded the analytical scope of scRNA-seq, enabling a more comprehensive characterization of transcriptomic landscapes and the mechanisms that underlie diverse biological states. In particular, intercellular communication inference has emerged as a powerful approach for identifying ligand–receptor pairs interactions associated with dysregulated signaling pathways in disease. Despite offering a broader analytical repertoire than bulk RNA sequencing, scRNA-seq workflows often require complex implementation steps involving multiple programming languages and substantial computational environment setup. These technical demands pose significant challenges to many biologists and can hinder both accessibility and reproducibility. Establishing an intuitive, user-friendly analytical framework is therefore essential to lowering these barriers and improving the usability of scRNA-seq analyses. Here, we present scDock, a command-line–based integrative toolkit that unifies core scRNA-seq analysis, intercellular communication inference, and drug screening through molecular docking of key signaling molecules. scDock accommodates multiple scRNA-seq input formats and offers accessible options for normalization, dimensionality reduction, clustering, tissue-specific annotation, and data integration. Beyond these core functionalities, the toolkit supports both single-group and comparative analyses of cell–cell communication inference and identifies molecules involved in differential signaling as candidate targets for molecular docking. Targeting critical components of disease-related interactomes has proven to be an effective drug discovery strategy ( Lu et al., 2020 ), and scDock brings this capability into an end-to-end single-cell analysis workflow. Despite its broad functionality, scDock remains easy to perform analytic workflow and requires only a single configuration file, which provides detailed descriptions and default settings for users with limited computational experience while allowing customization for advanced analyses. Collectively, these features position scDock as a versatile and accessible platform that streamlines single-cell transcriptomic analysis and accelerates the identification of potential therapeutic targets. 2 Implementation scDock is implemented as an integrated toolkit that streamlines complex scRNA-seq analyses and downstream computational workflows for both human and mouse datasets. Its primary goal is to simplify the execution of scRNA-seq analysis and related bioinformatics tasks, thereby reducing the technical burden for users with limited programming experience. To achieve this, scDock is organized into three interconnected functional modules: core scRNA-seq analysis, intercellular communication inference, and molecular docking, all of which operate together to support a fully automated and customizable end-to-end workflow ( Fig. 1 ). These modules are coordinated through R, Python, and shell scripts, enabling the entire process to be executed with a single command and a user-defined configuration file. Download figure Open in new tab Fig. 1. Overview of the scDock analytical workflow. The pipeline consists of three major modules: the core scRNA-seq analysis module, the intercellular communication inference module, and the molecular docking module. The core scRNA-seq analysis module performs quality control, normalization, scaling, dimensionality reduction, clustering, integration, and cell type annotation. The intercellular communication inference module identifies key signaling pathways by comparing signaling probabilities across groups and determines potential therapeutic targets based on the ligand–receptor pairs involved. In the molecular docking module, protein and compound structures are retrieved, preprocessed, and subjected to docking analysis. Compounds are then ranked by their predicted binding affinities to individual target proteins, enabling the identification of candidate drugs that may modulate disease-associated ligand–receptor interactions. The configuration file specifies all key analytical parameters, including input and output paths, selected analysis methods, algorithms, and the definition of cell types or groups of interest. It provides both default and fully customizable settings, accommodating the needs of novice users while offering flexibility for advanced users. scDock can be downloaded, installed, and executed locally by following the instructions provided on GitHub. Once a scRNA-seq dataset is supplied, the pipeline automatically performs marker gene identification, cell annotation, intercellular communication inference, and molecular docking, producing outputs such as cell-annotated dimensionality reduction plot, summaries of signaling pathways, protein and compound structures, docking results, and other associated files. All intermediate data generated throughout the workflow are also saved automatically, allowing users to reuse, inspect, or extend these results for additional downstream analyses. 2.1 Core scRNA-seq analysis In the core scRNA-seq analysis module, data are processed using the Seurat v5 framework (Hao et al., 2024), which performs quality control, normalization, scaling, dimensionality reduction, clustering, and integration steps when required. To ensure broad compatibility, scDock supports multiple commonly used scRNA-seq matrix formats, including 10x Genomics Cell Ranger outputs (barcodes.tsv.gz, features.tsv.gz, matrix.mtx.gz), hierarchical data format files (.h5), and plain text files (.txt). Both gene symbols and Ensembl identifiers are accepted as input formats. Since non–gene symbol identifiers can reduce annotation accuracy and slow downstream analyses, scDock automatically converts Ensembl identifiers to their corresponding gene symbols during preprocessing. For datasets involving multiple experimental or biological conditions, users may provide a metadata file specifying sample group information. These grouping labels are automatically incorporated into a standardized field named sample_group , which can be used directly in downstream comparative analyses and integration workflows. During clustering and dimensionality reduction, the number of principal components (PCs) selected has a critical impact on the amount of biologically informative variation preserved in the dataset ( Stuart et al., 2019 , Becht et al., 2019 ). To determine the optimal number of PCs, scDock uses the geometric elbow method as its default strategy. This approach identifies the point with the greatest perpendicular distance from the line connecting the first and last PCs on the variance-explained plot, as previously described ( Zhuang et al., 2022 ). Because batch effects can introduce unwanted technical variability that obscures true biological signals ( Hie et al., 2019 ), scDock incorporates several integration methods to mitigate such artifacts, including canonical correlation analysis (CCA) ( Butler et al., 2018 ), reciprocal PCA (RPCA) ( Hao et al., 2024 ), and the Harmony algorithm ( Korsunsky et al., 2019 ). Manual cell type annotation is often labor-intensive, requires substantial domain expertise, and must account for tissue-specific context. To address these challenges, scDock integrates scMayoMap ( Yang et al., 2023 ) for automated cell-type annotation across a broad range of tissues. Beyond the original reference database, scDock further expands the annotation resources to improve performance in disease-specific settings. These extensions currently include neuroblastoma, an uncommon and non–tissue-specific cancer that can originate in multiple organs, and breast cancer, enabling more accurate identification of malignant cells and subtype-specific populations. 2.2 Intercellular communication inference The intercellular communication inference module uses CellChat v2 ( Jin et al., 2025 ) to evaluate ligand–receptor expression patterns across cell types and infer their potential communication networks, including secreted signaling, extracellular matrix-receptor interactions, and cell–cell contact-mediated communication. Identifying ligand-receptor pairs involved in prominent signaling pathways reveals key intercellular interactions that may represent promising therapeutic targets. By default, scDock operates in a single-group mode and computes the signaling pathways with the highest interaction probabilities across all cell types, recording both incoming and outgoing signals as well as global interaction patterns. A central feature of scDock is its ability to investigate disease-associated signaling pathways as the initial step toward therapeutic target discovery. When a metadata file specifying experimental or biological groups is provided, scDock performs group-wise comparisons to quantify differences in intercellular communication patterns. Signaling pathways exhibiting the greatest shifts in interaction probabilities are identified, and their corresponding differentially active ligand–receptor pairs are designated as candidate therapeutic targets. These targets are then automatically forwarded to the molecular docking module for downstream evaluation. scDock also supports cell type-specific communication analyses. By adjusting the parameters Run_CellChat_source_celltype and Run_CellChat_target_celltype in the configuration file, users can restrict the analysis to selected source and target populations, enabling more focused and biologically informed investigations of intercellular signaling events. 2.3 Molecular docking In the molecular docking module, scDock uses AutoDock Vina (Trott and Olson, 2010) to estimate the binding affinities between small molecules and the target proteins identified through the intercellular communication analysis. Constructing compound and protein structure libraries is typically time-consuming and requires technical expertise; scDock streamlines this process by providing three options for compound library generation: (i) a built-in FDA-approved compound library, (ii) a customized library generated from Chemical Abstracts Service (CAS) registry numbers, and (iii) user-supplied compound structures. For the first option, scDock includes a curated list of FDA-approved small-molecule drugs (version 2 September 2025) within its GitHub repository, allowing users to rapidly assemble a ready-to-use library for systematic screening. For the second option, users may supply CAS identifiers, and scDock automatically retrieves the corresponding compound structures from PubChem ( Kim et al., 2025 ) and converted them into AutoDock Vina-compatible formats using OpenBabel ( O’Boyle et al., 2011 ) and RDKit ( Rational Discovery LLC, 2025 ). For the third option, users may directly provide pre-processed compound structures that meet AutoDock Vina input specifications. For protein structure determination, scDock provides curated reference lists ( ligand_reference . csv and receptor_reference . csv ) containing the best available protein models identified via UniProt-PDB-Mapper ( Riziotis, 2025 ). These structures are retrieved from the SWISS-MODEL Template Library ( Bienert et al., 2017 ). When no experimentally determined structures are available, scDock automatically obtains predicted models from the AlphaFold Protein Structure Database ( Jumper et al., 2021 ). Users may update the curated lists when improved structures becomes available or supply their own protein models directly. scDock performs compound screening using a global docking strategy, automatically defining the docking grid box for each protein to ensure comprehensive exploration of potential binding sites. During the docking procedure, scDock records all protein and compound structures along with the resulting predicted binding poses and binding affinities. The toolkit also summarizes and ranks the affinities of all screened compounds for each target protein, enabling efficient identification of high-priority therapeutic candidates. 3 Application To demonstrate the utility of scDock, we analyzed a scRNA-seq dataset (GSE218563) from diabetic mouse kidneys ( Liu et al., 2023 ), which includes samples from 16 mice representing both control and diabetic nephropathy (DN) groups. A complete walkthrough of this analysis is provided in the GitHub repository. Using the group information specified in the metadata, we examined differences in intercellular communication between the control and DN groups. Using a single configuration file, scDock produced the following results. First, it identified major kidney cell populations, including distal convoluted tubule cells, proximal tubule cells, and mesangial cells (Supplementary Figure 1). In the intercellular communication analysis, scDock visualized global signaling networks and revealed pathways with increased interaction probabilities in the DN group relative to controls (Supplementary File 2). Among the differential signaling pathways, the interaction between peptidyl-prolyl cis-trans isomerase A (PPIA) and basigin (BSG) was highlighted as associated with DN, leading to the selection of these two proteins as targets for molecular docking. scDock then performed molecular docking on the selected targets using a common library assembled from user-provided CAS registry numbers. The pipeline generated binding poses and calculated binding affinities for each compound–protein pair. Notably, the predicted complex between glimepiride and PPIA was visualized using PyMOL ( Schrödinger LLC, 2021 ) to provide additional structural illustration (Supplementary Figure 3). 4 Conclusions We developed scDock as an integrative and user-friendly toolkit that streamlines the complex analytical steps and computational expertise typically required for scRNA-seq data analysis. By unifying single-cell transcriptomic processing, inter-cellular communication inference, and molecular docking–based compound screening, scDock lowers the technical barrier for researchers and enables efficient identification of disease-associated therapeutic targets. Comprehensive documentation, installation instructions, and tutorials are available on GitHub. We anticipate that scDock will expand the accessibility of scRNA-seq–based analyses and accelerate the discovery of potential therapeutics across a wide range of biological and disease contexts. Data availability The scDock source code is publicly available on GitHub at https://github.com/Andrewneteye4343/scDock . The single-cell RNA-seq dataset used in the demonstration analysis was obtained from NCBI GEO database under accession number GSE218563 ( https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE218563 ). Author contributions CHH: data curation, investigation, formal analysis, methodology, validation, visualization, writing original draft. YJO: methodology. HCH: conceptualization, methodology, writing original draft, supervision, project administration, funding acquisition. HFJ: conceptualization, methodology, writing original draft, supervision, project administration, funding acquisition. Funding This work was supported by the National Science and Technology Council (NSTC 112-2221-E-A49-061-MY3, NSTC 114-2221-E-A49-144-MY3, NSTC 113-2320-B-002-025-MY3, NSTC 113-2221-E-002-149-MY3, and NSTC 114-2321-B-002-022), Research Proposal for NTU Core Consortiums (NTU-CC-114L892702), NTU Seed Projects for Interdisciplinary Research (NTU-SPIR-114L8417) and Center for Advanced Computing and Imaging in Biomedicine (NTU-114L900701) from The Featured Areas Research Center Program within the framework of the Higher Education Sprout Project by the Ministry of Education (MOE) in Taiwan. Conflict of Interest none declared. Acknowledgements We thank Dr. Kai-Pu Chen at Center for Computational and Systems Biology, National Taiwan University, Dr. Ching-Chia Yang, Hong-Shian Yang, Hsin-Yo Yuan, and Hong-Ming Tseng for their valuable and constructive feedbacks. Funder Information Declared National Science and Technology Council , NSTC 112-2221-E-A49-061-MY3 , NSTC 114-2221-E-A49-144-MY3 , NSTC 113-2320-B-002-025-MY3 , NSTC 113-2221-E-002-149-MY3 , NSTC 114-2321-B-002-022 Research Proposal for NTU Core Consortiums , NTU-CC-114L892702 NTU Seed Projects for Interdisciplinary Research , NTU-SPIR-114L8417 Center for Advanced Computing and Imaging in Biomedicine from The Featured Areas Research Center Program within the framework of the Higher Education Sprout Project by the Ministry of Education (MOE) in Taiwan. , NTU-114L900701 Footnotes https://github.com/Andrewneteye4343/scDock References ↵ Aibar S et al. SCENIC: single-cell regulatory network inference and clustering . Nat Methods . 2017 ; 14 ( 11 ): 1083 – 1086 . OpenUrl CrossRef PubMed ↵ Becht E et al. Dimensionality reduction for visualizing single-cell data using UMAP . Nat Biotechnol . 2019 ; 37 : 38 – 44 . OpenUrl CrossRef ↵ Bergen V et al. Generalizing RNA velocity to transient cell states through dynamical modeling . Nat Biotechnol . 2020 ; 38 ( 12 ): 1408 – 1414 . OpenUrl CrossRef PubMed ↵ Bienert S et al. The SWISS-MODEL Repository-new features and functionality . Nucleic Acids Res . 2017 ; 45 ( D1 ): D313 – D319 . OpenUrl CrossRef PubMed ↵ Butler A et al. Integrating single-cell transcriptomic data across different conditions, technologies, and species . Nat Biotechnol . 2018 ; 36 ( 5 ): 411 – 420 . OpenUrl CrossRef PubMed ↵ Cao J et al. Comprehensive single-cell transcriptional profiling of a multicellular organism . Science . 2017 ; 357 ( 6352 ): 661 – 667 . OpenUrl Abstract / FREE Full Text ↵ Hao Y et al. Dictionary learning for integrative, multimodal and scalable single-cell analysis . Nat Biotechnol . 2024 ; 42 ( 2 ): 293 – 304 . OpenUrl CrossRef PubMed ↵ Hie B , Bryson B , Berger B. Efficient integration of heterogeneous single-cell transcriptomes using Scanorama . Nat Biotechnol . 2019 ; 37 ( 6 ): 685 – 691 . OpenUrl CrossRef PubMed ↵ Jin S , Plikus MV , Nie Q. CellChat for systematic analysis of cell-cell communication from single-cell transcriptomics . Nat Protoc . 2025 ; 20 ( 1 ): 180 – 219 . OpenUrl CrossRef PubMed ↵ Jumper J et al. Highly accurate protein structure prediction with AlphaFold . Nature . 2021 ; 596 ( 7873 ): 583 – 589 . OpenUrl CrossRef PubMed ↵ Kim S et al. PubChem 2025 update . Nucleic Acids Res . 2025 ; 53 ( D1 ): D1516 – D1525 . OpenUrl CrossRef PubMed ↵ Korsunsky I et al. Fast, sensitive and accurate integration of single-cell data with Harmony . Nat Methods . 2019 ; 16 ( 12 ): 1289 – 1296 . OpenUrl CrossRef PubMed ↵ Liu S et al. Single-cell transcriptomics reveals a mechanosensitive injury signaling pathway in early diabetic nephropathy . Genome Med . 2023 ; 15 ( 1 ): 2 . OpenUrl PubMed ↵ Lu H et al. Recent advances in the development of protein-protein interactions modulators: mechanisms and clinical trials . Signal Transduct Target Ther . 2020 ; 5 ( 1 ): 213 . OpenUrl PubMed ↵ O’Boyle NM et al. Open Babel: An open chemical toolbox . J Cheminform . 2011 ; 3 : 33 . OpenUrl CrossRef PubMed ↵ Rational Discovery LLC et al. 2025 . RDKit (version 2025.3.6). Github . https://github.com/rdkit/rdkit . ↵ Riziotis I. 2025 . Uniprot-PDB-mapper (version 0.2.1). Github . https://github.com/iriziotis/Uniprot-PDB-mapper . ↵ Schrödinger LLC . 2021 . The PyMOL Molecular Graphics System (version 2.5.2) https://www.pymol.org/ . ↵ Stuart T et al. Comprehensive Integration of Single-Cell Data . Cell . 2019 ; 177 ( 7 ): 1888 - 1902 .e21. OpenUrl CrossRef PubMed Trott O , Olson AJ. AutoDock Vina: improving the speed and accuracy of docking with a new scoring function, efficient optimization, and multithreading . J Comput Chem . 2010 ; 31 ( 2 ): 455 – 461 . OpenUrl CrossRef PubMed Web of Science ↵ Yang L et al. Single-cell Mayo Map (scMayoMap): an easy-to-use tool for cell type annotation in single-cell RNA-sequencing data analysis . BMC Biol . 2023 ; 21 ( 1 ): 223 . OpenUrl PubMed ↵ Zhuang H , Wang H , Ji Z. findPC: An R package to automatically select the number of principal components in single-cell analysis . Bioinformatics . 2022 ; 38 ( 10 ): 2949 – 2951 . OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted November 21, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following scDock: Streamlining drug discovery targeting cell-cell communication via scRNA-seq analysis and molecular docking Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share scDock: Streamlining drug discovery targeting cell-cell communication via scRNA-seq analysis and molecular docking Chen-Hao Huang , Yen-Jen Oyang , Hsuan-Cheng Huang , Hsueh-Fen Juan bioRxiv 2025.11.20.689638; doi: https://doi.org/10.1101/2025.11.20.689638 Share This Article: Copy Citation Tools scDock: Streamlining drug discovery targeting cell-cell communication via scRNA-seq analysis and molecular docking Chen-Hao Huang , Yen-Jen Oyang , Hsuan-Cheng Huang , Hsueh-Fen Juan bioRxiv 2025.11.20.689638; doi: https://doi.org/10.1101/2025.11.20.689638 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Bioinformatics Subject Areas All Articles Animal Behavior and Cognition (7629) Biochemistry (17660) Bioengineering (13881) Bioinformatics (41913) Biophysics (21436) Cancer Biology (18578) Cell Biology (25482) Clinical Trials (138) Developmental Biology (13372) Ecology (19889) Epidemiology (2067) Evolutionary Biology (24302) Genetics (15599) Genomics (22483) Immunology (17728) Microbiology (40365) Molecular Biology (17163) Neuroscience (88540) Paleontology (666) Pathology (2830) Pharmacology and Toxicology (4821) Physiology (7637) Plant Biology (15130) Scientific Communication and Education (2045) Synthetic Biology (4290) Systems Biology (9818) Zoology (2269)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall: last seen: 2026-06-20T06:35:16.286784+00:00