Ligand-binding pockets in RNA, and where to find them

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 62,107 characters · extracted from preprint-html · click to expand
Ligand-binding pockets in RNA, and where to find them | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Ligand-binding pockets in RNA, and where to find them Seth D. Veenbaas , Jordan T. Koehn , Patrick S. Irving , Nicole N. Lama , Kevin M. Weeks doi: https://doi.org/10.1101/2025.03.13.643147 Seth D. Veenbaas 1 Department of Chemistry, University of North Carolina , Chapel Hill NC 27599-3290 Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jordan T. Koehn 1 Department of Chemistry, University of North Carolina , Chapel Hill NC 27599-3290 Find this author on Google Scholar Find this author on PubMed Search for this author on this site Patrick S. Irving 1 Department of Chemistry, University of North Carolina , Chapel Hill NC 27599-3290 Find this author on Google Scholar Find this author on PubMed Search for this author on this site Nicole N. Lama 1 Department of Chemistry, University of North Carolina , Chapel Hill NC 27599-3290 Find this author on Google Scholar Find this author on PubMed Search for this author on this site Kevin M. Weeks 1 Department of Chemistry, University of North Carolina , Chapel Hill NC 27599-3290 Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: weeks{at}unc.edu Abstract Full Text Info/History Metrics Supplementary material Preview PDF ABSTRACT RNAs are critical regulators of gene expression, and their functions are often mediated by complex secondary and tertiary structures. Structured regions in RNA can selectively interact with small molecules – via well-defined ligand binding pockets – to modulate the regulatory repertoire of an RNA. The broad potential to modulate biological function intentionally via RNA-ligand interactions remains unrealized, however, due to challenges in identifying compact RNA motifs with the ability to bind ligands with good physicochemical properties (often termed drug-like). Here, we devise fpocketR , a computational strategy that accurately detects pockets capable of binding drug-like ligands in RNA structures. Remarkably few, roughly 50, of such pockets have ever been visualized. We experimentally confirmed the ligandability of novel pockets detected with fpocketR using a fragment-based approach introduced here, Frag-MaP, that detects ligand-binding sites in cells. Analysis of pockets detected by fpocketR and validated by Frag-MaP reveals dozens of newly identified sites able to bind drug-like ligands, supports a model for RNA secondary structural motifs able to bind quality ligands, and creates a broad framework for understanding the RNA ligand-ome. INTRODUCTION A subset of RNAs fold into complex secondary and tertiary structures capable of forming ligand-binding pockets that can engage small molecules with high affinity and specificity. RNA molecules lie upstream of most biological functions, both encoding proteins and broadly regulating gene expression. Small molecules that bind to and modulate the function of RNA thus have the potential to regulate diverse processes, including the levels of otherwise “undruggable” protein targets lacking well-defined ligand binding pockets ( 1 – 3 ). Further, non-coding RNAs present a vast scope of unexploited targets to manipulate biological processes ( 4 ). However, the promise of selectively targeting RNA with small molecules remains incompletely realized. Our current molecular understanding of RNA-ligand interactions is limited to a few classes of highly structured RNAs, including riboswitches ( 5 ), ribozymes ( 6 ), and ribosomal RNAs (rRNAs) ( 7 ). The lack of an understanding of the types of RNA structures that form high-affinity and selective interactions with small-molecule ligands remains a major challenge for ligand discovery efforts targeting RNA. Pockets in RNA have previously been computationally detected using approaches originally developed for finding pockets in proteins, including V3 ( 8 , 9 ) and mkgrid ( 10 , 11 ), which are rolling probe-based approaches, and PocketFinder ( 12 , 13 ), which is energy based. In addition, the ROBIN database uses machine learning to characterize RNA-binding ligands ( 14 ) and SHAMAN leverages RNA-focused molecular dynamics and fragment docking to identify small-molecule binding sites ( 15 ). These studies suggest that ligand-binding pockets in RNA and protein molecules have similar bulk properties of volume, buriedness, and solvent accessibility ( 9 , 11 , 13 , 14 ). In contrast, RNA pockets have been proposed to be less hydrophobic and to bind more rod-like ligands ( 9 , 11 , 13 , 16 ), features which are generally viewed unfavorably for medicinal chemistry ( 17 ). Prior work tended to include (nearly) all known ligand-bound RNA structures – containing a preponderance of simple organic molecules and less-complex stem-loop RNA structures – in contrast to focusing on RNA structures that bind to ligands with favorable (often called drug-like) physicochemical properties. There is also intense debate regarding what kinds of specific RNA structures are capable of harboring pockets able to bind ligands with favorable physicochemical properties. The current dialogue centers on the relative importance of targeting simple stem-loop or bulge containing motifs, which may have stronger current biological validation, versus targeting complex RNA motifs which can potentially form more selective interactions with small molecules, but are harder to identify ( 3 , 18 – 20 ). Most recent work has focused on the former class of simple RNA targets. We posited, first, that differences in physicochemical properties between proteins and RNAs require that pocket-finding algorithms be optimized specifically for RNA structures. Second, pockets that bind ligands with favorable physicochemical properties (and are plausibly drug-like) should be prioritized to best understand RNA-ligand interactions in the context of structure-based ligand discovery ( 3 , 21 ). Here we introduce fpocketR and Frag-MaP, two frameworks for identifying ligandable pockets in RNA. fpocketR is a software package optimized to identify, visualize, and characterize pockets in RNA, built around the open-source pocket detection software fpocket ( 22 ). We optimized fpocketR , focusing on the limited examples of RNAs with known complex structures that bind small-molecule ligands with favorable physicochemical properties. fpocketR can be used as a discovery tool to identify novel pockets that specifically bind drug-like ligands in both apo (ligand free) and (low resolution) dynamic RNA tertiary structures. fpocketR provides users the flexibility to analyze single RNA structures or RNA ensembles, including experimentally solved structures, molecular dynamics simulations, or from computational modeling. We experimentally validated the ligandability of pockets detected by fpocketR using Frag-MaP. Frag-MaP uses photocrosslinkable small-molecule probes and mutational profiling (MaP) technology ( 23 , 24 ) to identify the nucleotide position of RNA-ligand interactions in a direct experimental step, in cells. Finally, we analyzed pocket-forming RNA secondary structures identified using fpocketR and propose a framework for understanding RNA secondary structures that specifically interact with favorable (drug-like) small-molecule ligands. RESULTS Geometry-based analysis reveals differences in protein versus RNA pockets We used the open-source, geometry-based pocket finding framework, fpocket , to detect ligandable pockets in RNA. fpocket places alpha spheres throughout the structure of a biomolecule, where every alpha sphere is in contact with the center point of exactly four atoms in the biomolecule ( Fig. 1A ). The radius of each alpha sphere reflects the local curvature of the biomolecule ( 22 ), allowing solvent accessible cavities to be identified as groups of appropriately sized alpha spheres. Ligand-binding pockets are detected by clustering groups of alpha spheres that are close in three-dimensional space. Finally, pockets are characterized and scored based on their physical and electrostatic properties. The default fpocket algorithm is widely used and successful for detecting ligandable pockets in proteins ( 22 , 25 ). Download figure Open in new tab Figure 1. Geometry-based pocket finding approach and optimization for detecting sites in RNAs that bind ligands with favorable physicochemical properties. ( A ) Illustration of the fpocket algorithm and use of alpha spheres to detect pockets (PDB: 1F27) ( 47 ). ( B ) fpocket performance before and after optimization using a curated library of RNAs in complex with high QED ligands. Distinct pockets are indicated by differently colored alpha spheres. (Examples shown, PDB: 1Q8N, 2GDI, 5KX9) ( 48 – 50 ). ( C ) Curation and abundances of drug-like RNA-ligand complexes in the Protein Data Bank. RNA-ligand complexes were filtered from the HARIBOSS database ( 11 ). QED quantifies eight fundamental properties of a small molecule ligand into a single metric of drug-likeness ( 21 ). The fpocke t algorithm was optimized to detect pockets in proteins and tuned for the properties of amino acids ( Fig. 1A ). When fpocket is applied to protein structures, the highest scoring pocket corresponds to the known ligand-binding site 83% of the time ( 22 ). We applied fpocket to a curated library of RNA-ligand complexes, selected for inclusion of drug-like ligands. Using the default, protein-optimized, parameters fpocket detects many (incorrect) pockets for each RNA structure, and the highest scoring pocket overlaps with the known ligand-binding site only 63% of the time. More worryingly, many pockets detected using the default parameters are located on the RNA surface or in non-selective and solvent-exposed grooves, making these “pockets” poor targets for selective, small-molecule ligands ( Fig. 1B ). The discrepancy in fpocket performance between protein and RNA structures, first, reveals that a refinement of the algorithm is required to reliably detect RNA pockets capable of binding ligands with favorable physicochemical properties and, second, emphasizes there are fundamental differences between the ligand-facing surfaces of RNA and protein. A curated structure database of drug-like ligands bound to RNA To optimize fpocket for RNA, we curated a library of short (≤ 200 nt), high resolution (≤ 3.5 Å) RNA-ligand complexes from the 538 structures available in the non-redundant version of the HARIBOSS database ( Fig. 1C ) ( 11 ). We selected non-redundant RNAs containing ligands with favorable physicochemical properties, defined as a quantitative estimate of drug-likeness (QED) score ( 21 ) of ≥ 0.3. The QED score is an evolution of Lipinski’s rules that ranks small molecules based on eight fundamental physicochemical properties including molecular mass, hydrophobicity, number of rotatable bonds, and number of hydrogen bond donors and acceptors. With the QED metric, overall favorable molecular properties can compensate for one or more less desirable features to provide a holistic view of ligand quality in a single value that ranges from 0 (worse) to 1 (best). Requiring a QED score of ≥ 0.3 naturally excludes ligands that bind to or intercalate with RNA non- or semi-specifically. In the following text, for simplicity, we refer to ligands with QED (drug-likeness) scores ≥ 0.3 as drug-like RNA-binding ligands. However, we note that few of the small molecules discussed here, or known to bind RNA generally, are true drugs. Instead, we use the term drug-like to emphasize compounds with good physicochemical properties, consistent with general medicinal chemistry convention. By these definitions, we identified 48 high-resolution structures of RNA-ligand interactions in which the small molecule ligand is plausibly drug-like ( Fig. 1C ). The paucity of structures in this list emphasizes that we have much to learn about the ligandability of RNA. fpocketR : fpocket optimized for RNA Of the 48 RNA-ligand complexes, 38 had deep, well-defined pockets. We divided these 38 complexes into a training set ( n = 13), used for optimization of fpocketR ( Table S1 ), and a test set ( n = 25), for validation ( Fig. 1C , Table S2 ). Four core parameters ( m, M , D, i ) in the fpocket algorithm strongly affect RNA pocket detection by controlling alpha sphere size and clustering ( Fig. 1A ). We systematically evaluated 1820 combinations of these four parameter values in a three round multi-objective optimization to maximize sensitivity (sens) and positive predictive value (ppv) for detecting the known ligand-binding sites in our RNA-ligand training set ( Fig. S1, Table S3 ). Optimization of fpocket yielded parameters that accurately detect binding sites for drug-like ligands in RNA ( Fig. 1B and S1 ). We incorporated these optimized parameters into fpocketR , a custom python package that detects, characterizes, and visualizes pockets in RNA. The optimized parameters ( m = 3.0, M = 5.7, D = 1.65, and i = 42) used in fpocketR differ markedly from the default fpocket parameters ( m = 3.4, M = 6.2, D = 2.4, and i = 15). Critical changes were to require both smaller alpha spheres and larger numbers of alpha spheres to comprise a pocket. Using these changes, the probability that the top-scoring pocket overlapped with a known ligand binding site increased from 63% ( fpocket ) to 92% ( fpocketR ), corresponding to a five-fold reduction in false positives ( Table S4 ). Furthermore, fpocketR identified 100% of known ligand-binding sites in the training and test sets with a minimum positive predictive value of 78% ( Fig. 1B and 2 ). fpocketR also detected eight novel pockets that do not overlap known ligand-binding sites. These novel pockets appear to be high quality (buried, sufficient volume, supporting π-π stacking) ( Fig. 2 ) and may bind cryptic ligands (suggesting the true positive predictive value is notably higher than 78%). For example, we detected a novel pocket in the SAM-III riboswitch, buried in the RNA structure between a multi-helix junction and a bulge, that is less solvent exposed than the known ligand-binding site ( Fig. S2 ). fpocketR significantly outperformed fpocket in detecting binding sites for drug-like ligands in RNA structures ( Fig. 2B ; Table S4 ). Download figure Open in new tab Figure 2. Pockets detected in RNA structures with fpocketR . Selected examples from the training and test sets are shown. Known and novel pockets indicated in orange and green, respectively. Frag-MaP: Experimental validation of fpocketR predictions We applied fpocketR to the E. coli (PDB: 7K00) and B. subtilis (PDB: 7AS8) ribosomes ( 26 , 27 ) and identified 46 and 52 pockets in the 23S rRNAs, respectively ( Fig. S3 ). The ribosomal pocket-ome identified in this analysis includes most known ligand-binding sites for drug-like ligands, including binding sites for the antibiotics linezolid, sparsomycin, and spectinomycin. However, most predicted pockets are novel, suggesting the universe of RNA pockets capable of binding drug-like ligands might be quite large. We therefore experimentally evaluated if the novel pockets identified by fpocketR bind drug-like small molecules in cells. We developed Frag-MaP, which leverages tri-functionalized probes containing a small-molecule fragment (MW ≤ 300) linked to a photocrosslinkable diazirine and “clickable” alkyne handle ( Fig. 3A ) ( 28 , 29 ). Probes penetrate cells and crosslink to nucleotides proximal to their RNA-ligand binding sites, yielding RNA-ligand adducts. Frag-MaP exploits mutational profiling (MaP) ( 23 , 24 ) for the step that identifies ligand-binding sites. MaP is direct and experimentally concise, and yields low sequencing and library-preparation biases, high sensitivity, and single nucleotide resolution. RNA-ligand adducts induce mutations in the cDNA synthesized during reverse transcription, which are quantified through massively parallel sequencing. These improvements are analogous to the advantages of using MaP to read out chemical probing experiments ( 23 , 24 ). Frag-MaP sites are identified as nucleotides that interact with a fragment probe with significantly higher mutation rates compared to a control probe bearing a simple methyl group ( Fig. 3B ). Download figure Open in new tab Figure 3. Experimental detection of RNA-ligand binding sites by Frag-MaP. ( A ) Frag-MaP experimental scheme. ( B ) Structure of high-QED probes used in Frag-MaP experiments. Mutation rate of Frag-MaP sites (orange, labeled) detected in the 23S rRNA for ( C ) linezolid and ( D ) quinoxaline probes. ( E ) Distance to a pocket predicted by fpocketR from all nucleotides in the 23S rRNA compared to Frag-MaP sites for linezolid and quinoxaline. *, p < 0.03; Mann Whitney test. Note: Frag-MaP sites occur at residues with relative solvent accessible surface area (rSASA) spanning 0.05 to 0.89 (0.0 and 1.0 equal to buried versus fully accessible). rSASA is not significantly different for Frag-MaP sites (mean: 0.44, stdev: 0.25) compared to all RNA residues (mean: 0.43, stdev: 0.22); p = 0.52, Mann-Whitney test. ( F ) Visualization of all Frag-MaP sites detected using the linezolid-based probe. Frag-MaP sites are orange; linezolid is shown bound in the peptidyl transferase center (PDB: 7AS8) ( 27 ). ( G ) Visualization of the most reactive Frag-MaP sites detected in the 23S rRNA using the quinoxaline-based probe. Pockets detected using fpocketR are shown as spheres. We first validated the Frag-MaP strategy using a known RNA-ligand interaction based on a functionalized linezolid probe ( Fig. 3B ). Linezolid is a fragment- and drug-like (QED = 0.79) antibiotic with activity against Gram-positive bacteria and binds with low micromolar affinity to a pocket in the peptidyl transferase center (PTC) in the 23S rRNA ( 30 , 31 ). The pocket in which linezolid binds is robustly predicted by fpocketR ( Fig. 3F ). The acetamidomethyl group is oriented toward the exit tunnel and provides a vector to functionalize linezolid without interfering with binding. We treated B. subtilis cells with the linezolid probe and detected four Frag-MaP sites as positions highly reactive toward the linezolid probe (mutation rates: 3-18%) relative to the fragment-less control probe (median mutation rate: 0.5%) ( Fig. 3C , Fig. S4A ). The four Frag-MaP sites detected for the linezolid probe (nucleotides 2089, 2091, 2613, 2614) are hundreds of nucleotides apart in primary sequence but lie within 7 Å of the linezolid binding site in three-dimensional space ( Fig. 3F , Fig.S4A ). Frag-MaP thus detects RNA-ligand binding sites with nucleotide resolution in cells, with high sensitivity and specificity. We next screened for new ligand-binding sites in the B. subtilis 23S rRNA using 6- aminoquinoxaline (QED = 0.57) ( Fig. 3B ) and fragment 206 (QED = 0.81) probes ( Fig. S3C ). The quinoxaline probe yielded ten Frag-MaP sites with mutation rates up to 6% ( Fig. 3D ). Some of these sites were tens of nucleotides apart from each other in sequence, but clustered at compact locations in the 23S rRNA ( Fig. 3G ). Strikingly, 9 out of 10 Frag-MaP sites occurred at pockets predicted by fpocketR with a median distance of 4.5 Å ( Fig. 3E , Fig. S4B ). Probe 206 yielded an additional 4 Frag-MaP sites, 3 of which are near pockets (median distance of 5 Å) ( Fig. S4C ). Both probes bound to pockets in functionally interesting areas within the large ribosomal subunit. The quinoxaline probe bound to a pocket formed by a pseudoknot within the exit tunnel (nucleotides: 63 and 88) and to three nucleotides in the L1 stalk (nucleotides: 2145, 2154, 2198). Both the quinoxaline (nucleotides: 2582, 2613) and 206 (nucleotides: 2613, 2614) probes also bound at the P-site within the PTC, adjacent to the linezolid binding site. Identification of these site, in functionally important regions, demonstrate the ligandability and relevance of pockets detected by fpocketR . Most (89%) ligand binding sites detected by Frag-MaP are close in three-dimensional space (median distance 4.8 Å) to pockets detected by fpocketR. Frag-MaP sites are significantly closer to pockets identified by fpocketR than expected by chance and occur at residues with both high and low solvent accessibility ( Fig. 3E ). The juxtaposition of pockets – predicted by fpocketR and validated experimentally by Frag-MaP – emphasizes that pockets detected by fpocketR are reflective of authentic, in-cell ligand-binding sites for drug-like small-molecule ligands. Pocket ligandability: validation of sites for drug-like small molecules In a second validation strategy, we evaluated 17 RNA-ligand complexes comprised of antibiotics bound to bacterial rRNAs to assess the capacity of pockets detected by fpocketR to bind drug-like ligands. The 17 small-molecule ligands bind the 30S and 50S rRNAs at ten distinct binding sites, span multiple chemical classes, and have QED scores ranging from 0.01 (not drug-like) to 0.89 (highly drug-like) ( Fig. 4A , Fig. S5 ). This is a rigorous test of fpocketR as rRNAs are significantly larger than and not evolved to bind small-molecule ligands compared to the RNA aptamers and riboswitches used to train fpocketR . Download figure Open in new tab Figure 4. Pockets detected by fpocketR in the bacterial rRNA, compared to small-molecule antibiotic binding sites. ( A ) Ligand binding sites, listed by (QED) drug-likeness score. Sites detected with fpocketR indicated with check marks. ( B ) Contrasting examples of a drug-like ligand (sparsomycin) that binds a well-defined pocket (orange) and a non-drug-like ligand (edeine) that binds a non-pocket-like structure. An illustration of ligands bound near the PTC is provided in Fig. S5 . The known ligand-binding site was detected as a pocket by fpocketR for 7 of the 17 RNA-ligand complexes, across 4 distinct binding sites. fpocketR differentiated ligand-binding sites based on the drug-likeness of the bound ligands. fpocketR detected six of the seven pockets for ligands with a QED score above the training threshold of 0.3 ( Fig. 4A ). In addition, fpocketR detected the pocket for the highly conjugated ligand thermorubin that forms extensive π-π interactions with rRNA at the junction of the 50S and 30S ribosomal subunits. This pocket appears able to bind drug-like ligands, even though the ligand in this case is not drug-like. There are clear structural differences between ligand-binding sites that interact with druglike and non-druglike ligands ( Fig. 4B ). Pockets that bind drug-like ligands are buried, generally encapsulate their ligands, and form both hydrogen bonding and π-π interactions. By contrast, RNA motifs that interact with less drug-like ligands, such as aminoglycosides and the extended edeine chain, are characterized by a high number of hydrogen bonding interactions and are located at solvent exposed RNA surfaces ( Fig. 4B ). All low-QED (and thus undrug-like) ligands in our analysis are natural products. Apparently, bacteria can evolve anti-ribosome antibiotics that do not follow human-compiled rules for drug-likeness and, further, can target ribosome regions that do not contain conventional pockets. In sum, based on both direct experimental interrogation with Frag-MaP ( Fig. 3 ) and by evaluating drug-like and non-drug-like molecules that bind the ribosome ( Fig. 4 ), we validate that fpocketR selectively identifies pockets in RNA capable of binding ligands with drug-like physicochemical properties. We now use fpocketR to understand features of ligand-binding pockets in RNA. Detection of pockets in unliganded (apo) structures We used fpocketR to examine binding sites in both apo (ligand-free) and dynamic structures. We analyzed paired ligand-free (apo) and ligand-bound (holo) RNA structures for ten RNA-ligand complexes spanning a wide-range of QED scores (0.23 to 0.89; Table S5 ). Most of these structures were determined by X-ray crystallography, so crystal packing partially stabilized the apo state. fpocketR detected the known ligand binding site in 9 of the 10 holo complexes, only failing to detect the ligand binding site for the least drug-like ligand, phosphoribosyl pyrophosphate (QED 0.23). fpocketR also detected the known ligand binding site in 9 of 10 apo (ligand-free) structures, including RNAs with global ligand-induced conformation changes (for example, the TPP riboswitch). The size, shape, and position of predicted pockets are often affected by ligand-induced conformational changes in the RNA structure, meaning that pockets in apo structures do not always perfectly align with known ligand bind-sites ( Fig. 5A ). However, fpocketR -detected pockets in the apo structures reliably determined the local capacity of an RNA to bind a small-molecule ligand. Download figure Open in new tab Figure 5. Detection of ligand-binding sites in apo (ligand-free) sites and in RNA ensembles. ( A ) Pockets detected by fpocketR in apo (pink) and ligand-bound (blue) RNA structures for the lysine riboswitch, SAM-I riboswitch, and adenine riboswitch (PDB: 3D0U & 3D0X, 3IQN & 3IQP, 5SWE & 5E54) ( 51 – 53 ). ( B ) Pockets detected in individual RNA states for ensembles of HIV-TAR, measured by NMR (PDB: 7JU1) ( 33 ), and the SAM-IV riboswitch, measured by cryo-EM (PDB: 6WLQ) ( 34 ). Known and novel pockets, detected by fpocketR , are orange and green, respectively. Structures are depicted as transparent backbones; pockets are shown as transparent surfaces. RNA molecules often populate structural ensembles and the underlying structural dynamics influence biological function and response to ligand binding ( 32 ). This intrinsic dynamism in RNA structure also means that RNA structures in ensembles, especially for smaller RNAs, are visualized at modest resolution. We visualized pockets in a carefully refined NMR-based model of the HIV-1 TAR RNA hairpin ( 33 ). Of the 20 structures modeled for the TAR RNA, seven (35%) contained pockets overlapping the binding site for the known ligand ( Fig. 5B ). Similarly, an ensemble of structures was reported for the apo state of the of the SAM-IV riboswitch (determined by cryo-EM; 3.7 Å resolution) ( 34 ). In this case, pockets formed in four states (20%) ( Fig. 5B ). Novel pockets were observed for a single state for both RNAs. Thus, in these two examples of unliganded RNA structures with multiple states, pockets formed in only a minor subset of conformations but were concentrated at known ligand-binding sites. Small molecule binding then selects for the subset of structures with a ligandable pocket. Importantly, fpocketR finds ligandable sites even in ensembles based on modest-resolution structure models. Tripling the known universe of RNA pockets able to bind drug-like ligands Non-redundant, high-resolution structures for RNAs are limited, and are especially sparse for RNAs bound to ligands with good (drug-like) physicochemical properties ( Fig. 1C ). Prior to this study, roughly 50 pockets capable of binding drug-like ligands had ever been visualized, these are those found in small RNAs ( Fig. 1C and Fig. 2 ) and in the ribosomal RNAs ( Fig. 4 ). Based on fpocketR , this work substantially expands this universe to 138, and could be made larger by extending the analysis developed here to additional RNAs. RNA secondary structures that harbor pockets We examined RNA structures from the training set, test set, bacterial rRNAs, and a group II intron and identified all nucleotides that form pockets detected by fpocketR , and thus likely to bind drug-like ligands. We then annotated the nucleotides that form pockets in secondary structure diagrams ( Fig. 6 ). In larger multi-domain RNAs, such as the ribosome or group II intron, pockets form both from nucleotides localized in secondary structure space (local interactions) and from nucleotides that become juxtaposed via through-space interactions involving multiple domains (long-range interactions) ( Fig. 7 , Fig. S6-S7 , Tables S6-S9 ). Download figure Open in new tab Figure 6. Scheme for mapping RNA pockets, visualized in three-dimensional structures, onto secondary structure diagrams. Nucleotides are colored to match the pocket they contact, in both tertiary and secondary structure images (PDB: 3E5C) ( 54 ). In this structure, both pockets are local. Download figure Open in new tab Figure 7. Representative illustration of pockets formed by local versus long-range interactions, detected in a group II intron RNA. Pockets formed by local domains are boxed. ( A ) Pockets identified by number and color, and superimposed on the RNA secondary structure. ( B ) Pockets visualized in the three-dimensional RNA structure (colored by domain). Complex contains a reverse transcriptase cofactor (pink) (PDB: 5G2X) ( 55 ). ( C ) Examples of pockets formed by local versus long-range RNA interactions. RNA backbone is colored by domain. Pockets formed by long-range interactions in large RNA structures would be difficult or impossible to identify from a secondary structure model alone. Thus, we focused our analysis on local pockets. Small RNAs (< 200 nucleotides) form local pockets exclusively. A majority (66%) of pockets in multi-domain RNAs also occur in local secondary structures ( Fig. 7C ), which emphasizes that readily characterized secondary structure motifs form pockets in both small and large RNAs. We assigned each pocket detected by fpocketR to a class defined by the most complex secondary structural motif that contributes to pocket formation. Secondary structure motifs that formed pockets varied in complexity and included ( i ) simple loops and bulges, ( ii ) consecutive loops or bulges separated by a contact distance of 5 nucleotides or less, ( iii ) multi-helix junctions, and ( iv ) pseudoknots. Simple bulges and loops are, as expected, extremely common and we observed 402 in our dataset; only 3% of these motifs formed a pocket. In addition, we observed that pockets in simple RNA motifs typically did not form independently but tended to form in large, multi-domain RNAs, where the global architecture could stabilize a local pocket in a simple structure ( Fig. 8A ). Pockets were slightly more common among consecutive loops (4% of which formed pockets; among 273 examples). Download figure Open in new tab Figure 8. Secondary structural motifs that form pockets able to bind ligands with (drug-like) high-quality physicochemical properties. ( A ) Likelihood of secondary motifs to form pockets, in ascending order of complexity and information content. *, simple pockets were observed primarily in large multi-domain RNAs. ( B ) Examples of novel pockets in RNA secondary structural motifs most likely to form pockets. Known pockets are orange; novel pockets are green and magenta. Pockets were much more common among complex structures, multi-helix junctions and pseudoknots, based on our all-pockets dataset (48% and 63% of which formed pockets, respectively) ( Fig. 8A ). Across our full dataset, the number of multi-helix junction and pseudoknot motifs is artificially increased, due to the inclusion of many riboswitch and aptamer motifs. Therefore, we additionally determined the local structure among only our novel pockets. Simple motifs and consecutive loops very rarely formed novel pockets (3% and 1%, respectively). Multi-helix junctions and pseudoknots formed novel pockets at high rates (39% and 53%, respectively) ( Fig. 8A ), comparable to those in the all-pockets dataset. This analysis emphasizes that any given simple motif is unlikely to contain a pocket able to bind small molecules with good physicochemical properties; but that many complex multi-helix junction and pseudoknot motifs will. DISCUSSION A very small number of compounds, with plausibly drug-like physicochemical properties, have ever been visualized bound to compact RNA motifs at high resolution. A few additional drug-like (and actual drug) compounds have been visualized bound to the ribosome. The sizes of our training and test sets were therefore necessarily small, but the selection of these sets is a strength, not a weakness, of our approach. The field is not quite ready for machine learning to characterize these sites. fpocketR was optimized stringently using RNAs in complex with drug-like ligands ( Fig. 1 ). We used the QED framework ( 21 ), which integrates eight physical features strongly associated with druglikeness into a single metric. We required ligands to have QED values greater than 0.3, which tends to eliminate non-selective RNA binders. Our analysis of antibiotic binding pockets in the ribosome found that fpocketR selectively detected pockets that bind drug-like ligands and, critically, distinguishes between pockets that bind drug-like versus un-drug-like ligands. We were then able to leverage fpocketR to substantially expand the number of identified pockets able to bind drug-like ligands. In principle, RNA-targeted ligand discovery could open broad opportunities for manipulating gene expression, especially for targeting difficult-to-ligand proteins and non-coding RNAs. A critical starting point is to understand the rules that underlie RNA targets containing pockets able to bind small molecule ligands with good physicochemical features. When applied to RNA, the protein-optimized fpocket algorithm (mis)identified numerous near- or non-pockets and, moreover, did not accurately rank accepted pockets. Ultimately, fpocket , with default parameters, did not perform well with RNA, emphasizing that fundamental differences exist between the ligand-facing surfaces of proteins and RNA. We identify three broad differences between pockets in RNA and protein. First, pockets detected in RNA (using fpocketR ) and protein (using either algorithm) have broadly similar physical properties with the critical difference that pockets in RNA are more polar and less hydrophobic ( Table S10 ). Second, electrostatic properties significantly influence the pocket scoring functions used to rank pockets by their quality, and the distinctive electrostatics of RNA cause true pockets to be mis-ranked using current algorithms. Third, the ubiquitous presence of solvent-exposed major and minor grooves on the surface of RNA creates pseudo-pockets. False pocket exclusion by fpocketR was achieved by reducing reliance on pocket scoring functions to rank pockets and by imposing stricter geometric requirements that penalize highly solvent-exposed pockets. We validated predictions made by fpocketR with Frag-MaP, which is unique relative to current approaches for detecting RNA-ligand interactions in complex mixtures ( 29 , 35 – 37 ). Frag-MaP leverages mutational profiling (MaP) to identify RNA-ligand binding sites with high sensitivity and independently from biases introduced by biotin pulldown and adapter-ligation steps in seq-based experiments ( 24 , 38 ). Here we used Frag-MaP in a simple way, to detect fragment binding sites in abundant rRNAs. Ligand-binding sites identified by Frag-MaP consistently surrounded pockets detected by fpocketR , demonstrating the general ligandability of novel pockets detected by fpocketR. A powerful future application will be to use Frag-MaP as an in-cell RNA tertiary structure discovery tool because ligand-binding pockets form preferentially and specifically in regions with complex RNA structures. Analyses enabled by fpocketR emphasize that many pockets are created by nucleotides that are localized in RNA secondary structure. Local RNA secondary structures harbor nearly all the pockets in small RNAs (< 200 nucleotides) and form most pockets in large multi-domain RNAs. Pockets in secondary structures are primarily formed by complex motifs, including multi-helix junctions and pseudoknots, compared to simpler RNA structures such as bulges and loops. Complex structural motifs both have a much higher rate of forming drug-like pockets and also have higher information content, which facilitates selective interactions with drug-like ligands across RNA transcriptomes ( 3 ) ( Fig. 8A ). For riboswitches, ligand binding sites were noted to form from residues far away in sequence but close in three-dimensional space, corresponding to regions of maximum contact order ( 39 ). Similarly, the multi-helix junctions and pseudoknots evaluated here have the highest rates of forming pockets and the largest contact orders. Despite these clear advantages of targeting complex structures, a significant component of current work directed at discovery of RNA-targeting small molecules focuses on RNA motifs with simple structures (reviewed in ( 3 , 18 – 20 )). Our study indicates that simple bulge and consecutive loop motifs contain pockets only infrequently ( Fig. 8A ). These observations emphasize that RNA secondary structure is a useful tool to estimate RNA targetability and that RNAs with complex structural motifs are likely the best targets for drug-like small molecules ( Fig. 8B ). De novo design of small-molecule ligands that target RNA and modulate function remains challenging. This work provides critical computational and experimental tools for identifying and understanding features of RNA structures that form targetable pockets, specifically able to bind drug-like small molecule ligands with high potential for therapeutic development. MATERIALS AND METHODS Curation of RNA-ligand complexes containing ligands with favorable (drug-like) physicochemical properties RNA structures used to optimize fpocketR were obtained from the HARIBOSS non-redundant RNA-ligand database ( 11 ). RNA-ligand complex structures were required to ( i ) bind to a drug-like small molecule ligand (QED score ≥ 0.3), ( ii ) be high-resolution (≤ 3.5 Å), ( iii ) be a unique RNA in our data set, and ( iv ) ≤ 200 nucleotides (this requirement removes ligands that bind the ribosome). The quantitative estimate of drug-likeness (QED) score ( 21 ) was calculated using the QED module in the rdkit library ( 40 ). We emphasize that the QED metric is an open source and highly useful measure of fundamental physicochemical properties: molecular mass, hydrophobicity, hydrogen bond donors and acceptors, polarizable surface area, number of rotatable bonds, number of aromatic rings, and structural alerts ( 21 ). As defined by these criteria, there were 48 known RNA-ligand complexes with plausible drug-like ligands, that bind compact RNA sites. These RNA-ligand complexes were manually evaluated in PYMOL ( 41 ) to assess the solvent accessibility and cavity depth of the ligand binding pocket. Ultimately, 38 unique RNA structures were chosen and randomly split into a training set (n=13) and test set (n=25). For analysis of paired ligand-bound and apo structures ( Fig. 5A and Table S5 ), we assessed all examples (10 total) of small RNA structures (< 500 nt) with published holo (bound to small-molecule ligands) and apo structures available in the PDB at the time of our study. Pocket evaluation metrics Only pockets with an fpocket score ≥ 0 were analyzed. Pockets identified by fpocket were required to meet three criteria to be classified as a known pocket that binds a small-molecule ligand. The geometric center criterion is met if the geometric center of a pocket is within 4.5 Å of any atom of the ligand. The ligand overlap criterion is met if at least 25% of the alpha spheres in a pocket overlap the ligand (within 3 Å). The pocket overlap criterion is met if at least 25% of the atoms in the ligand overlap with a pocket (within 3 Å). Pockets that do not meet all three criteria are classified as novel pockets. However, we note that several novel pockets are occupied by biomolecules and ions ( Table S6-S9 ). Software used to evaluate these criteria are provided (see data and software availability section). Multivariate optimization of fpocket We optimized fpocket 4.0.3 ( 22 ) for detecting pockets in RNA by systematically adjusting values of six core parameters ( M , m , D , i , A , p ). Parameters A and p filter pockets based on polarity and, in preliminary analyses, were not effective at improving pocket detection in highly polar RNA molecules. The remaining four parameters ( m , M , D, i ) control the minimum ( m ) and maximum ( M ) alpha sphere radii, clustering distance ( D ), and minimum cluster size ( i ) ( Fig. 1A ) and were systematically optimized in 3 rounds of multivariate optimization using our training set of RNA-ligand complexes ( n = 13). We evaluated fpocket performance to detect ligand binding sites in a large parameter space (1820 parameter combinations) by performing a coarse, medium, and fine round of optimization ( Table S3 ). In each round, we evaluated 5 values for each parameter with progressively smaller increments between the values. We started with the default fpocket parameters and their flanking values and used the best performing parameters from each round of optimization to generate values for the subsequent round. The best performing parameters were selected by calculating a pareto set that maximized sensitivity and positive predictive value (ppv) and by applying some intuition intended to avoid overtraining ( 42 ). We also propose alternative relaxed parameters for investigation of pockets and near-pockets that lie just outside of these criteria (see Supporting Information). fpocketR usage RNA pockets were detected using fpocketR . fpocketR is a wrapper for fpocke t 4.0.3 ( 22 ) that provides options for advanced analysis and visualization of pockets detected in RNA structures. RNA pockets were detected using the input --pdb option for a .pdb or .cif file, the --chain option (maximum of 2 RNA chains), and the newly defined fpocketR parameters (-- m 3.0, -- M 5.7, -- D 1.65, -- i 42). Multistate NMR ensembles were analyzed using the --state 0 and - -qualityfilter 0.4 options. Known binding ligands were specified using the --ligand and -- ligandchain options, allowing fpocketR to differentiate known pockets (visualized in output files as orange to yellow) from novel pockets (green to pink). Visualizations for pockets in secondary structure space were generated by inputting a secondary structure drawing using the --nsd and --connectpocket options. Pocket visualization Figures visualizing predicted pockets were generated using the fpocketR software package. fpocketR generates tertiary structure figures using the PyMOL API ( 41 ) and secondary structure figures using RNAvigate ( 43 ). fpocketR visualizes pockets as a group of alpha-atoms (computed by subtracting 1.65 Å from the fpocketR -generated alpha sphere radius) ( Fig. 1A ). Pockets are visualized in secondary structures by coloring the nucleotides that contact alpha spheres from a pocket. RNA secondary structure drawing templates (.nsd) were generated from PDB structures using RNApdbee ( 44 ) manually edited in StructureEditor ( 45 ), and input into fpocketR using the --nsd option. Classifying pocket structural motifs Pocket-forming secondary structures were classified by the types of RNA structure in contact with alpha spheres. The classes identified and used in this work were, in order of structural complexity: simple structures, consecutive loops, multi-helix junctions, pseudoknots, and long-range structures. Specific structural definitions were: Simple structure, pocket only contacts nucleotides in an apical loop, internal loop, or bulge. Consecutive loops, pocket contacts a pair of loops/bulges within a contact distance of 5 nucleotides from each other (contact distance is defined as the shortest path length through the secondary structure graph between two nucleotides). Multi-helix junction, pocket contacts single-stranded nucleotides in the junction or base-paired nucleotides within 3 nucleotides of the multi-helix junction. Pseudoknot, pocket contacts base-paired nucleotides involved in a non-nested interaction or single-stranded nucleotide located between non-nested helices. Long-range structure, pocket contacts motifs in a structure that have a contact distance of >15 nucleotides. If a structure fit the criteria for multiple motif classifications, the structure was assigned to the most complex structural motif. Structures (4 observed) containing g-quadruplexes were not analyzed. In-cell Frag-MaP Experiments were performed in Bacillus subtilis subsp. subtilis strain 168 (ATCC) in LB at 30 °C. Cell were probed with 200 µM fragment probe or control probe for 30 min in the dark, placed on ice, and then exposed to 3 J/cm2 of 365-nm-wavelength UV light for 9 minutes (Analytik Jena). RNA was extracted and subjected to two bead-based clean up steps (silica-based SPE, Monarch RNA Cleanup Kit; NEB; and click chemistry-based, Magnefy Azide, medium 1.0 µm beads; Bangs Laboratories). RNA was then subjected to mutational profiling reverse transcription (MaP-RT) with random nonamer primers to generate cDNAs ( 46 ). Extended and detailed methods are provided in the Supporting Information. Sequencing and Data Analysis cDNAs were sequenced (NEBNext Ultra II DNA Library Prep Kit for Illumina, NEB) using standard methods ( 46 ). Ligand-binding sites were identified using a new software package, FragMapper , implemented in RNAvigate (v1.0) ( 43 ). Frag-MaP sites were visualized in RNA tertiary structures using PyMOL ( 41 ). These steps are described in detail in the Supporting Methods. DATA AVAILABILITY All data and software generated or used in this work are freely available. The fpocketR datasets reported in this study and fpocketR software suite and user manual are available at https://github.com/Weeks-UNC/2025_Veenbaas and https://github.com/Weeks-UNC/fpocketR , respectively. FragMapper software is available as an analysis module in RNAvigate, https://github.com/Weeks-UNC/RNAvigate . Frag-MaP datasets have been deposited in the Gene Expression Omnibus (GEO) database, https://www.ncbi.nlm.nih.gov/geo (accession no. GSE276279). Competing Interest Statement K.M.W. is a founder at ForagR Medicines, Ribometrix, and A- Form Solutions. J.T.K. is a founder and employee of ForagR Medicines. ACKNOWLEDGEMENTS This work was supported by NIH grant R35 GM122532 (to K.M.W.); software development for tertiary structure discovery by Frag-MaP was supported by the NSF (MCB-2027701 to K.M.W.). J.T.K. is a UNC Lineberger Integrated Training in Cancer Model Systems Fellow (T32 CA009156) and an NIH Kirschstein Postdoctoral Fellow (F32 GM143863). We are indebted to Rachel M. Johnson (University of North Carolina) for performing high-resolution mass spectrometry experiments. We are grateful to members of the Weeks Laboratory, especially to Drs. Simon Felder and Alexandra Khitun, for their continued mentorship and thoughtful input to this work. REFERENCES 1. ↵ A. L. Hopkins , C. R. Groom , The druggable genome . Nat Rev Drug Discov 1 , 727 – 730 ( 2002 ). OpenUrl CrossRef PubMed Web of Science 2. S. J. Dixon , B. R. Stockwell , Identifying druggable disease-modifying gene products . Curr Opin Chem Biol 13 , 549 – 555 ( 2009 ). OpenUrl CrossRef PubMed Web of Science 3. ↵ K. D. Warner , C. E. Hajdin , K. M. Weeks , Principles for targeting RNA with drug-like small molecules . Nat Rev Drug Discov 17 , 547 – 558 ( 2018 ). OpenUrl CrossRef PubMed 4. ↵ S. Djebali , et al. , Landscape of transcription in human cells . Nature 489 , 101 – 108 ( 2012 ). OpenUrl CrossRef PubMed Web of Science 5. ↵ K. Kavita , R. R. Breaker , Discovering riboswitches: the past and the future . Trends Biochem Sci 48 , 119 – 141 ( 2023 ). OpenUrl CrossRef PubMed 6. ↵ M. Felletti , J. S. Hartig , Ligand-dependent ribozymes . WIREs RNA 8 ( 2017 ). 7. ↵ D. N. Wilson , Ribosome-targeting antibiotics and mechanisms of bacterial resistance . Nat Rev Microbiol 12 , 35 – 48 ( 2014 ). OpenUrl CrossRef PubMed 8. ↵ N. R. Voss , M. Gerstein , 3V: cavity, channel and cleft volume calculator and extractor . Nucleic Acids Res 38 , W555 – W562 ( 2010 ). OpenUrl CrossRef PubMed Web of Science 9. ↵ T. Zhou , H. Wang , C. Zeng , Y. Zhao , RPocket: an intuitive database of RNA pocket topology information with RNA-ligand data resources . BMC Bioinformatics 22 , 428 ( 2021 ). OpenUrl CrossRef PubMed 10. ↵ D. Monet , N. Desdouits , M. Nilges , A. Blondel , MkgridXf: Consistent Identification of Plausible Binding Sites despite the Elusive Nature of Cavities and Grooves in Protein Dynamics . J Chem Inf Model 59 , 3506 – 3518 ( 2019 ). OpenUrl CrossRef PubMed 11. ↵ F. P. Panei , R. Torchet , H. Mé Nager , P. Gkeka , M. Bonomi , HARIBOSS: a curated database of RNA-small molecules structures to aid rational drug design . Bioinformatics 38 , 4185 – 4193 ( 2022 ). OpenUrl CrossRef PubMed 12. ↵ J. An , M. Totrov , R. Abagyan , Pocketome via comprehensive identification and classification of ligand binding envelopes . Mol Cell Proteomics 4 , 752 – 761 ( 2005 ). OpenUrl Abstract / FREE Full Text 13. ↵ W. M. Hewitt , D. R. Calabrese , J. S. Schneekloth , Evidence for ligandable sites in structured RNA throughout the Protein Data Bank . Bioorg Med Chem 27 , 2253 – 2260 ( 2019 ). OpenUrl CrossRef 14. ↵ K. Yazdani , et al. , Machine Learning Informs RNA-Binding Chemical Space . Angew Chem Int Ed Engl . 62 , e202211358 ( 2023 ). OpenUrl CrossRef 15. ↵ F. P. Panei , P. Gkeka , M. Bonomi , Identifying small-molecules binding sites in RNA conformational ensembles with SHAMAN . Nat Commun 15 ( 2024 ). 16. ↵ A. Donlic , et al. , R-BIND 2.0: An Updated Database of Bioactive RNA-Targeting Small Molecules and Associated RNA Secondary Structures . ACS Chem Biol 17 , 1556 – 1566 ( 2022 ). OpenUrl CrossRef PubMed 17. ↵ R. P. Sheridan , V. N. Maiorov , M. K. Holloway , W. D. Cornell , Y. D. Gao , Drug-like density: A method of quantifying the “bindability” of a protein target based on a very large set of pockets and drug-like ligands from the protein data bank . J Chem Inf Model 50 , 2029 – 2040 ( 2010 ). OpenUrl CrossRef PubMed 18. ↵ A. Umuhire Juru , A. E. Hargrove , Frameworks for targeting RNA with small molecules . J Biol Chem 296 , 100191 ( 2021 ). OpenUrl CrossRef PubMed 19. J. L. Childs-Disney , et al. , Targeting RNA structures with small molecules . Nat Rev Drug Discov 21 , 736 – 762 ( 2022 ). OpenUrl CrossRef PubMed 20. ↵ S. Kovachka , et al. , Small molecule approaches to targeting RNA . Nat Rev Chem 8 , 120 – 135 ( 2024 ). OpenUrl CrossRef PubMed 21. ↵ G. R. Bickerton , G. V. Paolini , J. Besnard , S. Muresan , A. L. Hopkins , Quantifying the chemical beauty of drugs . Nat Chem 4 , 90 – 98 ( 2012 ). OpenUrl CrossRef PubMed 22. ↵ V. Le Guilloux , P. Schmidtke , P. Tuffery , Fpocket: An open source platform for ligand pocket detection . BMC Bioinformatics 10 , 168 ( 2009 ). OpenUrl CrossRef PubMed 23. ↵ P. J. Homan , et al. , Single-molecule correlated chemical probing of RNA . Proc Natl Acad Sci U S A 111 , 13858 – 13863 ( 2014 ). OpenUrl Abstract / FREE Full Text 24. ↵ K. M. Weeks , SHAPE Directed Discovery of New Functions in Large RNAs . Acc Chem Res 54 , 2502 – 2517 ( 2021 ). OpenUrl CrossRef PubMed 25. ↵ J. J. Clark , Z. J. Orban , H. A. Carlson , Predicting binding sites from unbound versus bound protein structures . Sci Rep 10 , 15856 ( 2020 ). OpenUrl CrossRef PubMed 26. ↵ Z. L. Watson , et al. , Structure of the bacterial ribosome at 2 Å resolution . Elife 9 , e60482 ( 2020 ). OpenUrl CrossRef PubMed 27. ↵ C. Crowe-McAuliffe , et al. , Structural Basis for Bacterial Ribosome-Associated Quality Control by RqcH and RqcP . Mol Cell 81 , 115 – 126 ( 2021 ). OpenUrl CrossRef PubMed 28. ↵ C. G. Parker , et al. , Ligand and Target Discovery by Fragment-Based Screening in Human Cells . Cell 168 , 527 – 541 ( 2017 ). OpenUrl CrossRef PubMed 29. ↵ S. Balaratnam , et al. , A chemical probe based on the PreQ1 metabolite enables transcriptome-wide mapping of binding sites . Nat Commun 12 , 5856 ( 2021 ). OpenUrl CrossRef PubMed 30. ↵ D. N. Wilson , et al. , The oxazolidinone antibiotics perturb the ribosomal peptidyl-transferase center and effect tRNA positioning . Proc Natl Acad Sci U S A 105 , 13339 – 13344 ( 2008 ). OpenUrl Abstract / FREE Full Text 31. ↵ J. A. Ippolito , et al. , Crystal structure of the oxazolidinone antibiotic linezolid bound to the 50S ribosomal subunit . J Med Chem 51 , 3353 – 3356 ( 2008 ). OpenUrl CrossRef PubMed Web of Science 32. ↵ L. R. Ganser , M. L. Kelly , D. Herschlag , H. M. Al-Hashimi , The roles of structural dynamics in the cellular functions of RNAs . Nat Rev Mol Cell Biol 20 , 474 – 489 ( 2019 ). OpenUrl CrossRef PubMed 33. ↵ H. Shi , et al. , Rapid and accurate determination of atomistic RNA dynamic ensemble models using NMR and structure prediction . Nat Commun 11 , 5531 ( 2020 ). OpenUrl CrossRef PubMed 34. ↵ K. Zhang , et al. , Cryo-EM structure of a 40 kDa SAM-IV riboswitch RNA at 3.7 Å resolution . Nat Commun 10 , 5511 ( 2019 ). OpenUrl CrossRef PubMed 35. ↵ H. Mukherjee , et al. , PEARL-seq: A Photoaffinity Platform for the Analysis of Small Molecule-RNA Interactions . ACS Chem Biol 15 , 2374 – 2381 ( 2020 ). OpenUrl CrossRef PubMed 36. Y. Tong , et al. , Transcriptome-Wide Mapping of Small-Molecule RNA-Binding Sites in Cells Informs an Isoform-Specific Degrader of QSOX1 mRNA . J Am Chem Soc 144 , 11620 – 11625 ( 2022 ). OpenUrl CrossRef PubMed 37. ↵ L. Fang , et al. , Pervasive transcriptome interactions of protein-targeted drugs . Nat Chem 15 , 1374 – 1383 ( 2023 ). OpenUrl CrossRef PubMed 38. ↵ N. A. Siegfried , S. Busan , G. M. Rice , J. A. E. Nelson , K. M. Weeks , RNA motif discovery by SHAPE and mutational profiling (SHAPE-MaP) . Nat Methods 11 , 959 – 964 ( 2014 ). OpenUrl CrossRef PubMed Web of Science 39. ↵ C. P. Jones , A. R. Ferré-D’Amaré , Long-Range Interactions in Riboswitch Control of Gene Expression . Annu Rev Biophys 46 , 455 – 481 ( 2017 ). OpenUrl CrossRef PubMed 40. ↵ Greg Landrum, Julie Penzotti, “RDKit” ( https://www.rdkit.org/ , 2010 ). 41. ↵ Schrödinger LLC, “The PyMOL Molecular Graphics System, Version 2.5.4” ( 2015 ). 42. ↵ T. Odland , K. Subbarao , “paretoset” (Github, 2024 ). 43. ↵ P. S. Irving , K. M. Weeks , RNAvigate: efficient exploration of RNA chemical probing datasets . Nucleic Acids Res 52 , 2231 – 2241 ( 2024 ). OpenUrl CrossRef PubMed 44. ↵ T. Zok , et al. , RNApdbee 2.0: multifunctional tool for RNA structure annotation . Nucleic Acids Res 46 , W30 – W35 ( 2018 ). OpenUrl CrossRef PubMed 45. ↵ J. S. Reuter , D. H. Mathews , RNAstructure: Software for RNA secondary structure prediction and analysis . BMC Bioinformatics 11 , 129 ( 2010 ). OpenUrl CrossRef PubMed 46. ↵ M. J. Smola , G. M. Rice , S. Busan , N. A. Siegfried , K. M. Weeks , Selective 2′-hydroxyl acylation analyzed by primer extension and mutational profiling (SHAPE-MaP) for direct, versatile, and accurate RNA structure analysis HHS Public Access . Nat Protoc 10 , 1643 – 1669 ( 2015 ). OpenUrl CrossRef PubMed 47. ↵ J. Nix , D. Sussman , C. Wilson , The 1.3 å crystal structure of a biotin-binding pseudoknot and the basis for RNA molecular recognition . J Mol Biol 296 , 1235 – 1244 ( 2000 ). OpenUrl CrossRef PubMed Web of Science 48. ↵ J. Flinders , et al. , Recognition of Planar and Nonplanar Ligands in the Malachite Green– RNA Aptamer Complex . ChemBioChem 5 , 62 – 72 ( 2004 ). OpenUrl CrossRef PubMed Web of Science 49. A. Serganov , A. Polonskaia , A. T. Phan , R. R. Breaker , D. J. Patel , Structural basis for gene regulation by a thiamine pyrophosphate-sensing riboswitch . Nature 441 , 1167 – 1171 ( 2006 ). OpenUrl CrossRef PubMed Web of Science 50. ↵ J. A. Howe , et al. , Atomic resolution mechanistic studies of ribocil: A highly selective unnatural ligand mimic of the E. coli FMN riboswitch . RNA Biol 13 , 946 – 954 ( 2016 ). OpenUrl CrossRef PubMed 51. ↵ A. D. Garst , A. Héroux , R. P. Rambo , R. T. Batey , Crystal Structure of the Lysine Riboswitch Regulatory mRNA Element . J Biol Chem 283 , 22347 – 22351 ( 2008 ). OpenUrl Abstract / FREE Full Text 52. J. L. Jenkins , J. Krucinska , R. M. McCarty , V. Bandarian , J. E. Wedekind , Comparison of a PreQ1 Riboswitch Aptamer in Metabolite-bound and Free States with Implications for Gene Regulation . J Biol Chem 286 , 24626 – 24637 ( 2011 ). OpenUrl Abstract / FREE Full Text 53. ↵ J. R. Stagno , et al. , Structures of riboswitch RNA reaction states by mix-and-inject XFEL serial crystallography . Nature 541 , 242 – 246 ( 2017 ). OpenUrl CrossRef PubMed 54. ↵ C. Lu , et al. , Crystal structures of the SAM-III/SMK riboswitch reveal the SAM-dependent translation inhibition mechanism . Nat Struct Mol Biol 15 , 1076 – 1083 ( 2008 ). OpenUrl CrossRef PubMed Web of Science 55. ↵ G. Qu , et al. , Structure of a group II intron in complex with its reverse transcriptase . Nat Struct Mol Biol 23 , 549 – 557 ( 2016 ). OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted March 15, 2025. Download PDF Supplementary Material Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Ligand-binding pockets in RNA, and where to find them Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Ligand-binding pockets in RNA, and where to find them Seth D. Veenbaas , Jordan T. Koehn , Patrick S. Irving , Nicole N. Lama , Kevin M. Weeks bioRxiv 2025.03.13.643147; doi: https://doi.org/10.1101/2025.03.13.643147 Share This Article: Copy Citation Tools Ligand-binding pockets in RNA, and where to find them Seth D. Veenbaas , Jordan T. Koehn , Patrick S. Irving , Nicole N. Lama , Kevin M. Weeks bioRxiv 2025.03.13.643147; doi: https://doi.org/10.1101/2025.03.13.643147 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Biophysics Subject Areas All Articles Animal Behavior and Cognition (7642) Biochemistry (17715) Bioengineering (13907) Bioinformatics (42003) Biophysics (21470) Cancer Biology (18624) Cell Biology (25533) Clinical Trials (138) Developmental Biology (13390) Ecology (19935) Epidemiology (2067) Evolutionary Biology (24356) Genetics (15617) Genomics (22529) Immunology (17753) Microbiology (40432) Molecular Biology (17200) Neuroscience (88681) Paleontology (667) Pathology (2840) Pharmacology and Toxicology (4828) Physiology (7653) Plant Biology (15161) Scientific Communication and Education (2046) Synthetic Biology (4304) Systems Biology (9826) Zoology (2271)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00