Full text
52,620 characters
· extracted from
preprint-html
· click to expand
Halogen bonds between ligands and proteins: can we use them in validation? | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Halogen bonds between ligands and proteins: can we use them in validation? View ORCID Profile Ida de Vries , Georgia Tsiompanaki , View ORCID Profile Anastassis Perrakis , View ORCID Profile Robbie P. Joosten doi: https://doi.org/10.1101/2025.06.24.661284 Ida de Vries 1 Oncode Institute and The Netherlands Cancer Institute, Department of Biochemistry , Plesmanlaan 121, Amsterdam, 1066 CX, The Netherlands Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Ida de Vries For correspondence: i.d.vries{at}nki.nl r.joosten{at}nki.nl Georgia Tsiompanaki 1 Oncode Institute and The Netherlands Cancer Institute, Department of Biochemistry , Plesmanlaan 121, Amsterdam, 1066 CX, The Netherlands Find this author on Google Scholar Find this author on PubMed Search for this author on this site Anastassis Perrakis 1 Oncode Institute and The Netherlands Cancer Institute, Department of Biochemistry , Plesmanlaan 121, Amsterdam, 1066 CX, The Netherlands Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Anastassis Perrakis Robbie P. Joosten 1 Oncode Institute and The Netherlands Cancer Institute, Department of Biochemistry , Plesmanlaan 121, Amsterdam, 1066 CX, The Netherlands Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Robbie P. Joosten For correspondence: i.d.vries{at}nki.nl r.joosten{at}nki.nl Abstract Full Text Info/History Metrics Supplementary material Preview PDF Abstract Halogen bonds are polar interactions between a halogen atom and its acceptor. They have characteristic geometry induced by the positively charged σ-hole on the halogen atom. Despite their importance in drug development, halogen bonds are often overlooked in the analysis and validation of ligand-protein complexes. We analysed halogen bonds between ligands and proteins in structure models from the PDB-REDO databank and defined key geometric parameters. These are the donor-acceptor distance, and two bond angles (θ1 and θ2) for interatomic halogen bonds, or in the case of halogen-π interactions, the distance between the halogen and acceptor π-system and a bond angle (θ1). Based on the distribution of these geometric parameters, we introduce a score, HalBS, that marks whether halogen bonds are adopting the preferred or allowed geometry or are an outlier and should be examined critically. A reference implementation of this score is now available in PDB-REDO. This is a first step towards improving halogen bond treatment in the analysis of macromolecular structure models. Introduction Halogen bonds are polar interactions between a halogen atom and an acceptor atom. A halogen bond occurs due to polarisation of the σ-bond between the halogen and its connecting atom. This causes a positive charge on the opposite site of the halogen atom, the so-called σ-hole ( Figure 1A ) ( Clark et al. 2007 ). As a result, the acceptor of the halogen bond is typically an atom with a free lone-pair, like an oxygen, nitrogen, sulfur, phosphorus or selenium atom. Additionally, halogen atoms can interact with π-systems ( Bent 1968 ). Due to differences in polarisation properties, halogen bonds with iodine are the strongest, followed by bromine, chlorine and finally halogen bonds with a fluorine atom are the weakest halogen bonds ( Politzer et al. 2010 ; Gilday et al. 2015 ; Cavallo et al. 2016 ). Download figure Open in new tab Figure 1. Schematic representation of the σ-hole on a halogen atom (left), and halogen bond characteristics of C-X··Y halogen bonds (middle) and C-X⋯Π halogen bonds (right). Halogen bonds can be characterized based on key geometric parameters. For the “regular” interatomic halogen bond, in this work referred to as C-X··Y halogen bonds, the first parameter is the distance (d) between the halogen and acceptor atom. As halogen bonds are attractive interactions, the distance can be shorter than the sum of the Van der Waals radii of the atoms ( Hassel 1970 ; Auffinger et al. 2004 ). For the orientation of the acceptor with respect to the halogen atom two angles are defined: θ1, the angle between the halogen containing compound and the acceptor, and θ2, the angle between the halogen atom and the acceptor containing compound ( Figure 1B ). These angles show distinct ranges, caused by the position of the σ-hole of the halogen atom. For C-X··Y halogen bonds ideally θ1 spans between ∼150° and ∼180° and θ2 between ∼90° and ∼120° ( Bent 1968 ; Desiraju et al. 2013 ; Scholfield et al. 2013 ; Cavallo et al. 2016 ; Turunen et al. 2021 ). In the case of halogen bonds between a halogen atom and a π-system, the halogen-π interaction, in this work referred to as C-X ⋯ Π halogen bonds ( Figure 1C ), only the distance between the halogen atom and the π-system, and the θ1 angle are defined ( Desiraju et al. 2013 ; Cavallo et al. 2016 ; Jubb et al. 2017 ; Kellett et al. 2020 ). Halogen atoms and their potential to form halogen bonds are used in drug design, as halogens affect the affinity, selectivity and efficacy of therapeutics ( Kortagere et al. 2008 ; Lu et al. 2009 ; Lu et al. 2010 ; Fraley and Sherman 2018 ). Halogen substituents increase the overall hydrophobicity of a ligand, thereby enhancing the hydrophobic effect of binding, driven by the minimization of unfavourable water–nonpolar contacts upon binding, and yielding a favourable entropic contribution to the binding free energy ( Langton et al. 2016 ). Thus, halogenation of ligands alters the conventional hydrophobic effect by combining the nonspecific entropic gain of water release with the specific directional interactions inherent to halogen bonds ( Wang et al. 2019 ; Verteramo et al. 2024 ). These properties make halogens attractive features in drug design but also in the earlier, more explorative drug lead discovery phase. Herein, halogens are often found in molecules used in virtual and fragment screening libraries, used to discover potential new binders to a target protein ( Heidrich et al. 2019 ; Dammann et al. 2022 ; Chopra et al. 2023 ). Particularly, libraries that include fluorine containing compounds are especially valuable in fragment screening using Nuclear Magnetic Resonance (NMR) ( Troelsen et al. 2020 ; Li and Kang 2024 ). Fluorine atoms are not abundant in endogenous molecules but are favourable for NMR due to their high sensitivity and wide chemical shift range ( Buchholz and Pomerantz 2021 ). Hence, fragment screening NMR is typically used to discover protein binding sites and protein dynamics ( Danielson and Falke 1996 ; Li and Kang 2024 ). They can also be used to identify compounds that bind to RNA ( Kreutz et al. 2006 ). Despite their overall benefits for drug design and discovery, halogen bonds are often overlooked in macromolecular structure model validation ( Zhang et al. 2017 ). One of the few places where halogen bonds are explicitly considered is at the PDBe-KB (Protein Data Bank in Europe Knowledge Base) (PDBe-KB consortium 2022 ; Choudhary et al. 2025 ) pages for ligands, where the determination of halogen bonds originates from Arpeggio ( Jubb et al. 2017 ). Here, we analyse halogen bonds found in PDB-REDO structure models and propose validation metrics for halogen bonds between a halogen containing ligands and amino acid residues. in the protein. Using such metrics, halogen bonds can be incorporated and integrated into pipelines that validate protein-ligand interactions. Results and Discussion Defining halogen bonds between ligands and proteins in PDB-REDO To define halogen bonds in macromolecular structure models, we selected every fluorine (F), chlorine (Cl), bromine (Br) and iodine (I) atom present in PDB-REDO structure models. These were stored together with their most likely acceptor atoms (i.e. O, N, S, P or Se). We used the structure models from the PDB-REDO databank to ensure all models are uniformly treated and no specific restraints for halogen bond interactions were used ( Joosten et al. 2009 ). To ensure high quality data, we selected halogen atoms with a B-factor equal to or below 100, a Real Space Correlation Coefficient (RSCC, ( Jones et al. 1991 )) for the compounds containing the halogen or acceptor atom equal to or above 0.9 which were in structure models with a resolution equal to or better than 2.5Å (complete distributions in supplemental Figure S1). Halogen bonds can be formed with different acceptor atoms and residues in proteins. Backbone oxygen atoms, but also oxygen atoms in the side chains of amino acids can serve as acceptor atoms. Furthermore, nitrogen atoms with a free lone pair and sulphur atoms in amino acid side chains can fulfil this role ( Wilcken et al. 2013 ). Regarding the nitrogen atom as acceptor, only histidine residues are, depending on the context-specific protonation state, potential acceptors within a protein. However, within our initial data we did not find high-confidence observations, hence nitrogen atoms were excluded for the remainder of this study. To be able to differentiate between acceptors for C-X··Y bonds in macromolecular structure models, we mined the acceptor with its neighbouring connecting atom. For example, if the acceptor is an oxygen atom of a hydroxyl group on a carbon atom, the carbon atom is stored with the oxygen atom and the acceptor is marked as ‘O-C’. The acceptors of the found halogen bonds mainly appear to be O-C acceptors, followed by S-C. There are a few observations for acceptor atoms attached to a non-carbon atom (supplemental Table S1), which for example occurs when the acceptor is a non-canonical amino acid. These were too few observations to define sensible validation targets for these acceptors. Therefore, only O-C and S-C acceptors were finally selected for further analysis of C-X··Y bonds. For the halogen bonds involving a π-system, the side chains of histidine, phenylalanine, tyrosine, and tryptophan are acceptor candidates ( Wilcken et al. 2013 ). We mined these to identify C-X ⋯ Π halogen-acceptor pairs in PDB-REDO structure models. Halogen bonding interactions with the π-system of phenylalanine are found most (3481), followed by tyrosine (2442), histidine (1549), and tryptophan (935) (supplemental Table S1). We then selected only the halogen bonds in which the halogen atom is in a ligand, i.e. any compound marked as ‘non-polymer’ in the CCD, (supplemental Table S2) and the acceptor is a canonical amino acid in a protein. The final dataset contains 8,423 C-X··Y and 8,096 C-X ⋯ Π ligand-protein halogen bonding interactions ( Table 1 ), which were used in downstream analyses. View this table: View inline View popup Download powerpoint Table 1: Number of observations of halogen-acceptor pairs of ligand-protein interactions for C-X··Y and C-X⋯Π bonds found in PDB-REDO structure models. For C-X··Y bonds the acceptor is listed with its neighbouring atom, e.g. O-C is an oxygen atom as acceptor, connected to a carbon atom. Accepting π-systems are listed by amino acid. The geometry of ligand-protein halogen bonds in PDB-REDO For the ligand-protein halogen bonds in the dataset, we calculated the characteristic halogen bond geometries: distance, Van der Waals overlap, and the θ1 and θ2 angles for C-X··Y halogen bonds; and distance and θ1 angle for C-X ⋯ Π halogen bonds. We then investigated the distribution of these metrics and visualized them as boxplots ( Krzywinski and Altman 2014 ), unless there were 25 or fewer observations, in which case individual observations are shown ( Figure 2 ). Download figure Open in new tab Figure 2. A) Geometry of ligand-protein C-X··Y halogen bonds found in PDB-REDO. For each halogen (from left to right: fluorine (light green), chlorine (dark green), bromine (brown), iodine (purple)) the overall distance, Van der Waals overlap, θ1 and θ2 angles are shown on the left panel. In the panels on the right-hand side these values are split per acceptor: Oxygen (red, O-C), and Sulfur (yellow, S-C). Note that a positive value for the Van der Waals overlap means that the distance between halogen and acceptor atom is shorter than sum of the Van der Waals radii. B) Geometry of ligand-protein C-X⋯Π halogen bonds found in PDB-REDO. For each halogen (from left to right: fluorine (light green), chlorine (dark green), bromine (brown), iodine (purple)) the overall distance and θ1 angle are shown on the left panel. In the panels on the right-hand side these values are split by acceptor: the π-system in the side chains of histidine (yellow), phenylalanine (red), tyrosine (blue) and tryptophan (pink). Grey areas indicate the expected ranges of the geometries. Boxes span from first to third quartile, the median is depicted as the middle line and whiskers extend to 1.5 times the interquartile range (IQR). Statistical values corresponding to the boxplots (number of observations, mean, median, Q1, Q3 and Median absolute deviation (MAD)) can be found in Supplemental Tables S3 and S4 for panels A and B, respectively. For clarity a strip plot is created when there are 25 or fewer observations. From the boxplots for C-X··Y halogen bonds ( Figure 2A ), we observe that the distribution of the distance of the halogen bond is rather narrow (around 3.5Å), independent of halogen type or acceptor atom. Note that the median distance becomes shorter and the distribution broader for halogen bonds involving iodine. A Van der Waals overlap between the halogen atom and its acceptor is barely present for fluorine and chlorine. Notably, for bromine and even more so for iodine, halogen-acceptor pairs do show an overlap with their Van der Waals radii. When investigating the θ1 angle for protein-ligand C-X··Y halogen bonds, we observe smaller median angles than the expected range of 150° - 180°. Particularly halogen-acceptor pairs involving fluorine (132°), chlorine (143°) have smaller median θ1 angles, while for bromine (154°) and iodine the median θ1 angle (169°) is within the expected range. Contrary to the θ1 angles, the median θ2 angles are within their expected range of 90° - 120°, independent of the halogen type. For C-X ⋯ Π halogen bonds ( Figure 2B ), we observe that the median distance of the halogen bond is rather stable (around 4.8Å) for fluorine, chlorine and bromine, while the halogen bonds involving iodine are longer (median 5.1 Å). The observed θ1 angles for the halogen-π bonds have a median around 110°-140°, whereas we would expect them to range between 150° and 180°. While the distances between halogen and acceptor π-system is not substantially different for different acceptor amino acids, the θ1 angles show different preferences. Particularly the histidine and tryptophan residues seem to have a smaller θ1 angle in halogen bonds with chlorine and bromine. Validation of halogen bonds For the C-X··Y halogen bonds, we observe increasing Van der Waals overlap for halogen-acceptor pairs with increasing halogen atom size (fluorine < chlorine < bromine < iodine). Following a similar trend, the θ1 and θ2 angles reach their expected values with increasing halogen atom size. This fits the increasing polarization of the σ-hole and the electron negativity of halogen atoms ( Politzer et al. 2010 ; Cavallo et al. 2016 ), resulting in strongest halogen bonds involving iodine and weakest for fluorine atoms. Hence, halogen interaction pairs involving fluorine or chlorine should be interpreted with care and might not be considered ‘true’ halogen bonds. On the other hand, halogen-acceptor pairs with bromine and iodine are more in line with theory and hence can be considered ‘true’ halogen bonds. Note that C-X··Y halogen bonds involving bromine show little Van der Waals overlap, but the θ1 and θ2 angles are within the expected ranges. Halogen bonds involving iodine are even more in line with “textbook” halogen bonds: they show Van der Waals overlap, their θ1 angle nicely ranges between 150° and 180°, and the θ2 angles also obeys their theoretic values by averaging around 120°. Note that the θ1 angle in C-X ⋯ Π halogen bonds is on average 127°, which is substantially smaller than the expected 150° till 180° range ( Figure2B ). This trend is independent of the type of halogen atom. As no restraints were applied on the θ1 and θ2 angles in the PDB-REDO model generation, these angles are unbiased. The Van der Waals overlap is weakly restrained compared to the distances, so the bias for the Van der Waals overlap is considered to be minimal. Furthermore, our data quality is sufficient for analysis of distributions (Supplemental Figures S2 and S3). Therefore, we proceed with defining target values for all halogen bond categories, except C-I ⋯ Π halogen bonds involving tryptophan, as there are fewer than five observations for these cases. We define a way to judge the quality of halogen-acceptor pairs, while considering that the distributions of the metrics regarding the geometry are mono-disperse, but not normally distributed (Supplemental Figures S4 and S5). Hence, it is not prudent to determine targets as means with standard deviations for a halogen bond. We evaluate the geometric quality of a potential halogen bond by calculating a score for each relevant geometric parameter, referred to as Score geom , using the following equation: Here, value is the measured value of a geometric parameter; Q1 and Q3 are the first and third quartiles, respectively; and IQR is the interquartile range (Q3 − Q1), derived from the boxplot statistics of the applicable reference dataset. The score expresses the distance of a value from the boundaries of the ‘box’ of the reference dataset in terms of the number of IQRs. Taken that a value within Q1–Q3 (i.e., the interquartile range) is considered preferred, a value within 1.5 × IQR of the quartiles (i.e., within the whiskers) is allowed, and a value outside the whiskers is treated as an outlier, this means that any outlier will have a Score geom > 1.5 We then apply Equation (1) independently to each geometric parameter relevant to the halogen bond geometry. For C–X··Y interactions, Score geom is computed for distance, θ1 and θ2; and for C– X⋯Π interactions, it is computed for distance and θ1 only, as θ2 is not defined in this context. We then define an overall Halogen Bond Score (HalBS) as the maximum of the individual geometric scores: This score reflects the least favourable geometric feature of the halogen bond and is used as a proxy for assessing bond quality. A HalBS > 1.5 indicates that at least one geometric parameter is an outlier, suggesting that the halogen bond geometry may be abnormal and should be examined more closely. The robustness and accuracy of HalBS improve with the quantity and diversity of data used to compute the reference boxplot statistics. For example, in C–X⋯Π interactions involving amino acids like tyrosine, histidine, or tryptophan, limited available data may affect the reliability of the scoring. HalBS implementation in PDB-REDO A reference implementation of HalBS reports scores for C-X··O, C-X··S, C-X ⋯ His, C-X ⋯ Phe, C-X ⋯ Tyr and C-X ⋯ Trp halogen bonds where X=F, Cl, Br, I, with the exception of C-I ⋯ Trp, for which boxplot statistics could not be calculated due to insufficient data (Supplemental Table S4). Halogen atoms in alternate conformations are excluded, as well as water molecules functioning as potential acceptor. Furthermore, the θ1 angle between the halogen atom and its potential acceptor must be larger than 90°. When multiple halogen bonds are possible for a single halogen atom (C-X··Y and C-X ⋯ Π combined), the bond with the lowest HalBS score is selected and reported. Note that while the boxplots were generated for halogen containing ligands, the implementation of HalBS is calculated for any type of halogen containing compound, including non-canonical amino acids and nucleotides. The implementation is added to PDB-REDO (version 8.16) which now reports the number of halogen bonds and the mean HalBS for each structure model in mmCIF ( Westbrook et al. 2022 ) format. Hereby we aim to increase awareness and create more data to improve the halogen bond definitions and validation pipelines in the future. PDB-REDO entries with detected halogen bonds can be retrieved through the PDB-REDO archive manager at https://pdb-redo.eu/archive/ . Example cases The binding of the anti-microbial agent triclosan (TCS) to its target protein enoyl-[acyl-carrier-protein] reductase (ENR), one of the proteins involved in fatty acid synthesis in bacteria, causes ENR to change to a closed conformational state, as seen in PDB entry 3GR6 ( Priyadarshi et al. 2010 ). Besides the described electrostatic interactions between the binding pocket and triclosan, the inhibitor forms a halogen bond with its chlorine close to the carbonyl oxygen atom of the Ala97 backbone ( Figure 3A ). Notably, this alanine is in the loop that is involved in the conformation change suggesting that the halogen bond contributes to the change in conformation of the loop in ENR. Download figure Open in new tab Figure 3. Examples of halogen bonds (marked as a black dotted lines). A) C-X··Y halogen bond between chlorine of triclosan (atom CL14 of TCL A371) and the carbonyl oxygen atom of alanine A97 (PDB-ID: 3GR6, HalBS: 0.36. B) C-X··Y halogen bond between iodine of erythrosine extra bluish (atom I of 9ZZ A303) and hydroxylic oxygen of threonine A77 (PDB-ID 5OOH, HalBS: 1.63. C) C-X⋯Π halogen bond between bromine atom BR4 of BYZ B201 with the π-system of phenylalanine B154 (PDB-ID: 8CZM, HalBS: 0.07) D) C-X⋯Π halogen bond between iodine (atom I1 of TYI C6) with the π-system of tyrosine A159 (PDB-ID 4PGC, HalBS: 0.90). An example where halogen bonds play a role is in drug development is erythrosin extra bluish, which was found to be a hit compound in a study targeting biliverdin reductases type B (BLVRB) ( Nesbitt et al. 2018 ). In PDB entry 5OOH we observe that the compound has multiple interactions with the protein, among which the iodine atom, that is forming a C-X··Y halogen bond ( Figure 3B ). Halogen atoms often appear in crystallographic fragment screening experiments, where multiple small organic compounds are screened towards a target protein. Bacterial oxidoreductase in E . coli DsbA (EcDsbA) is such a target. It is responsible for the formation of disulfide bonds into many bacterial factors causing disease, and hence is considered a target in the treatment of drug resistant bacterial infections ( Whitehouse et al. 2023 ). In PDB entry 8CZM, one of the bromine-containing fragments is BYZ (4-bromo-1H-pyrazole), which binds to EcDsbA and forms a C-X ⋯ Π halogen bond with the π-system of phenylalanine in the protein ( Figure 3C ). An example of a modified amino acid containing halogens is 3,5-diiodotyrosine (TYI), which was used to investigate peptide selectivity in the major histocompatibility complex (MHC) class I (PDB-ID 4PGC) ( Garstka et al. 2015 ). In this study, increasingly larger residues were used to probe the peptide binding site of MHC class I. Although the iodine atoms were used for their size, one iodine makes a clear C-X ⋯ Π halogen bond with a tyrosine in the binding site ( Figure 3D ). The examples described above demonstrate perfectly fine halogen bonds according to theory. The halogen bonds involving triclosan, the BYZ fragment and the modified amino acid TYI ( Figures 3A, C and D , respectively) all have a HalBS 1.5, suggesting it should be considered with caution. We suggest that the current HalBS cannot be used as a direct validation metric but can provide indication of genuine halogen bonds and “not so proper” halogen bonds. Future considerations To further optimize validation of C-X··Y halogen bonds it could be investigated whether different types of halogen bond geometries are possible ( Ibrahim et al. 2022 ). Separating C-X··O halogen bonds into carbonyl oxygen, carboxyl and hydroxyl oxygen atoms might improve the accuracy of halogen bond descriptions (Supplemental Figure S6) ( Costa 2017 ; Zhang et al. 2017 ). Another challenge is to identify C-X··N halogen bonds with histidine as acceptor. The histidine protonation state defines whether such interaction is possible, but depending of the local molecular context reliably establishing this can range from straightforward to computationally expensive ( Hooft et al. 1996 ; Evans and Murshudov 2013 ). It should also be considered to relate our findings to halogen bonds identified by Arpeggio ( Jubb et al. 2017 ), which uses slightly different definitions for halogen bond distances and angles. To further investigate C-X ⋯ Π halogen bonds, the distance from the halogen perpendicular to the π-system of the acceptor is worth to calculate and include as geometric parameter ( Riley and Tran 2017 ). Another option could be to use a θ2-equivalent angle between the halogen atom: the centroid of the π-system and one carbon atom in the π-system, which has an ideal value around 90°. This should ease the filtering of halogen-acceptor pairs into actual halogen bonds wherein the σ-hole of the halogen is positioned perpendicular to the π-system. More critical filtering or more accurate data can distinguish between a genuine halogen bond and “a halogen in proximity of a possible acceptor atom”, which will be particularly effective for fluorine and chlorine. To add more observations and hereby increase the dataset size, halogen bonds between other types of macromolecules can be considered, like modified amino acids or nucleotides. Also, halogen bonds can be formed with the π-system of peptide bonds ( Auffinger et al. 2004 ). Identifying such interactions in PDB-REDO structure models would add an extra halogen bond type to the dataset that we have not examined here. Additionally, interactions between halogen atoms and water molecules could be investigated further. While visually inspecting hundreds of example cases, we observed false positives where the halogen bond with a water molecule would be more likely than the acceptor we found while datamining. These should be considered in future pipelines. Note that with water molecules there comes an extra complication, as the location of the free lone pairs depends on the hydrogen bonding network and is not always clear. Besides these optimizations with respect to defining halogen-acceptor pairs, more (high quality) data could contribute to the differentiation between a genuine halogen bond and “a halogen in proximity of a possible acceptor”. A valuable source of potential ligand-protein halogen bonds can be crystallographic fragment screening data. The fragment libraries used in such screens typically hold many halogen containing compounds, albeit more fluorine and chlorine than bromine and iodine atoms. Overcoming data archiving issues ( Jaskolski et al. 2022 ; Weiss et al. 2022 ; Erlanson et al. 2025 ; Perrakis 2025 ) could allow valuable data from hundreds or even thousands of ligand-protein complexes obtained from fragment screening to enrich halogen bond observations and hereby ease the definition of validation targets. Conclusion We identified halogen bonds between ligands and proteins in PDB-REDO structure models. With HalBS, we introduce a metric that annotates halogen bonds adopting preferred or allowed geometry, or are an outlier and should be examined critically. This approach is integrated into the PDB-REDO pipeline and can be used in other ligand validation pipelines. By increasing awareness and accumulating (high quality) data of halogen bonds in ligand-protein complexes, it could become possible to determine validation targets with ideal values and corresponding standard deviations for each halogen-acceptor pair. Methods Data mining Compound IDs of halogen containing compounds were mined from the Chemical Component Dictionary (CCD, ( Westbrook et al. 2015 )) of the Protein Data Bank ( Burley et al. 2019 ) and stored with their type and the name(s) of the halogen atom(s) in the molecule. Compounds in which the halogen atom is not connected to a carbon atom, e.g. in halogen-metal complexes and halogen acids, and the single ion halogens (F-, Cl-, Br-, I-) were removed from this list to focus on organic halogen bonds. The identifiers of excluded halogen containing compounds are: F, CL, BR, IOD, 08T, 0JC, 0OD, 0TE, 202, 2T8, 4IR, 4KV, 5LN, 61C, 61D, 6BP, 6O0, 73M, 7GE, 8TH, 8TR, 8WV, 9QB, 9RU, 9TH, A9J, AF3, ALF, BE7, BEF, BF2, BF4, BFD, BPT, C2C, C7P, CFO, CPT, CUL, D0X, D7Z, DAA, DAE, DAQ, E3D, E5O, ELJ, F6Q, F7T, FPO, HG2, HGI, I2I, I3M, I83, J0K, J0N, JR3, KQB, KYS, KYT, LCO, LCP, LN8, MF4, MGF, MNQ, N2N, N2R, N2S, N2W, NG8, NMQ, NXC, O1N, ONP, ORS, OS1, OT1, P3C, PC4, PCL, PEJ, PNQ, PT7, QLT, R1N, RAX, RBN, RHE, RSW, RU0, RU7, RUD, RUH, SFL, SRX, SVP, SXC, TBR, TPT, U0J, VKZ, VL2, YPT, YXX, YXZ, ZN0, ZN5, ZN6, ZN7, ZN8, ZN9, ZPT. Defining halogen bonds in PDB-REDO structure models For each of the PDB-REDO ( Joosten et al. 2009 ) structure models with at least one halogen containing compound, the halogen atoms were mined and stored with their possible acceptor atoms. An acceptor atom is an oxygen (O), nitrogen (N), sulfur (S), phosphor (P) or selenium (Se) atom in an organic compound within 4Å of the halogen atom itself. For each halogen-acceptor pair, the distance between the two atoms and their Van der Waals overlap, as well as the θ1 and θ2 angles were calculated. The Van der Waals radii of the atoms were taken from https://en.m.wikipedia.org/wiki/Atomic_radii_of_the_elements_(data_page) ( Bondi 1964 ; Slater 1964 ; Clementi et al. 1967 ; Pyykkö et al. 2005 ; Mantina et al. 2009 ). Possible halogen bonds to water were excluded as θ2 angles could not be calculated. Similarly, as for C-X··Y halogen bonds, we mined halogen bonds between a halogen atom and a π-system found in either phenylalanine (PHE), tyrosine (TYR), histidine (HIS) or tryptophan (TRP) to find halogen-π bonds within protein-ligand complexes. Such an interaction was assigned when the distance between the halogen atom and the centroid of the π-system was within 6Å. The centroid of the π-system was also used to calculate the θ1 angle for the interaction. For the halogen-π interactions, θ2 and the Van der Waals overlap cannot be calculated. When a halogen atom had multiple possible acceptors, the acceptor with the θ1 angle closest to 180° was selected for further analyses to get a single acceptor for each halogen atom. Halogen-acceptor pairs with a θ1 angle <90° were removed from the data, as such angles would render the σ-hole unreachable ( Figure 1 ). Mining metadata For each structure model in which we found a halogen bond, the resolution of the X-ray data, the R-factor, the R-free, average B-factor and PDB-REDO version were stored. Finally, the real space correlation coefficient (RSCC, ( Jones et al. 1991 )), as calculated by density-fitness ( van Beusekom et al. 2019 ), was mined for both the halogen containing compound as well as the compound containing the acceptor. Software Mining of the halogen bonds was done using libcif++ (Hekkelman) and libpdb-redo (Hekkelman). The obtained datasets were loaded using pandas2.1.4 ( The pandas development team 2020 ), plots were made using Seaborn0.13.2 ( Waskom 2021 ), all in Python3.12.1. Supplemental material Supplemental material figures and tables referenced in this manuscript are available in PDF format. Data availability statement Reference code for the implementation of HalBS score calculations in PDB-REDO is available at https://github.com/PDB-REDO/HalBS . Acknowledgements and funding We thank the Research High Performance Computing facility of the Netherlands Cancer Institute for providing and maintaining computation resources. This project was funded by the Horizon2020 EC projects iNEXT-Discovery (871037) and FragmentScreen (101094131), and by an institutional grant of the Dutch Cancer Society and of the Dutch Ministry of Health, Welfare and Sport. We also thank Oncode Institute and CCP4 for their financial support and Pantelis G. Bagos for fruitful discussions on the data analysis. Funder Information Declared Horizon2020 EC , 871037 , 101094131 Dutch Cancer Society, https://ror.org/0368jnd28 Dutch Ministry of Health, Welfare and Sport References ↵ Auffinger P , Hays FA , Westhof E , Ho PS . 2004 . Halogen bonds in biological molecules . Proceedings of the National Academy of Sciences . 101 ( 48 ): 16789 – 16794 . doi: 10.1073/pnas.0407607101 . OpenUrl Abstract / FREE Full Text ↵ Bent HA . 1968 . Structural chemistry of donor-acceptor interactions . Chem Rev . 68 ( 5 ): 587 – 648 . doi: 10.1021/cr60255a003 . OpenUrl CrossRef ↵ van Beusekom B , Wezel N , Hekkelman ML , Perrakis A , Emsley P , Joosten RP . 2019 . Building and rebuilding Nglycans in protein structure models . Acta Cryst D . 75 ( 4 ): 416 – 425 . doi: 10.1107/S2059798319003875 . OpenUrl CrossRef PubMed ↵ Bondi A. 1964 . van der Waals Volumes and Radii . J Phys Chem . 68 ( 3 ): 441 – 451 . doi: 10.1021/j100785a001 . OpenUrl CrossRef ↵ Buchholz CR , Pomerantz WCK . 2021 . 19F NMR viewed through two different lenses: ligand-observed and protein-observed 19F NMR applications for fragment-based drug discovery . RSC Chem Biol . 2 ( 5 ): 1312 – 1330 . doi: 10.1039/D1CB00085C . OpenUrl CrossRef PubMed ↵ Burley SK , Berman HM , Bhikadiya C , Bi C , Chen L , Costanzo LD , Christie C , Duarte JM , Dutta S , Feng Z , et al. 2019 . Protein Data Bank: the single global archive for 3D macromolecular structure data . Nucleic Acids Res . 47 ( D1 ): D520 – D528 . doi: 10.1093/nar/gky949 . OpenUrl CrossRef PubMed ↵ Cavallo G , Metrangolo P , Milani R , Pilati T , Priimagi A , Resnati G , Terraneo G. 2016 . The Halogen Bond . Chem Rev . 116 ( 4 ): 2478 – 2601 . doi: 10.1021/acs.chemrev.5b00484 . OpenUrl CrossRef PubMed ↵ Chopra A , Bauman JD , Ruiz FX , Arnold E. 2023 . Halo Library, a Tool for Rapid Identification of Ligand Binding Sites on Proteins Using Crystallographic Fragment Screening . J Med Chem . 66 ( 9 ): 6013 – 6024 . doi: 10.1021/acs.jmedchem.2c01681 . OpenUrl CrossRef PubMed ↵ Choudhary P , Kunnakkattu IR , Nair S , Lawal DK , Pidruchna I , Afonso MQL , Fleming JR , Velankar S. 2025 . PDBe tools for an in-depth analysis of small molecules in the Protein Data Bank . Protein Science . 34 ( 4 ): e70084 . doi: 10.1002/pro.70084 . OpenUrl CrossRef PubMed ↵ Clark T , Hennemann M , Murray JS , Politzer P. 2007 . Halogen bonding: the σ-hole . J Mol Model . 13 ( 2 ): 291 – 296 . doi: 10.1007/s00894-006-0130-2 . OpenUrl CrossRef PubMed ↵ Clementi E , Raimondi DL , Reinhardt WP . 1967 . Atomic Screening Constants from SCF Functions. II. Atoms with 37 to 86 Electrons . The Journal of Chemical Physics . 47 ( 4 ): 1300 – 1307 . doi: 10.1063/1.1712084 . OpenUrl CrossRef ↵ Costa PJ . 2017 . The halogen bond: Nature and applications . Physical Sciences Reviews . 2 ( 11 ). doi: 10.1515/psr-2017-0136 . [accessed 2024 Oct 3 ]. https://www.degruyter.com/document/doi/10.1515/psr-2017-0136/html?lang=en . OpenUrl CrossRef ↵ Dammann M , Stahlecker J , Zimmermann MO , Klett T , Rotzinger K , Kramer M , Coles M , Stehle T , Boeckler FM . 2022 . Screening of a Halogen-Enriched Fragment Library Leads to Unconventional Binding Modes . J Med Chem . 65 ( 21 ): 14539 – 14552 . doi: 10.1021/acs.jmedchem.2c00951 . OpenUrl CrossRef PubMed ↵ Danielson MA , Falke JJ . 1996 . Use of 19F NMR to Probe Protein Structure and Conformational Changes . Annual Review of Biophysics . 25 (Volume 25, 1996): 163 – 195 . doi: 10.1146/annurev.bb.25.060196.001115 . OpenUrl CrossRef PubMed Web of Science ↵ Desiraju GR , Ho PS , Kloo L , Legon AC , Marquardt R , Metrangolo P , Politzer P , Resnati G , Rissanen K. 2013 . Definition of the halogen bond (IUPAC Recommendations 2013) . Pure and Applied Chemistry . 85 ( 8 ): 1711 – 1713 . doi: 10.1351/PAC-REC-12-05-10 . OpenUrl CrossRef ↵ Erlanson DA , Burley SK , Fearon D , Fraser JS , Kreitler D , Nonato MC , Sakai N , Wollenhaupt J , Weiss MS . 2025 . Where and how to house big data on small fragments . Nat Commun . 16 ( 1 ): 4179 . doi: 10.1038/s41467-025-59233-z . OpenUrl CrossRef PubMed ↵ Evans PR , Murshudov GN . 2013 . How good are my data and what is the resolution? Acta Cryst D . 69 ( 7 ): 1204 – 1214 . doi: 10.1107/S0907444913000061 . OpenUrl CrossRef PubMed Web of Science ↵ Fraley AE , Sherman DH . 2018 . Halogenase engineering and its utility in medicinal chemistry . Bioorganic & Medicinal Chemistry Letters . 28 ( 11 ): 1992 – 1999 . doi: 10.1016/j.bmcl.2018.04.066 . OpenUrl CrossRef PubMed ↵ Garstka MA , Fish A , Celie PHN , Joosten RP , Janssen GMC , Berlin I , Hoppes R , Stadnik M , Janssen L , Ovaa H , et al. 2015 . The first step of peptide selection in antigen presentation by MHC class I molecules . Proceedings of the National Academy of Sciences . 112 ( 5 ): 1505 – 1510 . doi: 10.1073/pnas.1416543112 . OpenUrl Abstract / FREE Full Text ↵ Gilday LC , Robinson SW , Barendt TA , Langton MJ , Mullaney BR , Beer PD . 2015 . Halogen Bonding in Supramolecular Chemistry . Chem Rev . 115 ( 15 ): 7118 – 7195 . doi: 10.1021/cr500674c . OpenUrl CrossRef PubMed ↵ Hassel O. 1970 . Structural Aspects of Interatomic Charge-Transfer Bonding . Science . 170 ( 3957 ): 497 – 502 . doi: 10.1126/science.170.3957.497 . OpenUrl FREE Full Text ↵ Heidrich J , Sperl LE , Boeckler FM . 2019 . Embracing the Diversity of Halogen Bonding Motifs in Fragment-Based Drug Discovery—Construction of a Diversity-Optimized Halogen-Enriched Fragment Library . Frontiers in Chemistry. 7 . [accessed 2022 Jan 20 ]. https://www.frontiersin.org/article/10.3389/fchem.2019.00009 . Hekkelman ML . libcifpp . [accessed 2024a Nov 13 ]. https://pdb-redo.github.io/libcifpp/ . Hekkelman ML . libpdb-redo . [accessed 2024b Nov 13 ]. https://github.com/PDB-REDO/libpdb-redo . ↵ Hooft RWW , Sander C , Vriend G. 1996 . Positioning hydrogen atoms by optimizing hydrogen-bond networks in protein structures . Proteins: Structure, Function, and Bioinformatics . 26 ( 4 ): 363 – 376 . doi: 10.1002/(SICI)1097-0134(199612)26:43.0.CO;2-D . OpenUrl CrossRef ↵ Ibrahim MAA , Saeed RRA , Shehata MNI , Ahmed MN , Shawky AM , Khowdiary MM , Elkaeed EB , Soliman MES , Moussa NAM . 2022 . Type I–IV Halogen⋯Halogen Interactions: A Comparative Theoretical Study in Halobenzene⋯Halobenzene Homodimers . Int J Mol Sci . 23 ( 6 ): 3114 . doi: 10.3390/ijms23063114 . OpenUrl CrossRef PubMed ↵ Jaskolski M , Wlodawer A , Dauter Z , Minor W , Rupp B. 2022 . Group depositions to the Protein Data Bank need adequate presentation and different archiving protocol . Protein Science : A Publication of the Protein Society . 31 ( 4 ): 784 . doi: 10.1002/pro.4271 . OpenUrl CrossRef PubMed ↵ Jones TA , Zou J-Y , Cowan SW , Kjeldgaard M. 1991 . Improved methods for building protein models in electron density maps and the location of errors in these models . Acta Cryst A . 47 ( 2 ): 110 – 119 . doi: 10.1107/S0108767390010224 . OpenUrl CrossRef PubMed Web of Science ↵ Joosten RP , Salzemann J , Bloch V , Stockinger H , Berglund A-C , Blanchet C , Bongcam-Rudloff E , Combet C , Da Costa AL , Deleage G , et al. 2009 . PDB_REDO: automated re-refinement of X-ray structure models in the PDB . J Appl Crystallogr . 42 ( 3 ): 376 – 384 . doi: 10.1107/S0021889809008784 . OpenUrl CrossRef PubMed ↵ Jubb HC , Higueruelo AP , Ochoa-Montaño B , Pitt WR , Ascher DB , Blundell TL . 2017 . Arpeggio: A Web Server for Calculating and Visualising Interatomic Interactions in Protein Structures . Journal of Molecular Biology . 429 ( 3 ): 365 – 371 . doi: 10.1016/j.jmb.2016.12.004 . OpenUrl CrossRef PubMed ↵ Kellett CW , Kennepohl P , Berlinguette CP . 2020 . π covalency in the halogen bond . Nat Commun . 11 ( 1 ): 3310 . doi: 10.1038/s41467-020-17122-7 . OpenUrl CrossRef PubMed ↵ Kortagere S , Ekins S , Welsh WJ . 2008 . Halogenated ligands and their interactions with amino acids: Implications for structure–activity and structure–toxicity relationships . Journal of Molecular Graphics and Modelling . 27 ( 2 ): 170 – 177 . doi: 10.1016/j.jmgm.2008.04.001 . OpenUrl CrossRef PubMed ↵ Kreutz C , Kählig H , Konrat R , Micura R. 2006 . A General Approach for the Identification of Site-Specific RNA Binders by 19F NMR Spectroscopy: Proof of Concept . Angewandte Chemie International Edition . 45 ( 21 ): 3450 – 3453 . doi: 10.1002/anie.200504174 . OpenUrl CrossRef PubMed ↵ Krzywinski M , Altman N. 2014 . Visualizing samples with box plots . Nature Methods . 11 ( 2 ): 119 – 120 . doi: 10.1038/nmeth.2813 . OpenUrl CrossRef PubMed ↵ Langton MJ , Serpell CJ , Beer PD . 2016 . Anion Recognition in Water: Recent Advances from a Supramolecular and Macromolecular Perspective . Angewandte Chemie International Edition . 55 ( 6 ): 1974 – 1987 . doi: 10.1002/anie.201506589 . OpenUrl CrossRef PubMed ↵ Li Q , Kang C. 2024 . Perspectives on Applications of 19F-NMR in Fragment-Based Drug Discovery . Molecules . 29 ( 23 ): 5748 . doi: 10.3390/molecules29235748 . OpenUrl CrossRef PubMed ↵ Lu Y , Shi T , Wang Y , Yang H , Yan X , Luo X , Jiang H , Zhu W. 2009 . Halogen Bonding—A Novel Interaction for Rational Drug Design? J Med Chem . 52 ( 9 ): 2854 – 2862 . doi: 10.1021/jm9000133 . OpenUrl CrossRef PubMed ↵ Lu Y , Wang Y , Zhu W. 2010 . Nonbonding interactions of organic halogens in biological systems: implications for drug discovery and biomolecular design . Phys Chem Chem Phys . 12 ( 18 ): 4543 . doi: 10.1039/b926326h . OpenUrl CrossRef PubMed ↵ Mantina M , Chamberlin AC , Valero R , Cramer CJ , Truhlar DG . 2009 . Consistent van der Waals Radii for the Whole Main Group . J Phys Chem A . 113 ( 19 ): 5806 – 5812 . doi: 10.1021/jp8111556 . OpenUrl CrossRef PubMed ↵ Nesbitt NM , Zheng X , Li Z , Manso JA , Yen W-Y , Malone LE , Ripoll-Rozada J , Pereira PJB , Mantle TJ , Wang J , et al. 2018 . In silico and crystallographic studies identify key structural features of biliverdin IXβ reductase inhibitors having nanomolar potency . Journal of Biological Chemistry . 293 ( 15 ): 5431 – 5446 . doi: 10.1074/jbc.RA118.001803 . OpenUrl Abstract / FREE Full Text ↵ PDBe-KB consortium . 2022 . PDBe-KB: collaboratively defining the biological context of structural data . Nucleic Acids Research . 50 ( D1 ): D534 – D542 . doi: 10.1093/nar/gkab988 . OpenUrl CrossRef PubMed ↵ Perrakis A. 2025 May 13. iNEXT-Discovery recommendation relevant for Fragment Screening Data Management . Zenodo . [accessed 2025 May 13 ]. https://zenodo.org/records/15394696 . ↵ Politzer P , Murray JS , Clark T. 2010 . Halogen bonding: an electrostatically-driven highly directional noncovalent interaction . Phys Chem Chem Phys . 12 ( 28 ): 7748 – 7757 . doi: 10.1039/C004189K . OpenUrl CrossRef PubMed ↵ Priyadarshi A , Kim EE , Hwang KY . 2010 . Structural insights into Staphylococcus aureus enoyl-ACP reductase (FabI), in complex with NADP and triclosan . Proteins: Structure, Function, and Bioinformatics . 78 ( 2 ): 480 – 486 . doi: 10.1002/prot.22581 . OpenUrl CrossRef PubMed ↵ Pyykkö P , Riedel S , Patzschke M. 2005 . Triple-Bond Covalent Radii . Chemistry – A European Journal . 11 ( 12 ): 3511 – 3520 . doi: 10.1002/chem.200401299 . OpenUrl CrossRef ↵ Riley KE , Tran K-A. 2017 . Strength and Character of R–X⋯π Interactions Involving Aromatic Amino Acid Sidechains in Protein-Ligand Complexes Derived from Crystal Structures in the Protein Data Bank . Crystals . 7 ( 9 ): 273 . doi: 10.3390/cryst7090273 . OpenUrl CrossRef ↵ Scholfield MR , Zanden CMV , Carter M , Ho PS . 2013 . Halogen bonding (X-bonding): A biological perspective . Protein Science . 22 ( 2 ): 139 – 152 . doi: 10.1002/pro.2201 . OpenUrl CrossRef PubMed ↵ Slater JC . 1964 . Atomic Radii in Crystals . The Journal of Chemical Physics . 41 ( 10 ): 3199 – 3204 . doi: 10.1063/1.1725697 . OpenUrl CrossRef ↵ The pandas development team . 2020 . pandas-dev/pandas: Pandas . doi: 10.5281/zenodo.3509134 . 10.5281/zenodo.3509134. OpenUrl CrossRef ↵ Troelsen NS , Shanina E , Gonzalez‐Romero D , Danková D , Jensen ISA , Śniady KJ , Nami F , Zhang H , Rademacher C , Cuenda A , et al. 2020 . The 3F Library: Fluorinated Fsp3 ‐Rich Fragments for Expeditious19 F NMR Based Screening . Angew Chem Int Ed. 59 ( 6 ): 2204 – 2210 . doi: 10.1002/anie.201913125 . OpenUrl CrossRef ↵ Turunen L , Hansen JH , Erdélyi M. 2021 . Halogen Bonding: An Odd Chemistry? The Chemical Record . 21 ( 5 ): 1252 – 1257 . doi: 10.1002/tcr.202100060 . OpenUrl CrossRef PubMed ↵ Verteramo ML , Ignjatović MM , Kumar R , Wernersson S , Ekberg V , Wallerstein J , Carlström G , Chadimová V , Leffler H , Zetterberg F , et al. 2024 . Interplay of halogen bonding and solvation in protein–ligand binding . iScience . 27 ( 4 ): 109636 . doi: 10.1016/j.isci.2024.109636 . OpenUrl CrossRef PubMed ↵ Wang Y , Fu Q , Zhou Y , Du Y , Huang N. 2019 . Replacement of Protein Binding-Site Waters Contributes to Favorable Halogen Bond Interactions . J Chem Inf Model . 59 ( 7 ): 3136 – 3143 . doi: 10.1021/acs.jcim.9b00128 . OpenUrl CrossRef PubMed ↵ Waskom ML . 2021 . seaborn: statistical data visualization . Journal of Open Source Software . 6 ( 60 ): 3021 . doi: 10.21105/joss.03021 . OpenUrl CrossRef ↵ Weiss MS , Wollenhaupt J , Correy GJ , Fraser JS , Heine A , Klebe G , Krojer T , Thunissen M , Pearce NM . 2022 . Of problems and opportunities—How to treat and how to not treat crystallographic fragment screening data . Protein Science . 31 ( 9 ): e4391 . doi: 10.1002/pro.4391 . OpenUrl CrossRef PubMed ↵ Westbrook JD , Shao C , Feng Z , Zhuravleva M , Velankar S , Young J. 2015 . The chemical component dictionary: complete descriptions of constituent molecules in experimentally determined 3D macromolecules in the Protein Data Bank . Bioinformatics . 31 ( 8 ): 1274 – 1278 . doi: 10.1093/bioinformatics/btu789 . OpenUrl CrossRef PubMed ↵ Westbrook JD , Young JY , Shao C , Feng Z , Guranovic V , Lawson CL , Vallat B , Adams PD , Berrisford JM , Bricogne G , et al. 2022 . PDBx/mmCIF Ecosystem: Foundational Semantic Tools for Structural Biology . Journal of Molecular Biology . 434 ( 11 ): 167599 . doi: 10.1016/j.jmb.2022.167599 . OpenUrl CrossRef PubMed ↵ Whitehouse RL , Alwan WS , Ilyichova OV , Taylor AJ , Chandrashekaran IR , Mohanty B , Doak BC , Scanlon MJ . 2023 . Fragment screening libraries for the identification of protein hot spots and their minimal binding pharmacophores . RSC Med Chem . 14 ( 1 ): 135 – 143 . doi: 10.1039/D2MD00253A . OpenUrl CrossRef PubMed ↵ Wilcken R , Zimmermann MO , Lange A , Joerger AC , Boeckler FM . 2013 . Principles and Applications of Halogen Bonding in Medicinal Chemistry and Chemical Biology . J Med Chem . 56 ( 4 ): 1363 – 1388 . doi: 10.1021/jm3012068 . OpenUrl CrossRef PubMed ↵ Zhang Q , Xu Z , Shi J , Zhu W. 2017 . Underestimated Halogen Bonds Forming with Protein Backbone in Protein Data Bank . J Chem Inf Model . 57 ( 7 ): 1529 – 1534 . doi: 10.1021/acs.jcim.7b00235 . OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted June 27, 2025. Download PDF Supplementary Material Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Halogen bonds between ligands and proteins: can we use them in validation? Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Halogen bonds between ligands and proteins: can we use them in validation? Ida de Vries , Georgia Tsiompanaki , Anastassis Perrakis , Robbie P. Joosten bioRxiv 2025.06.24.661284; doi: https://doi.org/10.1101/2025.06.24.661284 Share This Article: Copy Citation Tools Halogen bonds between ligands and proteins: can we use them in validation? Ida de Vries , Georgia Tsiompanaki , Anastassis Perrakis , Robbie P. Joosten bioRxiv 2025.06.24.661284; doi: https://doi.org/10.1101/2025.06.24.661284 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Biochemistry Subject Areas All Articles Animal Behavior and Cognition (7618) Biochemistry (17636) Bioengineering (13859) Bioinformatics (41847) Biophysics (21401) Cancer Biology (18535) Cell Biology (25423) Clinical Trials (138) Developmental Biology (13353) Ecology (19860) Epidemiology (2067) Evolutionary Biology (24287) Genetics (15582) Genomics (22463) Immunology (17701) Microbiology (40300) Molecular Biology (17141) Neuroscience (88432) Paleontology (666) Pathology (2825) Pharmacology and Toxicology (4813) Physiology (7633) Plant Biology (15107) Scientific Communication and Education (2042) Synthetic Biology (4285) Systems Biology (9808) Zoology (2267)
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.