Confidence-guided cryo-EM map optimisation with LocScale-2.0

doi:10.1101/2025.09.11.674726

Confidence-guided cryo-EM map optimisation with LocScale-2.0

2025 · doi:10.1101/2025.09.11.674726

preprint OA: gold CC-BY-4.0

📄 Open PDF Full text JSON View at publisher

Full text 103,831 characters · extracted from preprint-html · click to expand

Confidence-guided cryo-EM map optimisation with LocScale-2.0 | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Confidence-guided cryo-EM map optimisation with LocScale-2.0 View ORCID Profile Alok Bharadwaj , Reinier de Bruin , View ORCID Profile Arjen J. Jakobi doi: https://doi.org/10.1101/2025.09.11.674726 Alok Bharadwaj a Department of Bionanoscience, Kavli Institute of Nanoscience, Delft University of Technology , 2629 HZ Delft, The Netherlands Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Alok Bharadwaj Reinier de Bruin a Department of Bionanoscience, Kavli Institute of Nanoscience, Delft University of Technology , 2629 HZ Delft, The Netherlands Find this author on Google Scholar Find this author on PubMed Search for this author on this site Arjen J. Jakobi a Department of Bionanoscience, Kavli Institute of Nanoscience, Delft University of Technology , 2629 HZ Delft, The Netherlands Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Arjen J. Jakobi For correspondence: a.jakobi{at}tudelft.nl Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract Cryogenic sample electron microscopy (cryo-EM) maps often display uneven quality, with high-resolution features coexisting alongside weak or poorly ordered regions. Such variation complicates structural interpretation, especially for heterogeneous macromolecular assemblies. Here, we present LocScale-2.0, a context-aware map optimisation framework that operates without prior knowledge of molecular structure or composition. By leveraging general expectations of electron scattering by biological macromolecules, it enhances local detail and connectivity while preserving weak but biologically relevant structural context. We further introduce LocScale-FEM, a Bayesian-approximate deep-learning approach that emulates this optimisation to generate feature-enhanced maps. LocScale-FEM provides voxel-wise confidence scores that give a statistically grounded measure of reliability, are sensitive to local phase error in the feature-enhanced map, and highlight regions where interpretation warrants caution. Selected examples illustrate how such maps can aid biological interpretation and how confidence-guided map optimisation can increase objectivity in cryo-EM density analysis. Introduction Over the past decade, cryogenic electron microscopy (cryo-EM) has transformed structural biology by enabling high-resolution structure determination of macromolecular assemblies that were previously difficult or impossible to study by other structural methods. Cryo-EM now routinely delivers near–atomic resolution reconstructions across a wide range of systems and has become a cornerstone technique for exploring the structure if molecular machines in their functional states and native environments 1 , 2 . Current applications increasingly target systems that are structurally and compositionally complex: membrane proteins in native or near-native lipid environments 3 – 5 , large assemblies with flexible or low-occupancy subunits 6 – 8 , samples purified from endogenous sources 9 – 11 and in-cell structures obtained by subtomogram averaging from native cellular samples 8 , 12 , 13 . Such specimens often contain extensive structural context such as lipid/detergent shells or embedding membranes, heterogeneous modifications and peripheral scaffolds, and exhibit pronounced conformational and compositional heterogeneity. These features are frequently weak or poorly ordered, yet often biologically important. Interpreting such reconstructions therefore requires methods that enhance high-resolution detail without suppressing weak but informative low-resolution context, and ideally provide an estimate of confidence in regions where the map is ambiguous. Automating these processes is essential for reproducibility and for making reliable interpretation accessible beyond expert users. In cryo-EM single-particle analysis and subtomogram averaging, three-dimensional electric potential maps are assembled by averaging information of many molecules in differing orientation from low signal-to-noise ratio projection images or tomographic subvolumes. Because the ensemble of imaged molecules inevitably contains molecules in multiple states, the final reconstructions represent averages over conformers and compositions, even after classification into structurally uniform subsets. Regions of structural variability therefore exhibit reduced signal-to-noise ratio (SNR) and lower effective resolution 14 – 16 . The result is, sometimes strong, spatial variation in map quality across the reconstructed volume. To compensate for the variation in resolution-dependent contrast loss, and to facilitate structural interpretation, maps are typically post-processed after reconstruction by local spectral reweighting of Fourier terms 17 – 21 and real-space filtering 22 – 25 . More recently, density-modification approaches have extended these strategies by incorporating physical and statistical priors about expected map properties into post-processing 21 , 26 , 27 and during map reconstruction 28 , 29 . We refer to this spectrum of procedures collectively as map optimisation. Deep learning methods offer alternatives that mimic the effect of local sharpening or density-modification and produce optimised maps with little or no manual intervention 30 – 32 . While these methods are widely adopted, their lack of explicit reliability estimates introduces important caveats for interpretation. Deterministic neural networks risk introducing bias by suppressing or hallucinating signal and enhancing artefacts without signalling their uncertainty, leaving practitioners to subjective judgement when deciding which map features to interpret, especially in ambiguous, low contrast regions. With the ongoing exponential growth in cryo-EM structures this poses a risk for misinterpretation, especially by new and inexperienced users 33 . A framework that integrates map optimisation with robust confidence measures would therefore represent a critical step toward more objective and reproducible cryo-EM map analysis. Here we introduce LocScale-2.0, an automated frame-work for context-aware and confidence-guided map optimisation. The method extends the original LocScale approach 18 with a procedure for locally adaptive map optimisation that requires no prior model information. In addition, we develop a machine learning strategy that emulates this optimisation and provides a voxel-wise confidence metric to assess the reliability of individual features. Together, these components yield maps that preserve weak but biologically informative context, improve contrast for high-resolution detail, and support more objective structural in-terpretation. Results Multimodal cryo-EM map optimisation in LocScale-2.0 LocScale-2.0 integrates physics-informed and deep learning-based map optimisation into complementary workflows ( Figure 1 ). The first workflow couples model-independent local scale estimation with windowed Fourier-amplitude scaling, which is conceptually related to local map sharpening in the original LocScale approach 18 . Instead of using explicit model information as a reference, it employs physical priors to estimate and locally compensate for resolution-dependent contrast loss. These priors draw on established expectations for the averaged squared structure factor of biological macro-molecules 21 , 34 , 35 . The second workflow implements a deep convolutional neural network, MC-EMmerNet, that learns from pairs of unmodified input maps and maps optimised with our physics-informed procedure to predict feature-enhanced maps directly in real space. Unlike the physics-based method, which adjusts only the amplitudes of Fourier coefficients and leaves their phases locally unchanged, this procedure modifies both amplitudes and phases in a manner similar to density modification. To quantify predictive uncertainty, we adopt a Bayesian approximation using variational inference with Monte Carlo dropout 36 . In addition, the workflow produces a baseline map derived from local amplitude scaling of the unmodified half maps with the mean predicted map, which serves as a reference for computing a voxel-wise confidence metric that is sensitive to local phase discrepancies and hence putative bias in the feature-enhanced map (see Methods). Download figure Open in new tab Fig. 1. Overview of LocScale-2.0 LocScale-2.0 provides two complementary workflows for map optimisation. The physics-informed workflow leverages priors on electron scattering properties to generate reference maps, which are then used for local scaling of radially averaged Fourier amplitudes. The deep neural network (DNN)-based workflow employs MC-EMmerNet, a network trained to emulate the physics-informed process, to directly predict an optimised map. This predicted map can either serve as a scaling reference or, when generated with a variational inference-enhanced network (MC-EMmerNet), as a directly interpretable feature-enhanced map . Confidence scores are calibrated against amplitude-modified baseline maps, enabling systematic identification of high-versus low-confidence regions for structural interpretation (see LocScale-FEM). Physics-informed map optimisation A limitation of most existing map-optimisation methods is their susceptibility to bias. This limitation affects reference-based sharpening approaches implemented in LocScale-1.0 18 or phenix.autosharpen 19 , as well as density modification 27 and deep learning-based methods 30 – 32 . In reference-based methods, inaccuracies or incompleteness in the input structural model may cause suppression of density in regions not supported by the reference, and obscure relevant contextual features for biological interpretation 18 , 21 . Deep learning-based methods 30 – 33 face analogous challenges, often compounded by limitations in representa-tiveness of training data and generalisability. An additional concern for these latter methods is positive bias, where plausible but non-existent structural details are hallucinated in a way that could lead to misinterpretation. To mitigate these issues, we developed a method for local map optimisation that considers the unbiased molecular signal of the 3D reconstruction and requires no prior structural information. The approach constrains the radially averaged Fourier amplitudes using first-principles expectations and data-driven estimates of the average squared structure factor of biological macromolecules. The spectral profile of this radial structure factor depends on molecular mass distribution, local B factors, and secondary structure 21 , 34 , 35 . To approximate these parameters, we first estimate the molecular volume using statistical hypothesis testing with false discovery rate (FDR) control 37 and define density consistent with genuine molecular signal at the 1% FDR threshold ( Supplementary Figure S1a,b ). Molecular mass estimates from the volume enclosed by the binarised FDR mask correlate strongly with masses computed from primary sequences and support our chosen threshold as a suitable proxy for the molecular envelope ( Supplementary Figure S1c,d ). Importantly, this method reliably generates envelopes that capture density from molecular components absent from the primary sequence, enabling its application to complexes with heterogeneous or unknown composition ( Supplementary Figure S1c,d ). Within this envelope, pseudoatoms are placed randomly to initialise a pseudomodel, which is then iteratively refined against the experimental density ( Supplementary Figure S2a–c ). In many practical cases, partial structural information is available from prior experimental models or structure prediction and can be exploited in a hybrid workflow that uses explicit model coordinates where available and a pseudoatomic representation in unmodelled regions ( Figure 2a–c ; Supplementary Figure S1a ). This strategy ensures that all density within the molecular boundary is represented and prevents signal suppression in regions lacking atomic models. Download figure Open in new tab Fig. 2. Pseudomodel generation and ADP refinement (a) Example for pseudoatom placement and refinement for Drosophila melanogaster NOMPC (EMDB: EMD-8702 ) with partial prior model information (hybrid model). Pseudoatoms (blue) are uniformly placed within the molecular boundary defined by the FDR confidence mask except for regions for which prior model information is available (gray). Models are shown for the start (iteration 1) and end (iteration 50) of the refinement. (b) Close-up of a region at the interface between explicit and pseudomodel. (c) Radially averaged Fourier amplitudes of model maps computed throughout the iterations of pseudomodel refinement. Inset: Close-up of low-to-medium resolution region defining the overall molecular envelope. (d) Atomic displacement factors (ADP) mapped onto atomic coordinates shown for different snapshots across the ADP refinement cycles. (e) Evolution of model-to-map Fourier shell correlation (FSC) shown for a series of ADP refinement cycles. The insets shows the half-map validation displaying the average integrated FSC for work and test maps as a function of refinement cycle. (f) Correlation of atomic model and pseudomodel ADPs averaged in 25 Å windows. R denotes the Pearson correlation coefficient. (g) Distribution of Pearson correlation coefficients for window-averaged ADPs between atomic and pseudomodel representations across 83 EMDB entries. (h) Average model-to-map Fourier Shell Correlation computed for 83 EMDB entries and their corresponding PDB-deposited models, pseudomodels and hybrid models. The shaded areas correspond to 95% confidence intervals. Maps were resampled to uniform pixel size for comparison. See also Supplementary Figure S1 - S3 . To approximate the physical decay of the overall structure factor, atomic displacement factors (ADPs or B factors) are then refined using restrained refinement based on local neighbourhood averaging across an empirically determined radius ( Figure 2d–e , Supplementary Figure S2d–e ; Methods). These restraints ensure that B factors of pseudoatoms, which are independent and non-bonded, vary smoothly, thereby effectively reducing the number of free refinement parameters. Refined local B factors from pseudomodels agree closely with those from restrained ADP refinement of atomic models ( Figure 2f–g , Supplementary Figure S3d–e ), without evidence of overfitting ( Figure 2e , Supplementary Figure S2e ). The resulting B factor distributions follow the shifted inverse-gamma behaviour characteristic for macromolecular structures 38 , 39 . In several cases, we observed multimodal B factor distributions consistent with structural heterogeneity such as flexible loops, peripheral or low-occupancy subunits, detergent micelles, and with prior reports that local mixtures of shifted inverse-gamma distributions reflect conformational or compositional variability 39 ( Supplementary Figure S3h-i ). Together, these steps provide model-independent estimates of local structure factors and their resolution-dependent falloff, from which radially averaged structure factors can be computed. Because the pseudomodel representations only approximate secondary structure, we apply empirical priors to imprint expected spectral texture of secondary structure elements from proteins and nucleic acids into the local radial structure factor over the relevant frequencies 21 , 29 . The spectral profiles of the locally averaged Fourier amplitudes are then used for local map sharpening as described previously 18 . A detailed account for the implementation of the above procedure is given in the Methods. Comparison of model–to–map Fourier Shell Correlation (FSC) curves for 83 model–map pairs illustrates the respective strengths and limitations of atomic, pseudoatomic, and hybrid reference models for local amplitude scaling ( Figure 3h ). Pseudomodels, which lack explicit stereochemical information, are well suited to capturing low-resolution scattering behaviour by representing signal-containing regions not typically covered by atomic models, but they cannot fully reproduce high-resolution features. Atomic models, in contrast, provide an accurate description of high-resolution signal but tend to suppress density in weak, unmodelled or heterogeneous regions. Hybrid models combine these complementary advantages and yield the most balanced representation of the experimental density. In the following we will therefore focus our discussion on applications of this hybrid approach for reference generation and subsequent local sharpening in LocScale-2.0. Download figure Open in new tab Fig. 3. Comparison of LocScale-2.0 hybrid mode map optimisation with other local sharpening methods (a) Map optimisation of Klebsiella pneumoniae type II secretion system outer membrane complex (EMDB: EMD-0193 ) using model-based sharpening with LocScale-1.0 (left), hybrid reference sharpening in LocScale-2.0 (middle) and phenix.autosharpen (right). Approximate locations of the outer (OM) and inner (IM) membrane are indicated. Arrows mark the visible detergent shell of the outer membrane-spanning segment and the section views reveal the central disordered plug occluding the lumen. (b) Optimised maps for human Tweety homologue 2 (EMDB: EMD-51108 ). The arrows mark density for N-linked glycans and the lipid belt around the the hydrophobic cavity. See also Supplementary Figure S4 . Preserving structural context with hybrid map optimisation To benchmark our procedure, we applied LocScale-2.0 to generate optimised maps for a set of representative single-particle reconstructions and subtomogram averages from the Electron Microscopy Data Bank (EMDB), and compared them with corresponding maps produced by two established local sharpening approaches: LocScale-1.0 18 and phenix.autosharpen 19 (see Methods for details). Across test cases, LocScale-2.0 produced maps whose high-resolution detail was generally comparable to, and in some cases improved relative to, the alternative methods, while additionally preserving and enhancing weak but informative density in regions that are flexible, disordered, or generally unmodelled such as detergent shells, lipid belts, N-linked glycans, and low-occupancy subunits ( Figure 3 , Supplementary Figure S4 ). A notable feature of the optimised maps is that both high-resolution detail and weak, low-resolution contextual density remain visible at a single density threshold, allowing co-visualisation of these densities during map interpretatioo and facilitating direct comparison between structurally heterogeneous regions. For example, in the Klebsiella pneumoniae type II secretin (EMD-0193), the LocScale-2.0 map co-visualises the plug density that occludes the lumen, a feature likely unresolved at high resolution due to its mismatch with the C 15 symmetry of the secretin complex 40 . In the deposited half maps this feature is only detectable after strong low-pass filtering ( Figure 3a , Supplementary Figure S4e ). In subtomogram averages of Mycoplasma pneumoniae 70S ribosomes (EMD-13234) from in-cell to-mograms, the LocScale-2.0 map co-visualises heterogeneous density at the mRNA entry and A-site tRNA without loss of high-resolution detail in well-resolved regions (Extended Figure S4a-c). Similarly, in Tweety homologue 2 (TTYH2; EMD-51108), LocScale-2.0 captures the largely continuous lipid/detergent belt surrounding the transmembrane region as well as the N-linked glycans, while retaining fine detail of the transmembrane helices, including individually resolved, ordered lipids ( Figure 3b , Supplementary Figure S4d ). Overall, these observations show that hybrid reference-based sharpening simultaneously enhances weak contextual features and high-resolution detail, and yields maps that represent heterogeneous complexes and assemblies in a manner more consistent with their structural context. This extends to highly heterogeneous assemblies: In apolipoprotein B-100 (apoB-100)-assembled low-density lipoprotein (LDL) particles (EMD-44469), for instance, the method emphasises well-resolved density for the structured apoB-100 N-terminal domain including morphological features of its β-belt formed by amphipathic β-sheets wrapped around the surface of the core lipids of LDL, while retaining the weak density consistent with cholesteryl ester plates within the LDL core ( Figure 4a,b , Supplementary Figure S4f ). By contrast, these weak and low complexity densities are entirely suppressed by the alternative methods. Download figure Open in new tab Fig. 4. Preservation of contextual structure by LocScale-2.0 (a) cryo-EM density maps of Apolipoprotein B 100 bound to LDL receptor and legobody (EMDB: EMD-44469 – top; deposited 6 ) and after hybrid reference sharpening in LocScale-2.0 (bottom). (b) LocScale-2.0 optimised map EMD-44469. Top: Density assigned to protein is shown in blue; unassigned contextual lipid density is shown in grey. Bottom: The deposited atomic model (PDB: 9bdt ) fitted into the optimised map with colours as labelled. Cross-sections show the cholesteryl ester plates in the interior of the low-density lipoprotein (LDL) particle. See also Supplementary Figure S4 . LocScale-2.0 optimised maps aid automated model building We next asked whether the improved balance in representing high- and lower resolution features in LocScale-2.0 optimised maps can aid automated methods for atomic model building. To test this, we used the cryo-EM model building software ModelAngelo 41 on a bench-mark set of 50 map–model pairs from the EMDB and PDB, each determined at better than 4.0 Å FSC resolution. For each case, an optimised map was generated using the hybrid LocScale-2.0 procedure, and ModelAngelo was run both on these maps and on the corresponding EMDB-deposited maps ( Supplementary Figure S5 ). Overall, ModelAngelo achieved higher sequence coverage from LocScale-2.0 maps than from deposited maps, both before (82%) and after (72%) pruning of short peptide fragments ( Supplementary Figure S5a-c ). On average, these models also exhibited smaller predicted backbone root-meansquared deviation (r.m.s.d.) for both protein and nucleic acid components. Interestingly, improvements were observed for targets both represented and not represented in the ModelAngelo training dataset. In several cases, the improvements were substantial. For example, in the Azospirillum brasilense glutamate synthase (EMD-10106), the LocScale-2.0 map enabled building of 1306 additional residues compared to the deposited map ( Supplementary FigureS5d,e ). Given that this α 6 β 4 complex comprises 11108 residues in total, this represents an increase of ~ 12% in modelled sequence. In 17% of the bench-mark cases, however, the EMDB-deposited maps produced higher sequence coverage than LocScale-2.0 maps and in 11% the sequence coverage was equal, indicating that improvements are not uniform across the dataset. The sequence recall (i.e. the fraction of residues correctly identified compared to the PDB deposited model) computed from the 50 test map-model pairs was comparable for EMDB-deposited and LocScale-2.0 maps (Extended Figure S5f-j). Since ModelAngelo was trained on generally B -factor–augmented maps, these results suggest that additional gains might be realised by retraining ModelAn-gelo, or related deep learning–based model building tools, directly on LocScale-2.0 maps, thereby potentially extending their reach to lower resolution. Complementary to retraining, LocScale-2.0 optimisation could also be applied at the inference step, so that model building benefits from context-aware maps during prediction. In practice, these strategies may be combined to maximise performance. Feature-enhanced maps from uncertainty-aware deep learning We next investigated whether the physics-informed map optimisation procedure can be replicated and accelerated using machine learning. To this end, we trained a 3D U-Net on pairs of unmodified half maps and hybrid LocScale-2.0 maps to predict optimised maps directly from unmodified input densities. Predictions from this network, which we term MC-EMmerNet, emulate the sharpening achieved by the physics-informed approach ( Supplementary Figure S6a-d ) at substantially reduced computational cost. For example, for a large and context-rich structure such at the apolipoprotein B100 assemblies (EMD-44469; Figure 4 complex, network prediction speeds up map optimisation about 16-fold compared to the physics-informed procedure (14 min vs. ~ 4h; Supplementary Table S1 ). However, deterministic networks provide point estimates with no measure of predictive uncertainty that would allow identification of regions where the output of the network may be unreliable. To overcome this limitation, we implemented variational inference in the 3D U-Net using Monte Carlo dropout, which retains dropout layers at inference time and samples multiple stochastic forward passes 36 . This produces an ensemble of predictions from which voxel-wise means and variances can be computed, yielding both the average predicted map (which we call F eature- E nhanced M ap, or LocScale-FEM) and a spatially resolved estimate of predictive uncertainty ( Figure 5a , Figure S6e-g ). Rather than using the raw voxel-wise variance from these predictions as the uncertainty metric, we take the ensemble mean as a reference to perform local amplitude scaling and generate a baseline map that locally retains experimental phases while matching the predicted amplitude distribution. The statistical difference of voxel intensities between the predicted ensemble distribution and the baseline reference then allows computing a probability-derived confidence measure in the form of a rescaled z-score that we term the predicted voxel-wise difference test (pVDDT) score. Since Fourier amplitudes have been spectrally matched in baseline and feature-enhanced maps, the intensity residuals are dominated by phase errors in the predicted map (see Methods) and the pVDDT metric captures these errors in an interpretable way ( Figure 5a , Supplementary Figure S6l-k ). Download figure Open in new tab Fig. 5. Confidence-weighted map optimisation and feature-enhanced maps (LocScale-FEM) (a) Schematic overview of Bayesian-approximate variational inference in MC-EMmerNet (left), and computation of voxel-wise pVDDT confidence scores by statistical comparison to a baseline reference (right). The far right shows the resulting feature-enhanced map (FEM) weighted according to local confidence. (b) Illustration of predicted and scaled central voxel intensity distributions for five voxels with varying pVDDT scores. For clarity, only a single predicted distribution is shown; in practice, unique distributions are generated per voxel. (c-d) Comparison of baseline and LocScale-FEM maps for plant phytochrome A (EMDB: EMD-35691 ). Shown are two regions with positive pVDDT scores (threshold: 0.15), overlaid with baseline maps displayed at varying thresholds, with (c) showing an example where the baseline map nevers recovers the positively flagged density. See also Supplementary Figures S6 – S7 . Interpreting pVDDT confidence scores While the variances from Monte Carlo dropout provide a first estimate of predictive uncertainty, we found that they were systematically smaller than the actual prediction errors, measured as the absolute difference between the predicted means and the corresponding baseline values ( Supplementary Figure S6h ). This mismatch reflects the common tendency of Monte Carlo dropout to underestimate uncertainty and produce overconfident predictions 42 , 43 . We therefore used isotonic regression calibration to adjust the predicted standard deviations so that they matched the empirically observed residuals ( Supplementary Figure S6i ). The resulting calibrated uncertainties establish a statistically robust baseline for voxel-wise pVDDT scores, which quantify both the probability and direction of signal deviations in the predicted maps ( Figure 5b-c , Supplementary Figure S6l-m ). The magnitude of the score reflects the statistical strength of the deviation. For interpretability, we define three ranges of pVDDT values. Scores between –80 and +80 fall within the reliable range, corresponding approximately to the central 80% confidence interval of the standard normal distribution. This threshold provides a practical compromise between sensitivity and robustness of the metric. Scores below –80 or above +80 indicate statistically significant deviations, while values beyond ± 95 mark voxels where deviations are highly unlikely given the calibrated uncertainty. As feature-enhanced maps tend to accentuate secondary structure, negative pVDDT confidence scores often appear along the grooves of α -helices. High positive pVDDT scores (greater than +95) may represent network hallucination of density features not present in the phase-conservative baseline map ( Figure 5c , Supplementary S7a), but in other cases may correspond to real features ( Figure 5d , Supplementary S7b). Thus, pVDDT confidence scores help draw attention to regions that merit closer inspection, and joint examination of feature-enhanced and baseline maps provides an efficient strategy for guiding interpretation. One limitation of our procedure is that pVDDT values are referenced to the feature-enhanced maps for visualisation; as a result, strongly negative scores corresponding to genuine densities that are completely suppressed in the prediction will not be reported. Feature-enhanced maps should therefore always be evaluated alongside the baseline map to ensure that such features are not overlooked. Applications of LocScale-FEM in structure analysis We examined how pVDDT confidence scores can guide interpretation of feature-enhanced maps from LocScale-FEM. As a first example, we applied LocScale-FEM to the unmodified half maps of EMD-13234 to re-examine the in-cell subtomogram averaged reconstruction of M. pneumoniae 70S ribosomes 8 . For comparison, we also generated the corresponding map using DeepEMhancer, which has been trained on LocScale-1.0 (model-based) maps 30 . The LocScale-FEM map effectively recovered weak density at levels comparable to the equivalent hybrid LocScale-2.0 map (cf. Supplementary Figure S4a-c ), including density at the mRNA entry site, A-site tRNA and the nascent peptide ( Figure 6a ). pVDDT confidence scores supported the reliability of most of these features, with the exception of the nascent peptide density 8 . While density near the mRNA entry site remained heterogeneous and uninterpretable, the A-site density in the LocScale-FEM map supported confident tRNA placement ( Figure 6b ). In contrast, DeepEMhancer maps showed pronounced downscaling of the same regions, leaving them essentially uninterpretable ( Figure 6a,b ). Download figure Open in new tab Fig. 6. Comparison of LocScale-FEM and alternative deep learning approaches for contextual structure recovery (a) LocScale-FEM and DeepEMhancer maps of Mycoplasma pneumoniae 70S ribosome (EMDB: EMD-13234 ). Selected contextual densities are highlighted in the LocScale-FEM map. The 1% FDR contour computed from the unmodified half maps is outlined for both maps. (b) Close-up views from (a), showing improved interpretability of densities for the A-site tRNA, nascent peptide, and a peripheral region. (c) Comparison of author-deposited, EMReady-optimised, and LocScale-FEM maps for subtomogram averages of the Human T-cell leukemia virus type I immature capsid (CA;EMDB: EMD-17929 ). The capsid protein C-terminal domain (CA-CTD) is highlighted. A close-up shows the CA-CTD viewed from below, comparing the 25 Å low-pass filtered EMDB map with the LocScale-FEM map. (d) Author-deposited and optimised maps for in situ subtomogram averages of the peripheral stalks of Polytomella ATP synthase (EMDB: EMD-19999 ). All optimised maps are superimposed on the low-pass filtered contour of the EMDB-deposited map. Contextual densities for the F 1 and F 0 ATP synthase subunits, oligomycin sensitivity-conferral protein (OCSP), and the crista membrane are indicated. (e) Close-up of the C 2-symmetric ATP synthase dimer in the LocScale-FEM map. The right half of the map is shown transparent and superposed on PDB 6rd4 (F 1 and F 0 ) and PDB 9evd (peripheral stalk). The pVDDT colour bar is shown for reference. (f) Zoom of the F 0 subunit showing resolved helical densities for the C 10 ring. (g) Volume recall for EMD-0665 computed for different thresholds for LocScale-FEM, EMReady and DeepEMhancer optimised maps. (h) Volume recall curves for LocScale-FEM, DeepEMhancer and EMReady maps generated for EMD-0665 (i) Area-under-the-recall-curve (AURC) for LocScale-FEM, DeepEMhancer and EMReady plotted for 26 randomly selected maps from the EMDB. Statistical significance of mean differences was evaluated by permutation testing with 10,000 resamples. See also Supplementary Figure S7 . A similar trend was observed for subtomogram averages of tubular lattices formed by the capsid (CA) and nucleo-capsid (NC) domains of Human T-cell leukemia virus type I (EMD-17929) 48 . LocScale-FEM produced interpretable density for dimers within the the irregular hexamers formed by the CA C-terminal domain (CA-CTD), which in the EMDB-deposited map is visible only after strong low-pass filtering ( Figure 6c ; shown at 25 Å low-pass) and entirely suppressed in the corresponding EMReady map. It has been hypothesised that CA-CTD interactions buttress the NTD scaffold but leave the lattice free to adopt diverse curvatures 48 , highlighting that co-visualisation of ordered elements (here, the NTD lattice) and less-ordered components (here, CTD-mediated contacts) in such reconstructions may help inform mechanistic models. Another class of structures for which co-visualisation of contextual density is highly informative are transmembrane or membrane-associated complexes. An illustrative case is the in-cell structure of mitochondrial ATP synthase from Polytomella 49 . The deposited consensus map (EMD-19999) captures ATP synthase dimers on cristae ridges, with the best resolved region (4 Å local resolution) at the central peripheral stalk. The F1 and Fo subcomplexes are less well resolved due to averaging over different rotational states 49 , but remain visible after low-pass filtering ( Figure 6d ). Map optimisation with DeepEMhancer and EMReady entirely suppressed density outside the central peripheral stalk, whereas the LocScale-FEM map co-visualised the peripheral stalks alongside both F1 and Fo subcomplexes and the strongly curved cristae membrane, without loss of detail in the peripheral stalks compared to the deposited or otherwise density-modified maps. The LocScale-FEM map also distinguished individual α -helical densities for several of the ten outer c-ring subunits embedded in the membrane ( Figure 6e,f ), with pVDDT scores suggesting high confidence for these features. This case exemplifies how LocScale-FEM can preserve the broader architectural context of complex membrane-bound assemblies. Similarly, LocScale-FEM maps of the yeast COPII inner coat assembled on membrane tubules (EMD-15949) 5 , 50 allowed confident placement of the Sar1 amphipathic helix inserting into the outer leaflet of the membrane ( Supplementary Figure S7d ). The map clearly visualises the parallel insertion of the amphipathic helices, which has been posited to reinforcing curvature through cooperative interactions across the lattice 51 . Additional examples are provided in Supplementary Figure S7e-f . The above examples suggest that LocScale-FEM is less prone to inadvertent signal suppression, preserving contextual density features that are often obliterated by other deep-learning–based map optimisation methods. To quantify this effect, we measured volumetric recall relative to an unbiased signal envelope derived from the original half maps using FDR thresholding 52 . For each case, LocScale-FEM, DeepEMhancer, and EM-Ready maps were normalised by rescaling their positive voxels to the unit interval [0,1]. We then calculated volumetric recall across varying thresholds to generate recall curves for each method. Figure 6d,e illustrates an example for this procedure. Applied to 26 randomly selected EMDB reconstructions, LocScale-FEM showed significantly higher integrated volume recall (AURC) compared to DeepEMhancer and EMReady, confirmed by permutation testing (p < 0.0004 and p < 0.0002, respectively; Figure 6f ). This analysis establishes that the advantages observed in individual examples generalise across diverse datasets. Interpretation of small-molecule ligands We next examined the utility of feature-enhanced maps and pVDDT scores for interpreting small-molecule ligands and other non-protein components. As a representative case, we analysed the GPCR–Gi complex of human relaxin family peptide receptor 4 (RXFP4) bound to compound 4, an amidrazone scaffold (EMD-33888) 53 , 54 . LocScale-FEM reproduced the ligand density observed in the deposited (DeepEMhancer-processed) map, with visible features corresponding to both the hydroxyindole and chlorophenyl substituents ( Figure 7a ). Analysis of pVDDT confidence scores, however, revealed important distinctions between these moieties. While the scores supported reliable interpretation of the hydroxyindole group, strongly positive scores around the chlorophenyl substituent indicated possible overemphasis of density at this site relative to an amplitude-modified baseline. This differential confidence scoring demonstrates how our approach can provide additional guidance for ligand interpretation by flagging regions where structural features may be less reliable or potentially artifactual. To validate this approach across different ligand chemistries, we examined β-galactosidase bound to the inhibitor phenylethyl-β-D-thiogalactopyranoside (PETG; EMD-7770) 55 , where lig- and pose can be challenging 56 . The LocScale-FEM analysis showed high confidence density for the well-ordered pyranose moiety while appropriately downscaling density for the somewhat more flexible phenylethyl substituent ( Supplementary Figure S8b ). This pattern suggests that our confidence scoring effectively distinguishes between well-ordered structural elements and regions with inherently higher mobility or weaker density. LocScale-FEM demonstrated density preservation across diverse ligand types and retained ligand density also in cases where other deep-learning methods tend to downscale density excessively ( Figure 7b,c , Supplementary Figure S8c-e ). Despite this apparent robustness, fundamental limitations remain. Ligands are strongly underrepresented in the EMDB and their structural diversity spans an enormous chemical space, which places inevitable constraints on any deep-learning model’s ability to generalise across all molecular scaffolds. This limitation is exemplified in our analysis of ordered lipid densities in the Connexin-43 gap junction channel (EMD-33394) 57 ( Supplementary Figure S8a ). While such densities are clearly visible in the base-line LocScale maps, they were substantially downweighted in LocScale-FEM as well as in DeepEMhancer and EM-Ready predictions. This case shows that all three deep learning models may systematically suppress genuine signal. Taken together, these examples illustrate both the potential and the limitations of LocScale-FEM for non-protein components. Confidence scores can provide useful discrimination in some cases, while in others suppression of genuine features persists. In practice, joint inspection of feature-enhanced maps, confidence scores, and baseline references will therefore be essential for interpretation. Download figure Open in new tab Fig. 7. Small-molecule ligand interpretation with LocScale-FEM (a) Author-deposited (DeepEMhancer) and LocScale-FEM map of (RXFP4)-G i bound to 1-[2-(4-chlorophenyl)ethyl]-3-[(7-ethyl-5-oxidanyl-1H-indol-3-yl)methylideneamino]guanidine (compound 4; EMDB: EMD-33888 ). Ligands superposed on their respective densities are shown on the right. (b) LocScale-FEM map for human voltage-gated sodium channel (Nav1.7; EMDB: EMD-351993 ) in complex with bupivacaine 44 The close-ups show ligand-superposed densities for LocScale-FEM, DeepEMhancer and EMReady-optimised maps. The LocScale-FEM baseline map is also shown for comparison. (c) LocScale-FEM maps for Thermus thermophilus complex I (EMDB: EMD-11231 ) 45 , pyruvate kinase PKM (EMDB: EMD-10577 ) 46 and stabilised F-actin filaments (EMDB: EMD-10366 ) 47 containing a chemically diverse array of ligands. 2D chemical representations of the respective ligands are drawn below. See also Supplementary Figure S8 . Discussion In this work, we demonstrate new capabilities of LocScale-2.0 map optimisation for recovering weak and contextual structure in reconstructions affected by conformational or compositional heterogeneity, both from cryo-EM single-particle analysis and cryo-ET subtomogram averaging. LocScale-2.0 integrates physics-informed map sharpening with uncertainty-aware deep learning to address limitations of current map post-processing methods. Both hybrid sharpening and feature-enhanced maps generated by LocScale-FEM consistently mitigate negative bias in regions that remain poorly resolved in consensus maps or retain residual heterogeneity after extensive classification. These improvements are most pronounced for low-resolution regions and contextual density, while performance in the highest-resolution areas varies due to limitations of current physical priors and residual trade-offs between preserving low-resolution context and maximally accentuating high-resolution detail. Importantly, LocScale-FEM introduces calibrated voxel-wise confidence scores that enable systematic identification of ambiguous regions, thereby reducing reliance on experience and subjective judgment. Although not all retained low-resolution density will be chemically interpretable, the ability of LocScale-2.0 maps to co-visualise high-resolution details and weaker contextual features at a single density threshold represents an important practical advantage for structural analysis and the visual communication of complex macromolecular assemblies. Several limitations warrant consideration. pVDDT confidence estimates are referenced to the feature-enhanced maps, and strongly negative deviations corresponding to genuine features completely suppressed during prediction may go undetected. This is most relevant for small-molecule ligands and other components under-represented in the training set, underscoring the need to inspect feature-enhanced maps alongside their baseline references. Likewise, while our physical priors capture general scattering behaviour, they do not account for all aspects of macromolecular structure and further improvements can be made. Finally, although throughout we refer to significant differences between predicted and base-line maps as phase errors in the context of confidence estimates, it should be emphasised that the experimental Fourier phases themselves are subject to error. Since the true, error-free structure is unknown, the metric should therefore be seen as a conservative measure erring on the side of caution. Put differently, it should be recognised that some apparent errors may reflect genuine improvements over noisy observations but cannot be distinguished as such. Future extensions could refine physical priors through explicit anisotropy corrections to account for directiondependent blurring, and incorporate expectations on map behaviour in real-space such as solvent flattening 58 – 60 , histogram matching 61 , 62 , and the use of symmetry-related correlations. Several of these ideas have been investigated in previous methods, but their combination remains unexplored 26 , 27 . For LocScale-FEM, while Monte Carlo dropout offers a practical means to estimate uncertainty, Bayesian alternatives that are currently computationally too demanding may in the future yield better calibrated or more accurate uncertainty estimates 63 – 65 . By introducing a statistical measure of reliability, LocScale-2.0 represents a step toward automated cryo-EM map in-terpretation frameworks that transparently report on predictive uncertainty. More broadly, integrating confidence-aware optimisation into automated model building and refinement could increase accuracy and sequence recall of these methods toward lower resolution maps. As cryo-EM expands to increasingly complex systems, such approaches will be important for ensuring rigorous and objective structural analysis. DATA AND CODE AVAILABILITY LocScale-2.0 is open-source software released under a BSD license and is available at https://github.com/cryotud/locscale , where detailed documentation is also provided. Pretrained MC-EMmerNet models (v0.3) can be accessed via Zenodo (DOI: https://zenodo.org/records/8211668 ). Scripts used to generate figures shown in this manuscript can be found at https://gitlab.tudelft.nl/aj-lab/publications/2025_LocScale-2.0 . Methods Estimation of molecular envelope The regions in a map that correspond to macromolecule and associated components (such as lipid, glycans or ligands) as opposed to solvent (i.e. the molecular envelope or boundary) are identified using False Discovery Rate-controlled statistical thresholding 37 . Sampling windows located near the box edges are used to to estimate the background noise distribution; we note that the procedure will fail if the noise sampling box overlaps with part of the signal as can happen for filaments or subtomogram averages in which signal extends to (some of) the box edges. In these cases, noise center coordinates of sampling windows can be individually supplied. The size of the noise box is set to 20 pixels or 10% the unit cell dimension, whichever is higher. FDR confidence maps are binarised at 1% FDR to yield confidence masks . Estimation of total scattering mass Using the molecular volume enclosed by the confidence mask, the number of required pseudoatoms is calculated assuming constant values for the mean protein density and the average atomic mass of the pseudoatoms: The number of required pseudoatoms to fill this missing scattering mass is calculated assuming constant values for the mean protein density and the average atomic mass: where N A denotes Avogadro’s constant, ρ avg (1.35 g/cm 3 ) is the mean protein density determined from partial specific volumes using hydrodynamic compressibility 66 , 67 and V mask is the volume of the FDR mask (for pure pseudo-models) or the difference mask (for hybrid models). The average atomic mass for pseudoatoms was estimated by computing the ratio of molecular mass to the number of non-hydrogen atoms over 119 atomic models from a reference dataset, which is derived from the training data used for DeepEMhancer. The median ratio was found to be 13.2 Da. For hybrid model construction, we estimate the unmodelled volume by computing the difference between the FDR-based confidence mask and a binary mask derived from the available atomic model. The atomic model mask is obtained by placing a spherical mask of radius 3 Å at each atomic coordinate excluding hydrogen atoms. To minimise artefacts arising from subtraction, the difference mask is smoothed with a uniform filter across three voxels and subsequently binarised at a threshold of 0.5. The calculated number of pseudoatoms are initially placed at random within the boundaries of the FDR confidence or difference mask. They are further randomly displaced by a magnitude of 0.5 pixels to prevent two atoms from overlapping. Positional refinement of pseudoatoms The positions of pseudoatoms are then refined using a regularised gradient-based molecular dynamics scheme, with the cryo-EM density map acting as an external potential. This refinement integrates density-gradient forces and interatomic Lennard–Jones (LJ) interactions using a simple Verlet integration with friction damping 68 . For simplicity, pseudoatom mass is set to unity, so that forces directly translate to accelerations. Note the atoms corresponding to the input atomic models remain unchanged during this operation. The total force on a pseudoatom is computed as: The attraction to high-density regions is modeled by the local gradient of the cryo-EM map: where ∇ρ is the local gradient of the density map, and g is a scaling factor to scale the gradient force magnitude relative to that of the Lennard-Jones term (default g = 10). This approach is conceptually similar to other density-biased refinement methods 69 , 70 . To avoid pseudoatom clustering and promote spatial regularity, a pairwise Lennard–Jones potential is applied between pseudoatoms within a 3 Å neighborhood.To stabilise the refinement and assist convergence, we apply linear friction: where v is the instantaneous velocity of the pseudoatom and μ = 10 is the friction coefficient. We implemented velocity Verlet integration to propagate the positions and velocities of pseudoatoms. By default. the refinement runs for 50 iterations with a timestep of Δt = 0.05 (in arbitrary units) which we found to reach convergence in most cases. Once the positions of all pseudoatoms are refined, pseudatoms are merged with the input atomic model to form a single structure. The pseudoatoms are introduced as a separate chain, with the sequence number of the added chain recorded for downstream purposes. For consistency, identifiers of the original atomic model chains always begin from “A”. If no input model is supplied, LocScale-2.0 assumes the entire map is unmodelled. Only the pseudoatomic model is retained for further processing. The overall workflow for constructing the pseudomodel and hybrid model is illustrated in Supplementary Figure S1a . ADP refinement of pseudoatoms and hybrid models LocScale 2.0 performs ADP (isotropic B -factor) refinement with REFMAC (v5.8) 71 via the Servalcat wrapper (v0.4.100) 72 , and supports explicit atomic models, pure pseudomodels, and hybrid models. In all cases positional refinement is disabled ( refi bonly ), all atomic B fac- 2 tors are initialised to 40 Å, and refinement is carried out against the unmodified map up to the Nyquist frequency. REFMAC restrains ADPs using a weighted Kullback–Leibler divergence between atom pairs with the isotropic B factors as the optimised parameters, where the weights depend on distance and bonding connectivity 71 . For hybrid models and pure pseudoatomic models, the absence of chemical bonds for the pseudomodel component necessitates a different strategy. Refinement is performed one cycle at a time, and each cycle is followed by spherical averaging of B factors within a 3 Å radius to enforce local smoothness and reduce the effective number of free parameters. In hybrid models, this averaging is restricted to the pseudoatomic chain(s) identified when constructing the hybrid model; coordinates belonging to explicit atomic chains are left unchanged except for their refined B factors. Pure pseudoatomic models lack valid chemical topology and are therefore refined in REFMAC with unconstrained refinement ( refi type unre ) while still applying the postcycle spherical averaging step described above. This additional keyword is not required for hybrid models. By default, the sequence of a single refinement cycle followed by local spherical averaging is repeated ten times; the number of iterations can be adjusted by the user. Independent half map refinement is performed in all cases and auto-matically monitored for overfitting. Symmetry Averaging If the input map has non- C 1 point group symmetry, reference maps simulated from pseudo-models or hybdrid models do not necessarily preserve the point group symmetry of the original map. To correct for this, symmetry averaging on the simulated density using a user-defined point group symmetry. The desired point group symmetry can be specified using the -sym command-line argument. Amplitude scaling with generalised radial profiles For each voxel position within the molecular envelope mask, cubic subvolumes are extracted both from the unmodified experimental map and from the corresponding reference map. The spherically averaged power spectra of these cubes are then compared, and the radial profile of the experimental cube is rescaled to match that of the reference cube. This procedure follows the principle of LocScale-1.0, but is extended to account for the use of pseudomodels and hybrid models. For voxels that lie within the FDR or difference mask corresponding to pseudoatomic regions, additional corrections are introduced to incorporate average scattering profiles. First, the frequency limits for applying these corrections are defined: the low-resolution limit corresponds to the transition from a continuous-volume description to a discrete i.i.d. distribution, estimated from the local molecular volume 35 , while the high-resolution limit is set by the half-map FSC. Within these limits, scattering amplitude deviations are computed by rescaling the scattering profile to the B factor of the reference profile, constructing an exponential fall-off function with the same B factor, and subtracting the scaled scattering amplitudes from this function. Finally, the computed deviations are added back to the reference radial profile within the relevant frequency range. This ensures that the local scaling not only matches the reference map but also reflects expected scattering behaviour in regions represented by pseudomodels. Monte Carlo (MC-EMmerNet) Network architecture We implemented a convolutional 3D U-Net, following a previous design 30 , 73 with several modifications ( Supplementary Figure S6a ; Table S6 ). The architecture consists of an encoder–decoder with skip connections, using strided convolutions for downsampling and transposed convolutions for upsampling. PReLU was chosen as the activation function throughout the network. Dataset The network was trained on cubic subvolumes extracted from average of unmodified EMDB-deposited half maps and their corresponding LocScale-2.0 reference maps. Cubes were 32 Å on each side and sampled from the training maps on a 24 Å grid. The dataset was derived from the DeepEMhancer map–model pairs 30 , excluding cases where reliable confidence masks could not be generated. Hybrid model maps were available for 114 entries, of which 89 were used for training and 14 for validation (86:14 split). A separate set of 11 maps was reserved for testing and uncertainty calibration. In addition, 24 EMDB additional maps were specifically selected from the EMDB to assess the ability of LocScale-2.0 to enhance contextual density and retain non-protein components. These examples were also used to validate pVDDT scores ( Supplementary Figure S7a–c,g–h ). Data augmentation Training cubes were classified as signal-or noise-containing based on the resampled confidence mask. A 4:1 ratio of signal to noise cubes was enforced. Data augmentation included random rotations (0–2 π ), sharpening or blurring corresponding to random B factors between 0 and 400 Å 2 , and Gaussian low-pass filtering. Training Input intensities were standardised to zero mean and standard deviation of 0.1, and maps were resampled to 1 Å per pixel. The Adam optimiser was used with a constant learning rate of 10 −4 , and mean absolute error (MAE) served as the loss function. Networks were trained for 15 epochs. Prediction At inference, maps were preprocessed identically to training data. Subvolumes of size 32 Å were extracted every 16 Å and restricted to the confidence mask region. A default batch size of 8 per GPU was used, with multi-GPU data parallelism handled via MirroredStrategy . Uncertainty estimates were obtained by enabling dropout during inference ( training=True ), yielding multiple stochastic forward passes. Voxel-wise means and standard deviations were computed across the ensemble. Overlapping cube predictions were merged using a weight matrix to reduce boundary artefacts. Final mean and standard deviation volumes were resampled to the original pixel size and saved as .mrc files. Uncertainty prediction Multiple stochastic forward passes (MC samples) are performed to generate a distribution of predictions. From these, the voxel-wise mean and variance are computed as follows: where Ŷ is the predictive mean, σ 2 is the predictive variance, and T is the number of MC samples. The mean and variance volumes are stored for each voxel in the map. During post-processing, these volumes are reintegrated into their original positions on the global grid and corrected for overlaps as described previously. Uncertainty calibration The uncertainty estimates from Monte Carlo dropout are typically uncalibrated and therefore not directly suitable for statistical inference without further adjustment 42 , 74 . In a perfectly calibrated regression model, the predicted uncertainties should match the expected residuals, defined as the absolute difference between the prediction and the true value. As shown in Supplementary Figure S6h , the raw uncertainties predicted via Monte Carlo dropout tend to be significantly smaller than the actual residuals. For a given voxel i , the prediction interval is defined as: where Ŷ i is the predicted mean, and σ i is the standard deviation estimated via Monte Carlo dropout. The constant z α is the z-score corresponding to a desired confidence level α . A well-calibrated model produces uncertainty estimates that correspond to empirical probabilities. Specifically, for any confidence level α ∈ [0, 1], the probability that the true value Y i lies within the interval defined by the predictive mean Ŷ i and scaled uncertainty ± z α σ i should be approximately α : In this study, we employ isotonic regression to calibrate the predicted uncertainties 43 , 75 by learning a monotonically increasing function ℐ that maps predicted standard deviations to expected residuals. The calibration procedure uses a set of N voxel-level predictions and their corresponding ground-truth values: Residuals are computed for each voxel as: For the set 𝒰 = { σ 1 , σ 2 , …, σ N } of predicted standard deviations from Monte Carlo dropout, the isotonic regression function ℐ is learned by minimizing the squared error between residuals and calibrated uncertainties: subject to: ℐ ( σ i ) ≤ ℐ ( σ i +1 ) for all i ∈ {1, 2, …, N − 1} The resulting function ℐ can then be applied to all predicted uncertainties to obtain calibrated standard deviations for statistical inference. For the calibration procedure, 11 maps from the test dataset were selected. For each map, a mean and variance map was generated via Monte Carlo dropout. The mean map was used as input to generate the corresponding LocScale map, serving as the ground-truth reference. Calibration was performed voxel-wise by extracting the predicted mean and variance from the MC-EMmerNet predictions and the baseline values from the LocScale maps. Since most voxels in a map correspond to background (i.e., regions with little or no signal), including them in the calibration process would bias the results and lead to underestimation of uncertainties. These background voxels typically exhibit very low predicted variance. However, simply discarding low-variance voxels is not trivial, as some signal-bearing voxels, particularly those with low intensity, also fall in this range. To address this, we apply a variance cutoff of 0.005: voxels with predicted variance below this threshold are excluded from the calibration process. While this introduces some miscalibration for low-intensity signal voxels, it significantly improves overall reliability. In practice, miscalibration tends to appear most prominently when low-threshold contours are used to visualize the feature-enhanced map. For consistent interpretation, we recommend using a contour threshold of 0.1 or higher when displaying predictions alongside pVDDT scores, as variances are well-calibrated in this range. Additionally, predicted variances are capped at a maximum value observed within the dataset. The isotonic regression model is also bounded accordingly: any input variance exceeding this cap is mapped to a fixed upper value. The effective calibration range is visualized in Supplementary Figure S6i . Within this valid range, the calibrated variance serves as a reliable estimate of prediction error. This calibration is essential for the statistical interpretation of voxel-wise deviations and facilitates the detection of regions where the predicted distribution significantly diverges from the experimental reference. Such regions can then be analyzed using standard hypothesis testing techniques. Relationship of pVDDT score and phase differences between feature-enhanced and baseline maps To evaluate voxel-wise significance of differences between predicted and baseline maps, we consider the data in Fourier space where density maps are represented by their series of Fourier coefficients. The structure factors of observed and predicted maps are: LocScale modifies the original observation by adjusting the amplitudes of its Fourier coefficients to match the radially averaged spectrum of the prediction while, within the scaling window, preserving their phases: with: The local Fourier-space difference between the prediction and amplitude-scaled observation is: This can be rearranged to highlight the role of phase and amplitude differences: Here, the first term reflects residual amplitude differences between Fourier coefficients and the second term captures phase differences. When amplitude matching is effective (i.e., | F pred ( s ) | ≈ k (∥ s ∥) | F obs ( s ) |), the first term becomes small, and the difference density depends primarily on the phase difference ( Supplementary Figure S6l,m ): The inverse discrete Fourier transform over the local window grid 𝒢 gives the real-space difference density: At the central voxel ( r = 0): This demonstrates that, under the condition that amplitude differences are small, the central voxel intensity of the local difference map is primarily determined by the accumulated phase differences between Fourier terms of predicted and unmodified maps across spatial frequencies. These differences manifest as measurable voxel intensity variations in real space that can be statistically evaluated, and justify the use of the intensity difference of the central voxel ρ diff (0) as a phase-sensitive metric. We use ρ diff (0), to compute a confidence metric based on a voxel-wise difference density test ( pVDDT ) score. A calibrated standard deviation σ cal is first assigned to each voxel of the predicted map using a learned uncertainty from the Monte Carlo dropout predictions. The voxel-wise z-score for the difference between predicted and baseline map is then computed as: Here, σ cal represents the expected difference between predicted and baseline densities. The z-score therefore measures how strongly the observed deviation exceeds this expectation. The probability of observing a z-score less than or equal to z 0 under the null hypothesis ℋ 0 : z 0 = 0 is given by: where Φ ( z ) is the cumulative distribution function of a standard normal distribution. To reflect both the magnitude and sign of the deviation in a bounded and interpretable scale, the result is linearly rescaled to the range [−100, 100]: Positive pvDDT score indicate voxels where predicted voxel intensity exceeds the baseline reference (possible overestimation), negative values indicate underestimation, and larger absolute values reflect greater statistical significance. Automated model building with ModelAngelo All ModelAngelo model building was done using ModelAngelo with default parameters. For each of the 50 map-model pairs in our ModelAngelo test dataset, FASTA files containing primary sequences of all complex components were pulled from the PDB. If applicable, protein and nucleic acid sequences were subsequently split over separate FASTA sequence files. For each model-map pair, ModelAngelo was run using both the EMDB-deposited map and LocScale-2.0 optimised map. To test the accuracy of sequence prediction, residue identities for each protein residue in the predicted structure were compared to that of the closest residue in the deposited PDB reference structure based on the coordinates of their respective C- α atoms. Recall statistics were then computed for all residues from each map-model pair in our dataset. Supplementary material Supplementary Figures Download figure Open in new tab Supplementary Fig. S1. Definition of pseudoatom placement and generation of hybrid models. (a) Illustration of pseudoatom placement for human γ -secretase (EMD-3061). The molecular envelope is estimated using FDR thresholding 52 , defined as the volume enclosed by a binarised mask computed from the confidence map at a 1% FDR threshold. When (partial) prior model information is available, a contextual structure mask is derived from the symmetric difference between the binarised model and envelope masks. Pseudoatoms are placed only within this difference mask and then merged with the prior atomic model. (b) Regression plots showing the number of pseudoatoms placed within the atomic model mask versus the expected number of atoms based on the known protein sequence, assuming hydrogenated and non-hydrogenated models. (c) Histogram of real-space correlation coefficients (RSCC) between FDR confidence masks and atomic model masks. Bars are colored by RSCC values below (RSCC 0.71, blue) the median. (N = 119 for panels b–c.) (d) Regression plots comparing molecular mass estimates derived from pseudoatom placements within the FDR mask to those from the primary sequence, for RSCC below and above the median. Download figure Open in new tab Supplementary Fig. S2. Pseudomodel generation and ADP refinement. (a) Example for pseudoatom placement and refinement for human γ -secretase (EMD-3061). Models are shown for the start (iteration 1) and end (iteration 50) of the positional refinement. The molecular boundary is outlined by a 1% FDR confidence mask. (b) Slab through the pseudomodel for both refinement iterations. (c) Radially averaged Fourier amplitudes of model maps computed throughout the iterations of pseudomodel refinement. Inset: Close-up of low-to-medium resolution region defining the overall molecular envelope. (d) Atomic displacement factors (ADP) mapped onto atomic coordinates shown for different snapshots across the ADP refinement cycles. (e) Evolution of model-to-map Fourier shell correlation (FSC) shown for a series of ADP refinement cycles. The insets shows the half-map validation displaying the average integrated FSC for work and test maps as a function of refinement cycle. Download figure Open in new tab Supplementary Fig. S3. Implementation and validation of pseudomodel ADP refinement. (a) ADP distribution mapped on the refined atomic model of human gamma secretase complex (PDB ID 5a63). (b) Scatter plot of atomic ADPs versus locally averaged pseudomodel ADPs for averaging radii of 2 Å (left) and 10 Å (right). (c) Relationship between neighborhood radius and ADP correlation coefficient for unrestrained and restrained ADP refinement of pseudomodels compared to atomic model refinement (top). Also shown are neighborhood radius correlation curves for pseudoatom clusters in ordered and disordered regions of the map. (d) Regression plot of atomic model vs. pseudomodel ADPs for γ -secretase (EMD-3061/PDB ID 5a63). (e) Left: ADP correlation as a function of neighbourhood radius plotted for 110 randomly selected map/model pairs from the EMDB (red: unrestrained pseudomodel ADP refinement; green: restrained pseudomodel ADP refinement; blue: atomic model ADPs). Right: Similarity of the ADP correlation curves to a reference curve derived from an atomic model. (f) Effect of neighbourhood-restrained ADP refinement of pseudoatoms shown after four ADP refinement cycles. Red circles outline the 3 Å averaging radius (left and middle). For comparison refined ADPs of an explicit atomic model (PDB ID 5a63) are also shown for the same map segment (right). (g) ADP restraints at the boundary of explicitly modelled and pseudoatom regions in hybrid reference models. The difference mask outlines the unmodelled density of a N-linked glycan. (h) ADP validation with toBvalid 39 for pseudomodels obtained for EMD-3061 and EMD-8702. Histograms shows distinguishable modes of the shifted inverse Γ distributions (EMD-3061: two modes; EMD-8702: three modes). Mapping the different modes back onto the pseudomodel reveals dinstinguishable clusters corresponding to well-resolved and poorly resolved/disordered regions (right). (i) Plot of Kolmogorov-Smirnov distances measuring the maximum distance between the empirical cumulative distribution function of the pseudoatom or atomic model ADP distributions and the cumulative distribution function of the theoretical gamma distribution for 110 randomly selected maps/models from the EMDB. Statistical significance is obtained from permutation tests with 1000 resamples. (j) α versus β 1 / 2 plots for bimodal fits to ADP distributions from atomic models (top) and pseudomodels (bottom). The red comet shows the smoothened unimodal distribution of α versus β 1 / 2 from empirical analysis of 45,000 PDB structures 39 . Download figure Open in new tab Supplementary Fig. S4. LocScale-2.0 map optimisation. (a) On-views and cross-sectional views of locally sharpened maps for in situ subtomogram averages of Mycoplasma pneumoniae 70S ribosomes (EMD-13234) using model-based sharpening with LocScale-1.0 (middle left), hybrid reference sharpening in LocScale-2.0 (middle right) and phenix.autosharpen (right). The author-deposited map is also shown (left). Arrows mark the mRNA entry point. (b) Side-by-side comparison of author-deposited and LocScale-2.0 maps for a well-resolved helical density segment from (a). (c) Unmodelled and partially interpretable regions of contextual structure highlighted in the LocScale-2.0 map. (d) Comparison of author-deposited and LocScale-2.0 sharpened maps for Klebsiella pneumoniae type II secretion system outer membrane complex (EMD-0193). (e) Comparison of author-deposited and LocScale-2.0 sharpened maps for Tweety homologue 2 (TTYH2, EMD-51108). (f) Unfiltered and low-pass filtered half maps in comparison to the hybrid LocScale map for ApoB100 (EMD-44469). Download figure Open in new tab Supplementary Fig. S5. Automated model building with LocScale-2.0 maps. (a,b) Aggregate statistics of the number of ModelAngelo-built residues for 50 randomly selected maps from the EMDB before and after pruning; residue numbers are not normalised for point group symmetry. 16 of these models (a) were not part of the Modelangelo training set, and 34 had been used in ModelAngelo training (b). (c) Selection of EMDB entries for which LocScale-2.0 maps support improvements in ModelAngelo model completion compared to the deposited maps. Residues and nucleotide bases additionally built in LocScale-2.0 maps are shown in red. (d) LocScale-2.0 map for Azospirillum brasilense glutamate synthase (EMDB: EMD-10106 ). (e) Automatically built models from ModelAngelo superposed on a selected map region indicated in (a) using the author-deposited map (left) and LocScale-2.0 map (right) as input. The full map was used for automated model building. (f) Sequence recall for ModelAngelo predictions using deposited or LocScale-2.0 maps for 16 models not part of the ModelAngelo training dataset. (g) Sequence recall for ModelAngelo predictions using deposited or LocScale-2.0 maps for 34 models that had been used in the ModelAngelo training dataset. (h-j) Sequence recall visualised in EMDB: EMD-0071/ PDB: 6gve . Two representative regions are shown, one of which (j) shows a coordinate shift in the LocScale-2.0 map. Download figure Open in new tab Supplementary Fig. S6. Monte Carlo Dropout and pVDDT scores. (a) 3D U-Net architecture of MC-EMmerNet. b) Spectral behaviour of MC-EMmerNet training measured by Fourier-Shell Correlation (FSC) of MC-EMmerNets test set prediction vs. target map as a function of training epoch. Low frequency information is rapidly learnt after a few epochs, while high frequency detail is learnt more gradually as observed by the slower convergence in the FSC curves at high frequencies. Predicted maps at selected epochs are shown. (c) Loss curves curves showing the evolution of training and validation losses. Due to the presence of dropouts in training the validation loss is lower than the training loss. (d) Average Fourier Shell correlation () in the Guinier region (0-0.1 Å -1 ) and Wilson region (>0.1 Å -1 ) measured vs. target map for the entire test set (N=11). (e) Central slices from 4 out of 15 samples generated by the MC-EMmerNet model using Monte Carlo dropout. The intensity distribution for the voxel highlighted in red is shown on the right. (f) Normality tests for all voxels in the sample cubes, with a histogram of the resulting p-values shown to the right. (g) Effect of the number of Monte Carlo samples on the change in prediction mean (top) and variance (bottom). (h) Reliability and calibration curves used to evaluate the uncertainty calibration. (i) Calibration curve from isotonic regression. (j) Feature-enhanced map (LocScale-FEM) for EMD-0282 colored by pVDDT scores, alongside DeepEMhancer and EMReady predictions. (k) Fourier phase correlation between the three deep learning models shown in (h) and the unmodified reference map. (l) Fourier amplitude correlation between predicted and target (hybrid LocScale-2.0) map for 11 EMDB entries with varying resolution between 3-6 Å. Shown are the mean correlations between 100 randomly selected signal cubes with their 95% confidence intervals. (m) Fourier phase correlation between predicted and unmodified (average of EMDB-deposited half maps) for 11 EMDB entries with varying resolution between 3-6 Å. Shown are the mean correlations between 100 randomly selected signal cubes with their 95% confidence intervals. Download figure Open in new tab Supplementary Fig. S7. Interpretation of LocScale-FEM maps. (a) LocScale-FEM map for EMDB: EMD-35691 ) shown at 0.15 contour level. A feature with strong positive pVDDT score is shown as close-up. The corresponding baseline map of the highlighted feature displayed at successively decreasing contour levels is also shown. (b) LocScale-FEM map for EMDB: EMD-17225 shown at 0.15 contour level. A feature with strong positive pVDDT score is shown as close-up. The corresponding baseline map of the highlighted feature displayed at successively decreasing contour levels is also shown. (c) LocScale-FEM maps for eigth random EMDB entries shown alingsude their baseline maps. The maps are sorted according to increasing variance in the pVDDT scores. (d) Comparison of optimised maps for subtomogram averages of the yeast COPII inner coat assembled on membrane tubules (EMDB: EMD-15949 ). The inset shows density for the membrane-embedded amphipathic helix of the Sar1 subunit in the LocScale-FEM map. (e) Comparison of maps for Apolipoprotein B-100/low-density lipoprotein (LDL) particles EMDB: EMD-44469 ). Contextual densities for liquid-crystalline cholesteryl esters are highlighted. (f) On-axis and cross-sectional views of author-deposited and optimised maps for E. coli respiratory complex I (EMDB: EMD-12654 . The peripheral antiporter subunit NuoL is highlighted. Download figure Open in new tab Supplementary Fig. S8. LocScale-FEM interpretation of small-molecule ligands. (a) Suppression of ordered lipid densities in Connexin 43 (EMDB: EMD-33394 ) in LocScale-FEM, DeepEMhancer and EMReady maps displayed at equivalent normalised thresholds. (b) Phenylethyl-β-D-thiogalactopyranoside (PETG) binding site in β-galactosidase (EMDB: EMD-7770 ) in LocScale-FEM, DeepEMhancer and EMReady maps displayed at equivalent normalised thresholds. PETG is shown in stick representation. (c) LocScale-FEM map of fragment-complexed human pyruvate kinase PKM (EMDB: EMD-10577 ). Close-ups show LocScale-FEM feature-enhanced and baseline maps of the ligand binding site. (d) LocScale-FEM map of fragment-complexed T. thermophilus complex I (EMDB: EMD-11231 ). Close-ups show LocScale-FEM feature-enhanced and baseline maps of the flavin mononucleotide/NADH site and an F 4 S 4 iron-sulfur cluster, respectively. (e) LocScale-FEM map of jasplakinolide-stabilised F-actin (EMDB: EMD-10366 ). Close-ups show LocScale-FEM feature-enhanced and baseline maps of the ADP site and an jasplakinolide binding sites, respectively. Supplementary Tables View this table: View inline View popup Download powerpoint Supplementary Table S1. Computation time for Hybrid LocScale-2.0 and LocScale-FEM optimisation View this table: View inline View popup Download powerpoint Supplementary Table S2. EMDB and PDB IDs for maps and models used for MC-EMmerNet training View this table: View inline View popup Download powerpoint Supplementary Table S3. EMDB and PDB IDs for maps and models used for MC-EMmerNet validation View this table: View inline View popup Download powerpoint Supplementary Table S4. EMDB and PDB IDs for maps and models used for testing and uncertainty calibration View this table: View inline View popup Download powerpoint Supplementary Table S5. EMDB and PDB IDs for maps and models in additional test dataset View this table: View inline View popup Download powerpoint Supplementary Table S6. Details of MC-EMmerNet architecture ACKNOWLEDGEMENTS We thank Keitaro Yamashita and Tom Burnley for valuable discussions, and Agnel Joseph for help with integrating LocScale-2.0 in CCP-EM Doppio. We are grateful to Ambroise Desfosses, Benedikt Junglas and the participants of the CCP-EM Icknield model building workshops for testing early versions of the method and for useful feedback. This work was supported by the European Research Council (ERC) under the European Union’s Horizon 2020 research and innovation programme (ERC-StG-852880 to AJ), the TU Delft AI initiative and the Collaborative Computational Project for Electron Cryo-Microscopy (CCP-EM). We also acknowledge the use of computational resources of the DelftBlue supercomputer provided by the Delft High Performance Computing Centre. Funder Information Declared European Research Council, https://ror.org/0472cxd90 , 852880 TU Delft AI Initiative Footnotes https://cryotud.github.io/locscale/ https://github.com/cryotud/locscale https://zenodo.org/records/8211668 Bibliography 1. ↵ E. Nogales and J. Mahamid . Bridging structural and cell biology with cryo-electron microscopy . Nature , 628 ( 8006 ): 47 – 56 , April 2024 . OpenUrl CrossRef PubMed 2. ↵ J. Hutchings and E. Villa . Expanding insights from in situ cryo-EM . Current Opinion in Structural Biology , 88 : 102885 , October 2024 . OpenUrl CrossRef PubMed 3. ↵ F. Waltz , R. D. Righetto , L. Lamm , T. Salinas-Giegé, R. Kelley , X. Zhang , M. Obr , S. Khavnekar , A. Kotecha , et al. In-cell architecture of the mitochondrial respiratory chain . Science , 387 ( 6740 ): 1296 – 1301 , March 2025 . OpenUrl CrossRef PubMed 4. C. E. Coupland , R. Karimi , S. A. Bueler , Y. Liang , G. M. Courbon , J. M. Di Trani , C. J. Wong , R. Saghian , J.-Y. Youn , L.-Y. Wang , et al. High-resolution electron cryomicroscopy of V-ATPase in native synaptic vesicles . Science (New York, N.Y .), 385 ( 6705 ): 168 – 174 , July 2024 . OpenUrl 5. ↵ J. Hutchings , V. G. Stancheva , N. R. Brown , A. C. M. Cheung , E. A. Miller and G. Zanetti . Structure of the complete, membrane-assembled COPII coat reveals a complex interaction network . Nature Communications , 12 ( 1 ): 2034 , April 2021 . OpenUrl PubMed 6. ↵ M. Reimund , A. D. Dearborn , G. Graziano , H. Lei , A. M. Ciancone , A. Kumar , R. Holewinski , E. B. Neufeld , F. J. O’Reilly , A. T. Remaley , et al. Structure of apolipoprotein B100 bound to the low-density lipoprotein receptor . Nature , 638 ( 8051 ): 829 – 835 , February 2025 . OpenUrl CrossRef PubMed 7. M. R. Leung , J. Zeng , X. Wang , M. C. Roelofs , W. Huang , R. Zenezini Chiozzi , J. F. Hevler , J. R. Heck , S. K. Dutcher , A. Brown , R. Zhang , et al. Structural specializations of the sperm tail . Cell , 186 ( 13 ): 2880 – 2896.e17 , June 2023 . OpenUrl CrossRef PubMed 8. ↵ L. Xue , S. Lenz , M. Zimmermann-Kogadeeva , D. Tegunov , P. Cramer , P. Bork , J. Rappsilber , et al. Visualizing translation dynamics at atomic detail inside a bacterial cell . Nature , 610 ( 7930 ): 205 – 211 , October 2022 . OpenUrl CrossRef PubMed 9. ↵ E. J. Verbeke , A. L. Mallam , K. Drew , E. M. Marcotte and D. W. Taylor . Classification of Single Particles from Human Cell Extract Reveals Distinct Structures . Cell Reports , 24 ( 1 ): 259 – 268.e3 , July 2018 . OpenUrl PubMed 10. C.-M. Ho , X. Li , M. Lai , T. C. Terwilliger , J. R. Beck , J. Wohlschlegel , D. E. Goldberg , A. W. P. Fitzpatrick , et al. Bottom-up structural proteomics: cryoEM of protein complexes enriched from the cellular milieu . Nature Methods , 17 ( 1 ): 79 – 85 , January 2020 . OpenUrl PubMed 11. ↵ C.-C. Su , M. Lyu , C. E. Morgan , J. R. Bolla , C. V. Robinson and E. W. Yu . A ‘Build and Retrieve’ methodology to simultaneously solve cryo-EM structures of membrane proteins . Nature Methods , 18 ( 1 ): 69 – 75 , January 2021 . OpenUrl PubMed 12. ↵ V. Zila , E. Margiotta , B. Turoňová , T. G. Müller , C. E. Zimmerli , S. Mattei , M. Allegretti , K. Börner , J. Rada , B. Müller , M. Lusic , H.- G. Kräusslich , et al. Cone-shaped HIV-1 capsids are transported through intact nuclear pores . Cell , 184 ( 4 ): 1032 – 1046.e18 , February 2021 . OpenUrl CrossRef PubMed 13. ↵ X. Zhang , S. Sridharan , I. Zagoriy , C. Eugster Oegema , C. Ching , T. Pflaesterer , H. K. H. Fung , I. Becher , I. Poser , C. W. Müller , A. A. Hyman , M. M. Savitski , et al. Molecular mechanisms of stress-induced reactivation in mumps virus condensates . Cell , 186 ( 9 ): 1877 – 1894.e27 , April 2023 . OpenUrl CrossRef PubMed 14. ↵ C. M. Palmer and C. H. S. Aylett . Real space in cryo-EM: the future is local . Acta Crystallo-graphica Section D Structural Biology , 78 ( 2 ): 136 – 143 , February 2022 . OpenUrl PubMed 15. R. J. Read , C. Millán , A. J. McCoy and T. C. Terwilliger . Likelihood-based signal and noise analysis for docking of models into cryo-EM maps . Acta Crystallographica Section D Structural Biology , 79 ( 4 ): 271 – 280 , April 2023 . OpenUrl PubMed 16. ↵ B. O. Forsberg , P. N. M. Shah and A. Burt . A robust normalized local filter to estimate compositional heterogeneity directly from cryo-EM maps . Nature Communications , 14 ( 1 ): 5802 , September 2023 . OpenUrl PubMed 17. ↵ P. B. Rosenthal and R. Henderson . Optimal Determination of Particle Orientation, Absolute Hand, and Contrast Loss in Single-particle Electron Cryomicroscopy . Journal of Molecular Biology , 333 ( 4 ): 721 – 745 , October 2003 . OpenUrl CrossRef PubMed Web of Science 18. ↵ A. J. Jakobi , M. Wilmanns and C. Sachse . Model-based local density sharpening of cryo-EM maps . eLife , 6 : e27131 , October 2017 . OpenUrl CrossRef PubMed 19. ↵ T. C. Terwilliger , O. V. Sobolev , P. V. Afonine and P. D. Adams . Automated map sharpening by maximization of detail and connectivity . Acta Crystallographica Section D: Structural Biology , 74 ( 6 ): 545 – 559 , June 2018 . OpenUrl PubMed 20. E. Ramírez-Aportela , J. L. Vilas , A. Glukhova , R. Melero , P. Conesa , M. Martínez , D. Maluenda , J. Mota , A. Jiménez , J. Vargas , R. Marabini , P. M. Sexton , J. M. Carazo , et al. Automatic local resolution-based sharpening of cryo-EM maps . Bioinformatics , 36 ( 3 ): 765 – 772 , February 2020 . OpenUrl CrossRef PubMed 21. ↵ A. Bharadwaj and A. J. Jakobi . Electron scattering properties of biological macromolecules and their use for cryo-EM map sharpening . Faraday Discussions , 240 ( 0 ): 168 – 183 , November 2022 . OpenUrl CrossRef PubMed 22. ↵ G. Cardone , J. B. Heymann and A. C. Steven . One number does not fit all: Mapping local variations in resolution in cryo-EM reconstructions . Journal of Structural Biology , 184 ( 2 ): 226 – 236 , November 2013 . OpenUrl CrossRef PubMed 23. A. Kucukelbir , F. J. Sigworth and H. D. Tagare . Quantifying the local resolution of cryo-EM density maps . Nature Methods , 11 ( 1 ): 63 – 65 , January 2014 . OpenUrl PubMed 24. J. L. Vilas , J. Gómez-Blanco , P. Conesa , R. Melero , J. Miguel de la Rosa-Trevín , J. Otón , J. Cuenca , R. Marabini , J. M. Carazo , J. Vargas , et al. MonoRes: Automatic and Accurate Estimation of Local Resolution for Electron Microscopy Maps . Structure , 26 ( 2 ): 337 – 344.e4 , February 2018 . OpenUrl CrossRef PubMed 25. ↵ K. Ramlaul , C. M. Palmer and C. H. S. Aylett . A Local Agreement Filtering Algorithm for Transmission EM Reconstructions . Journal of Structural Biology , 205 ( 1 ): 30 – 40 , January 2019 . OpenUrl CrossRef PubMed 26. ↵ M. Spiegel , A. K. Duraisamy and G.F. Schröder . Improving the visualization of cryo-EM density reconstructions . Journal of Structural Biology , 191 ( 2 ): 207 – 213 , August 2015 . OpenUrl CrossRef PubMed 27. ↵ T. C. Terwilliger , O. V. Sobolev , P. V. Afonine , P. D. Adams and R. J. Read . Density modification of cryo-EM maps . Acta Crystallographica Section D: Structural Biology , 76 ( 10 ): 912 – 925 , October 2020 . OpenUrl PubMed 28. ↵ D. Kimanius , G. Zickert , T. Nakane , J. Adler , S. Lunz , C.-B. Schönlieb , O. Öktem , et al. Exploiting prior knowledge about biological macromolecules in cryo-EM structure determination . IUCrJ , 8 ( 1 ): 60 – 75 , January 2021 . OpenUrl PubMed 29. ↵ M. A. Gilles and A. Singer . A molecular prior distribution for Bayesian inference based on Wilson statistics . Computer Methods and Programs in Biomedicine , 221 : 106830 , June 2022 . OpenUrl PubMed 30. ↵ R. Sanchez-Garcia , J. Gomez-Blanco , A. Cuervo , J. M. Carazo , C. O. S. Sorzano and J. Vargas . DeepEMhancer: a deep learning solution for cryo-EM volume post-processing . Communications Biology , 4 ( 1 ): 1 – 8 , July 2021 . OpenUrl CrossRef PubMed 31. J. He , T. Li and S.-Y. Huang . Improvement of cryo-EM maps by simultaneous local and non-local deep learning . Nature Communications , 14 ( 1 ): 3217 , June 2023 . OpenUrl PubMed 32. ↵ S. R. Maddhuri Venkata Subramaniya , G. Terashi and D. Kihara . Enhancing cryo-EM maps with 3D deep generative networks for assisting protein structure modeling . Bioinformatics , 39 ( 8 ): btad494 , August 2023 . OpenUrl PubMed 33. ↵ R. F. Berkeley , B. D. Cook and M. A. Herzik . Machine learning approaches to cryoEM density modification differentially affect biomacromolecule and ligand density quality . Frontiers in Molecular Biosciences , 11 , April 2024 . 34. ↵ R. J. Morris , E. Blanc and G. Bricogne . On the interpretation and use of ⟨|E|2⟩(d*) profiles . Acta Crystallographica Section D: Biological Crystallography , 60 ( 2 ): 227 – 240 , February 2004 . OpenUrl CrossRef PubMed 35. ↵ A. Singer . Wilson statistics: derivation, generalization and applications to electron cryomicroscopy . Acta Crystallographica Section A: Foundations and Advances , 77 ( 5 ): 472 – 479 , September 2021 . OpenUrl CrossRef 36. ↵ Y. Gal and Z. Ghahramani . Dropout as a Bayesian Approximation: Representing Model Uncertainty in Deep Learning . In Proceedings of The 33rd International Conference on Machine Learning , pages 1050 – 1059 . PMLR , June 2016 . ISSN: 1938-7228 . 37. ↵ M. Beckers , A. J. Jakobi and C. Sachse . Thresholding of cryo-EM density maps by false discovery rate control . IUCrJ , 6 ( 1 ): 18 – 33 , January 2019 . OpenUrl CrossRef PubMed 38. ↵ R. C. Masmaliyeva and G. N. Murshudov . Analysis and validation of macromolecular B values . Acta Crystallographica Section D: Structural Biology , 75 ( 5 ): 505 – 518 , May 2019 . OpenUrl PubMed 39. ↵ R. C. Masmaliyeva , K. H. Babai and G. N. Murshudov . Local and global analysis of macromolecular atomic displacement parameters . Acta Crystallographica Section D: Structural Biology , 76 ( 10 ): 926 – 937 , October 2020 . OpenUrl PubMed 40. ↵ A. A. Chernyatina and H. H. Low . Core architecture of a bacterial type II secretion system . Nature Communications , 10 ( 1 ): 5437 , November 2019 . OpenUrl PubMed 41. ↵ K. Jamali , L. Käll , R. Zhang , A. Brown , D. Kimanius and S. H. W. Scheres . Automated model building and protein identification in cryo-EM maps . Nature , 628 ( 8007 ): 450 – 457 , April 2024 . OpenUrl CrossRef PubMed 42. ↵ C. Guo , G. Pleiss , Y. Sun and K. Q. Weinberger . On calibration of modern neural networks . In Proceedings of the 34th International Conference on Machine Learning - Volume 70, ICML’17 , pages 1321 – 1330 , Sydney, NSW, Australia , August 2017 . JMLR.org. 43. ↵ V. Kuleshov , N. Fenner and S. Ermon . Accurate Uncertainties for Deep Learning Using Calibrated Regression , July 2018 . arxiv: 1807.00263 [cs]. 44. ↵ Q. Wu , J. Huang , X. Fan , K. Wang , X. Jin , G. Huang , J. Li , X. Pan , et al. Structural mapping of Nav1.7 antagonists . Nature Communications , 14 ( 1 ): 3224 , June 2023 . OpenUrl PubMed 45. ↵ J. Gutiérrez-Fernández , K. Kaszuba , G. S. Minhas , R. Baradaran , M. Tambalo , D. T. Gallagher , et al. Key role of quinone in the mechanism of respiratory complex I . Nature Communications , 11 ( 1 ): 4135 , August 2020 . OpenUrl PubMed 46. ↵ M. Saur , M. J. Hartshorn , J. Dong , J. Reeks , G. Bunkoczi , H. Jhoti , et al. Fragment-based drug discovery using cryo-EM . Drug Discovery Today , 25 ( 3 ): 485 – 490 , March 2020 . OpenUrl CrossRef PubMed 47. ↵ S. Pospich , F. Merino and S. Raunser . Structural Effects and Functional Implications of Phalloidin and Jasplakinolide Binding to Actin Filaments . Structure , 28 ( 4 ): 437 – 449.e5 , April 2020 . OpenUrl CrossRef 48. ↵ M. Obr , M. Percipalle , D. Chernikova , H. Yang , A. Thader , G. Pinke , D. Porley , L. M. Mansky , R. A. Dick , et al. Distinct stabilization of the human T cell leukemia virus type 1 immature Gag lattice . Nature Structural & Molecular Biology , 32 ( 2 ): 268 – 276 , February 2025 . OpenUrl PubMed 49. ↵ L. Dietrich , A.-N. A. Agip , C. Kunz , A. Schwarz and W. Kühlbrandt . In situ structure and rotary states of mitochondrial ATP synthase in whole Polytomella cells . Science , 385 ( 6713 ): 1086 – 1090 , September 2024 . OpenUrl CrossRef PubMed 50. ↵ J. Zivanov , J. Otón , Z. Ke , A. von Kügelgen , E. Pyle , K. Qu , D. Morado , D. Castaño-Díez , G. Zanetti , T. A. M. Bharat , J. A. G. Briggs , et al. A Bayesian approach to single-particle electron cryo-tomography in RELION-4.0 . eLife , 11 : e83724 , December 2022 . OpenUrl CrossRef PubMed 51. ↵ J. Hutchings , V. Stancheva , E. A. Miller and G. Zanetti . Subtomogram averaging of COPII assemblies reveals how coat organization dictates membrane shape . Nature Communications , 9 : 4154 , October 2018 . OpenUrl PubMed 52. ↵ M. Beckers , C. M. Palmer and C. Sachse . Confidence maps: statistical inference of cryo-EM maps . Acta Crystallographica Section D Structural Biology , 76 ( 4 ): 332 – 339 , April 2020 . OpenUrl PubMed 53. ↵ B. DeChristopher , S.-H. Park , L. Vong , D. Bamford , H.-H. Cho , R. Duvadie , A. Fedolak , C. Hogan , T. Honda , P. Pandey , O. Rozhitskaya , L. Su , E. Tomlinson , et al. Discovery of a small molecule RXFP3/4 agonist that increases food intake in rats upon acute central administration . Bioorganic & Medicinal Chemistry Letters , 29 ( 8 ): 991 – 994 , April 2019 . OpenUrl PubMed 54. ↵ Y. Chen , Q. Zhou , J. Wang , Y. Xu , Y. Wang , J. Yan , Y. Wang , Q. Zhu , F. Zhao , C. Li , C.-W. Chen , X. Cai , R. A. D. Bathgate , C. Shen , H. Eric Xu , D. Yang , H. Liu , et al. Ligand recognition mechanism of the human relaxin family peptide receptor 4 (RXFP4) . Nature Communications , 14 ( 1 ): 492 , January 2023 . OpenUrl PubMed 55. ↵ A. Bartesaghi , C. Aguerrebere , V. Falconieri , S. Banerjee , L. A. Earl , X. Zhu , N. Grigorieff , J. L. S. Milne , G. Sapiro , X. Wu , et al. Atomic Resolution Cryo-EM Structure of β-Galactosidase . Structure , 26 ( 6 ): 848 – 856.e3 , June 2018 . OpenUrl CrossRef PubMed 56. ↵ C. L. Lawson , A. Kryshtafovych , G. D. Pintilie , S. K. Burley , J. Černý , V. B. Chen , P. Emsley , Gobbi, A. Joachimiak , S. Noreng , M. G. Prisant , R. J. Read , J. S. Richardson , A. L. Rohou , B. Schneider , B. D. Sellers , C. Shao , E. Sourial , C. I. Williams , C. J. Williams , Y. Yang , V. Abbaraju , P. V. Afonine , M. L. Baker , P. S. Bond , T. L. Blundell , T. Burnley , A. Campbell , R. Cao , J. Cheng , G. Chojnowski , K. D. Cowtan , F. DiMaio , R. Esmaeeli , N. Giri , H. Grubmüller , S. W. Hoh , J. Hou , C. F. Hryc , C. Hunte , M. Igaev , A. P. Joseph , W.-C. Kao , D. Kihara , D. Kumar , L. Lang , S. Lin , S. R. Maddhuri Venkata Subramaniya , S. Mittal , A. Mondal , N. W. Moriarty , A. Muenks , G. N. Murshudov , R. A. Nicholls , M. Olek , C. M. Palmer , A. Perez , E. Pohjolainen , K. R. Pothula , C. N. Rowley , D. Sarkar , L. U. Schäfer , C. J. Schlicksup , G. F. Schröder , M. Shekhar , D. Si , A. Singharoy , O. V. Sobolev , G. Terashi , A. C. Vaiana , S. C. Vedithi , J. Verburgt , X. Wang , R. Warshamanage , M. D. Winn , S. Weyand , K. Yamashita , M. Zhao , M. F. Schmid , H. M. Berman , et al. Outcomes of the EMDataResource cryo-EM Ligand Modeling Challenge . Nature Methods , 21 ( 7 ): 1340 – 1348 , July 2024 . OpenUrl PubMed 57. ↵ H.-J. Lee , H. J. Cha , H. Jeong , S.-N. Lee , C.-W. Lee , M. Kim , J. Yoo , et al. Conformational changes in the human Cx43/GJA1 gap junction channel visualized using cryo-EM . Nature Communications , 14 ( 1 ): 931 , February 2023 . OpenUrl PubMed 58. ↵ B.-C. Wang . Resolution of phase ambiguity in macromolecular crystallography . In Methods in Enzymology, volume 115 of Diffraction Methods for Biological Macromolecules Part B , pages 90 – 112 . January 1985 . doi: 10.1016/0076-6879(85)15009-3 . OpenUrl CrossRef PubMed Web of Science 59. K. D. Cowtan and P. Main . Improvement of macromolecular electron-density maps by the simultaneous application of real and reciprocal space constraints . Acta Crystallographica Section D: Biological Crystallography , 49 ( 1 ): 148 – 157 , January 1993 . OpenUrl CrossRef PubMed Web of Science 60. ↵ T. C. Terwilliger . Reciprocal-space solvent flattening . Acta Crystallographica Section D: Biological Crystallography , 55 ( 11 ): 1863 – 1871 , November 1999 . OpenUrl CrossRef PubMed Web of Science 61. ↵ K. Y. J. Zhang and P. Main . Histogram matching as a new density modification technique for phase refinement and extension of protein molecules . Acta Crystallographica Section A: Foundations of Crystallography , 46 ( 1 ): 41 – 46 , January 1990 . OpenUrl CrossRef 62. ↵ K. Cowtan . Recent developments in classical density modification . Acta Crystallographica Section D: Biological Crystallography , 66 ( 4 ): 470 – 478 , April 2010 . OpenUrl CrossRef PubMed Web of Science 63. ↵ M. Minderer , J. Djolonga , R. Romijnders , F. Hubis , X. Zhai , N. Houlsby , D. Tran , et al. Revisiting the Calibration of Modern Neural Networks , October 2021 . arxiv: 2106.07998 [cs]. 64. B. Lakshminarayanan , A. Pritzel and C. Blundell . Simple and scalable predictive uncertainty estimation using deep ensembles . In Proceedings of the 31st International Conference on Neural Information Processing Systems, NIPS’17 , pages 6405 – 6416 , Red Hook, NY, USA , December 2017 . Curran Associates Inc . ISBN 978-1-5108-6096-4 . 65. ↵ C. Blundell , J. Cornebise , K. Kavukcuoglu and D. Wierstra . Weight Uncertainty in Neural Network . In Proceedings of the 32nd International Conference on Machine Learning , pages 1613 – 1622 . PMLR , June 2015 . ISSN: 1938-7228 . 66. ↵ I. Kuntz and W. Kauzmann . Hydration of Proteins and Polypeptides . In Advances in Protein Chemistry , volume 28 , pages 239 – 345 . 1974 . ISBN 978-0-12-034228-0 . doi: 10.1016/S0065-3233(08)60232-6 . OpenUrl CrossRef PubMed 67. ↵ P. G. Squire and M. E. Himmel . Hydrodynamics and protein hydration . Archives of Biochemistry and Biophysics , 196 ( 1 ): 165 – 177 , August 1979 . OpenUrl CrossRef PubMed Web of Science 68. ↵ L. Verlet . Computer “Experiments” on Classical Fluids. I. Thermodynamical Properties of Lennard-Jones Molecules . Physical Review , 159 ( 1 ): 98 – 103 , July 1967 . OpenUrl CrossRef Web of Science 69. ↵ L. G. Trabuco , E. Villa , K. Mitra , J. Frank and K. Schulten . Flexible fitting of atomic structures into electron microscopy maps using molecular dynamics . Structure (London, England: 1993) , 16 ( 5 ): 673 – 683 , May 2008 . OpenUrl CrossRef PubMed 70. ↵ M. Topf , K. Lasker , B. Webb , H. Wolfson , W. Chiu and A. Sali . Protein structure fitting and refinement guided by cryo-EM density . Structure (London, England: 1993) , 16 ( 2 ): 295 – 307 , February 2008 . OpenUrl CrossRef PubMed 71. ↵ G. N. Murshudov , P. Skubák , A. A. Lebedev , N. S. Pannu , R. A. Steiner , R. A. Nicholls , M. D. Winn , F. Long , et al. REFMAC5 for the refinement of macromolecular crystal structures . Acta Crystallographica Section D: Biological Crystallography , 67 ( 4 ): 355 – 367 , April 2011 . OpenUrl CrossRef PubMed Web of Science 72. ↵ K. Yamashita , C. M. Palmer , T. Burnley and G. N. Murshudov . Cryo-EM single-particle structure refinement and map calculation using Servalcat . Acta Crystallographica Section D: Structural Biology , 77 ( 10 ): 1282 – 1291 , October 2021 . OpenUrl PubMed 73. ↵ N. Navab , J. Hornegger , W. M. Wells and A. F. Frangi O. Ronneberger , P. Fischer and T. Brox . U-Net: Convolutional Networks for Biomedical Image Segmentation . In N. Navab , J. Hornegger , W. M. Wells and A. F. Frangi , editors, Medical Image Computing and Computer-Assisted Intervention – MICCAI 2015 , pages 234 – 241 , Cham , 2015 . Springer International Publishing . ISBN 978-3-319-24574-4 . doi: 10.1007/978-3-319-24574-4_28 . OpenUrl CrossRef PubMed 74. ↵ M.-H. Laves , S. Ihler , K.-P. Kortmann and T. Ortmaier . Calibration of Model Uncertainty for Dropout Variational Inference , June 2020 . arxiv: 2006.11584 [cs]. 75. ↵ N. Chakravarti . Isotonic Median Regression: A Linear Programming Approach . Mathematics of Operations Research , 14 ( 2 ): 303 – 308 , 1989 . OpenUrl CrossRef View the discussion thread. Back to top Previous Next Posted September 14, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Confidence-guided cryo-EM map optimisation with LocScale-2.0 Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Confidence-guided cryo-EM map optimisation with LocScale-2.0 Alok Bharadwaj , Reinier de Bruin , Arjen J. Jakobi bioRxiv 2025.09.11.674726; doi: https://doi.org/10.1101/2025.09.11.674726 Share This Article: Copy Citation Tools Confidence-guided cryo-EM map optimisation with LocScale-2.0 Alok Bharadwaj , Reinier de Bruin , Arjen J. Jakobi bioRxiv 2025.09.11.674726; doi: https://doi.org/10.1101/2025.09.11.674726 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Biophysics Subject Areas All Articles Animal Behavior and Cognition (7635) Biochemistry (17691) Bioengineering (13892) Bioinformatics (41937) Biophysics (21452) Cancer Biology (18588) Cell Biology (25504) Clinical Trials (138) Developmental Biology (13378) Ecology (19899) Epidemiology (2067) Evolutionary Biology (24320) Genetics (15609) Genomics (22506) Immunology (17736) Microbiology (40394) Molecular Biology (17181) Neuroscience (88605) Paleontology (666) Pathology (2832) Pharmacology and Toxicology (4824) Physiology (7641) Plant Biology (15156) Scientific Communication and Education (2045) Synthetic Biology (4294) Systems Biology (9825) Zoology (2271)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall: last seen: 2026-05-21T05:10:58.409756+00:00

License: CC-BY-4.0