Temporal windows of perceptual organization: Evidence from crowding and uncrowding

doi:10.1101/2025.07.14.664690

Temporal windows of perceptual organization: Evidence from crowding and uncrowding

2025 · doi:10.1101/2025.07.14.664690

preprint OA: closed

📄 Open PDF Full text JSON View at publisher

Full text 38,923 characters · extracted from preprint-html · click to expand

Temporal windows of perceptual organization: Evidence from crowding and uncrowding | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var 
i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Temporal windows of perceptual organization: Evidence from crowding and uncrowding View ORCID Profile Alessia Santoni , View ORCID Profile Luca Ronconi , View ORCID Profile Jason Samaha doi: https://doi.org/10.1101/2025.07.14.664690 Alessia Santoni 1 Department of Psychology, Vita-Salute San Raffaele University , Milan, Italy 2 Department of Psychology and Cognitive Sciences, University of Trento , Trento, Italy 3 Department of Psychology, University of California , Santa 
Cruz, California, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Alessia Santoni For correspondence: alessiasantoni6{at}gmail.com Luca Ronconi 2 Department of Psychology and Cognitive Sciences, University of Trento , Trento, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Luca Ronconi Jason Samaha 3 Department of Psychology, University of California , Santa Cruz, California, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Jason Samaha Abstract Full Text Info/History Metrics Preview PDF ABSTRACT Organizing visual input into coherent percepts requires dynamic grouping and segmentation mechanisms that operate across both spatial and temporal domains. While crowding disrupts target perception when nearby elements fall within the same spatial pooling window, specific flanker configurations can alleviate this effect through Gestalt-based grouping, a phenomenon known as uncrowding. Here, we examined the temporal dynamics underlying these spatial organization processes using a Vernier discrimination task. In Experiment 1, we varied stimulus duration and found that uncrowding emerged only after 160 ms, suggesting a time-consuming process. In Experiment 2, we manipulated the stimulus onset asynchrony (SOA) between the target and flankers. We found that presenting good-Gestalt flankers briefly before the target (as little as 32 ms) significantly boosted uncrowding, even in the absence of temporal overlap between the two stimuli. This effect was specific to conditions in which flankers preceded the target, ruling out pure temporal integration and masking accounts. These findings suggest that spatial segmentation can be dynamically facilitated when the temporal order of presentation allows grouping mechanisms to engage prior to target processing. 
Moreover, the observed time course indicates that segmentation is not purely feedforward, particularly for stimuli that are likely to recruit higher-level visual areas, pointing instead to the involvement of recurrent or feedback processes. INTRODUCTION In order to organize incoming sensory input, the visual system needs to identify and group elements across space, as well as integrate information across time. This dual challenge is central to defining coherent and meaningful perceptual units, yet the mechanisms that support it remain only partially understood. In the spatial domain, the presence of nearby elements in the visual scene can impair target perception, a phenomenon known as crowding. Crowding is a pervasive feature of visual processing, occurring across different levels of stimulus complexity, from simple Gabor patches to alphanumeric characters and natural scenes (e.g., Bernard & Chung, 2011 ; Ringer et al., 2021 ; Ronconi et al., 2016 ; Tanriverdi & Cornelissen, 2024 ). Previous research has identified object spacing as the key factor driving crowding: when the distance between target and flankers falls below an observer’s critical spacing at that retinal location, crowding is likely to occur. This principle, originally described by Herman Bouma in 1970, has since become known as “Bouma’s law” (Bouma, 1970; Pelli & Tillman, 2008). Additionally, the strength of crowding is shaped by flanker-target similarity, with target identification errors often reflecting either a bias toward flanker features or mislocalization of the target relative to the flankers ( Bernard & Chung, 2011 ; Põder & Wagemans, 2007 ; Zahabi & Arguin, 2014 ). This and other evidence have contributed to the view that crowding reflects a perceptual bottleneck, arising from feature integration or pooling within spatial regions defined by receptive field sizes in the feedforward visual hierarchy (for a comprehensive characterization of models of crowding refer to Pelli, 2008 ). 
This account of crowding has been challenged in the past decade by a notable exception in which specific flanker configurations alleviate the otherwise detrimental effects of crowding. This effect, known as uncrowding , is often attributed to Gestalt grouping principles, whereby flanking elements are perceptually organized into unitary structures based on their features ( Malania et al., 2007 ; Manassi et al., 2012 , 2013 ; Sayim et al., 2010 ). The spatial arrangement of flankers determines whether they are perceived as part of a unified object with the target or as separate elements, affecting the degree of crowding accordingly ( Livne & Sagi, 2007 ; Saarela et al., 2010 ; Tiurina et al., 2022 ). Unlike crowding, which has been often considered an early, feedforward limitation, uncrowding may reflect a time-dependent process of perceptual organization emerging through recurrent or integrative mechanisms over time ( Herzog et al., 2015 ; Manassi & Whitney, 2018 ). In the temporal domain, crowding effects can still be observed when flankers are not presented simultaneously to the target. For example, Huckauf and Heller (2004) manipulated the stimulus onset asynchrony (SOA) between target and flanker letters and found that strong crowding effects emerged at short temporal delays, and persisted even when target and flankers were separated by longer time-windows of ±150 ms. However, a precise temporal characterization of uncrowding is still lacking. Sayim and colleagues (2014) investigated the interaction between backward masking (i.e., when the target precedes the flankers) and (un)crowding by manipulating both the appearance of the flankers and the SOA between target and flankers. They found that flankers can produce type-B backward masking, with the greatest performance impairments occurring at SOAs of approximately 40-60 ms, depending on stimulus characteristics. 
Notably, the study did not reveal any perceptual advantage when flankers formed a good Gestalt (e.g., cuboids) compared to typical crowding-inducing flankers (e.g., vertical lines), suggesting that Gestalt-based representations may require additional time to emerge and be the results of higher-level feedback mechanisms ( Sayim et al., 2014 ). This interpretation is also supported by recent results by Morea and colleagues (2025) , who showed that while uncrowding effects typically emerged only after 160 ms under standard simultaneous presentation, even a brief 20 ms preview of the good-Gestalt flankers prior to the full flanker-target display significantly improved Vernier discrimination performance. The aim of the present study is to investigate temporal dynamics underlying spatio-temporal organization in visual perception. To characterize the temporal dynamics of crowding and uncrowding, we conducted two experiments using a Vernier discrimination task. In the first study, we manipulated stimulus duration while presenting flankers known to elicit either crowding or uncrowding effects. In the second study, we introduced a temporal delay between the flankers and the target Vernier stimulus, such that flankers (inducing either crowding or uncrowding) could appear before or after the target. This design allowed us to systematically map both the directionality and timing of uncrowding effects. Our results first replicated previous findings showing that grouping effects typically emerge relatively slowly. However, this delay was drastically reduced when flankers were presented before the target. We interpret these findings in light of feedback or recurrent mechanisms, suggesting that early presentation of the flankers pre-activates these processes, leading to a marked reduction in the time required for the uncrowding benefit to emerge. METHODS Participants 24 participants were recruited from the University of California, Santa Cruz community. 
Two participants were excluded due to uncorrected visual impairments, resulting in a final sample of 22 participants (mean age = 22 years, range: 18-35 years). The final sample included 16 individuals who identified as female, 5 as male, and 1 as non-binary. Participants received university research credits as compensation, if interested. The study was approved by the Institutional Review Board at the University of California, Santa Cruz. All participants performed two experiments, the order of which was counterbalanced across participants. Apparatus and stimuli Participants were seated in a dimly lit room at a viewing distance of 75 cm, maintained with a chinrest, and completed two tasks, each lasting approximately 25 minutes. Stimuli were presented through PsychToolbox 3 ( Brainard, 1997 ) for MATLAB ( The MathWorks Inc., 2022 ) on a black background on a VIEWPixx/EEG monitor with a 120 Hz refresh rate. Stimulus luminance was set to 80 cd/m². In a Vernier discrimination task, Vernier targets consisted of two vertical lines, with a slight horizontal offset in the lower line. Following an intertrial interval (ITI) of 500 ms (±250 ms jitter), Vernier stimuli were randomly presented either to the left or right of the central fixation dot. The center of the stimulus was positioned 4 degrees of visual angle (DVA) from fixation, and participants were instructed to maintain central fixation throughout the trial. The two vertical lines composing the Vernier stimulus measured 40 arcminutes (′) in length each and were separated by a vertical gap of 4′. The horizontal offset between the two lines was set to 1′, and offset direction was randomized across trials. Across three experimental blocks, Vernier stimuli were presented either in isolation (baseline condition) or flanked by additional elements (illustrated in Figure 1A ). Flankers, when present, were presented symmetrically to the Vernier stimulus along the horizontal axis at a distance of 16′. 
Flankers could be either vertical lines (44′ in length) or rectangular flankers (44′ tall × 116′ wide), previously shown to elicit crowding and uncrowding effects, respectively ( Manassi et al., 2012 ). Participants were instructed to indicate the direction of the offset of the lower line relative to the upper line by pressing “M” (right) or “Z” (left) on the keyboard. Download figure Open in new tab Figure 1. A) Stimuli used in the Vernier discrimination task; Vernier stimuli were either presented in isolation (baseline condition) or flanked by lines or rectangles across separate blocks of trials. B) Schematic representation of Experiment 2. A temporal delay was introduced between the flankers and the Vernier target, such that flankers either preceded (left panel) or followed (right panel) the Vernier. Stimuli are enlarged for illustrative purposes. On each trial, stimuli were randomly presented to the left or right of a central fixation point. C-D) Results from experiment 1 and 2 show that the uncrowding effect emerges around 160 ms when stimuli are presented simultaneously, but at a SOA of 32 ms when flankers precede Verniers. Asterisks represent p -values from t-tests comparing accuracy for flanker shape (lines vs. rectangles). Error bars represent standard error of the mean (SEM). E) Pearson’s correlations between accuracy in study 1 and 2, across conditions (left panel: line flanker blocks, right panel: rectangular flanker blocks). Dots represent individual subjects; grey shaded areas represent 95% confidence intervals. * p FDR < .05, ** p FDR < .01. Procedure Experiment 1 Participants were asked to report the offset direction of the Vernier stimulus, while stimulus duration was manipulated along the following values: 32, 64, 80, 96, 128, 160, or 200 ms. Vernier and flanker stimuli were always presented simultaneously. The task included a total of 588 trials: 196 baseline trials and 196 trials for each flanker shape (lines and rectangles). 
Experiment 2 Participants performed a Vernier discrimination task where the duration of both the Vernier and flanker stimuli was fixed at 40 ms. However, target and flanker stimuli were either presented simultaneously (i.e., a SOA of 0 ms) or with a variable SOA, randomly selected from ±32, ±64, ±80, ±96, ±128, or ±160 ms ( Figure 1B ). Negative SOA values indicate trials in which the flankers preceded the Vernier stimulus, whereas positive SOA values indicate trials in which the flankers followed the Vernier stimulus. The task included a total of 616 trials: 56 baseline trials and 280 trials for each flanker shape (lines and rectangles). For both experiments, participants completed three separate blocks of trials: one for the baseline condition (no flankers), one with line flankers, and one with rectangle flankers. Block order was counterbalanced across participants. Before each experiment, participants completed 20 practice trials with feedback to familiarize themselves with the procedure. Statistical analyses For experiment 1, we investigated the effect of stimulus duration on Vernier discrimination. With this aim, stimulus duration (seven levels: 32, 64, 80, 96, 128, 160, and 200 ms) and flanker shape (lines vs. rectangles) were input as within-subject factors in a two-way repeated-measures ANOVA on accuracy data. For experiment 2, a two-way repeated-measures ANOVA was conducted on accuracy data to examine the interaction between flanker shape (lines vs. rectangles) and stimulus SOA (twelve levels: ±32, ±64, ±80, ±96, ±128, ±160 ms). Sphericity was assessed using Mauchly’s test, and Greenhouse-Geisser correction was applied where necessary. For each ANOVA, post hoc t-tests were performed to further investigate the relationship between flanker shape and either stimulus duration or SOA. In the second experiment, additional post hoc t-tests were conducted to compare accuracy at same-magnitude positive and negative SOAs, for each flanker shape separately. 
False Discovery Rate (FDR; Benjamini & Hochberg, 1995 ) was used to control for the family-wise type-I error rate across multiple comparisons. Accuracy data from the baseline condition were not included in the ANOVAs; instead, they were examined to ensure that participants performed above chance level. Finally, Pearson’s correlation analyses were conducted to assess whether individual accuracy scores (averaged for stimulus duration/SOA level) based on flanker shape were related across the two tasks. RESULTS Experiment 1 Results from experiment 1 are depicted in Figure 1C . A two-way repeated-measures ANOVA was conducted to examine the effects of stimulus duration (seven levels: 32, 64, 80, 96, 128, 160, and 200 ms) and flanker shape (lines vs. rectangles) on Vernier discrimination accuracy. The analysis revealed a significant main effect of stimulus duration, F (3.47, 72.80) = 8.12, p < .001, and a significant main effect of flanker shape, F (1, 21) = 6.63, p = .018. Importantly, the analysis showed a significant interaction between stimulus duration and flanker shape, F (4.60, 96.60) = 2.51, p = .039, suggesting that the effect of duration on accuracy differed between the two flanker shapes. Post hoc pairwise comparisons conducted between the two flanker shapes at each stimulus duration revealed significantly higher accuracy in the presence of rectangular flankers compared to flanker lines at 160 ms, t (21) = -2.77, p FDR = .040, and 200 ms, t (21) = -2.83, p FDR = .040. No significant differences were found at shorter durations (32–128 ms; all ps > .08). Experiment 2 Results from experiment 2 are depicted in Figure 1D . The repeated-measures ANOVA on flanker shape (lines vs. rectangles) and SOA (twelve levels: ±32, ±64, ±80, ±96, ±128, ±160 ms) revealed a significant main effect of SOA, F (6.87, 144.24) = 32.96, p < .001, and a significant main effect of flanker shape, F (1, 21) = 22.88, p < .001. 
A significant interaction between SOA and flanker shape was found, F (7.69, 161.64) = 3.00, p = .004. Post hoc tests comparing accuracy for flanker shapes at each SOA revealed significantly higher accuracy for rectangular flankers at negative SOAs of -128 ms ( t (21) = -3.99, p FDR = .003), -96 ms ( t (21) = -3.70, p FDR = .004), -80 ms ( t (21) = -4.65, p FDR < .001), -64 ms ( t (21) = -3.38, p FDR = .006), and -32 ms ( t (21) = -3.37, p FDR = .006), as well as at the positive SOA of 160 ms ( t (21) = -4.64, p FDR < .001). No significant differences were found at the remaining SOAs (all ps > .10). Post hoc t-tests revealed that Vernier accuracy significantly differed between negative and positive SOAs of the same magnitude across all SOA levels when rectangular flankers were presented, at 160 ms ( t (21) = 3.82, p FDR = .002), 128 ms ( t (21) = 3.57, p FDR = .002), 96 ms ( t (21) = 3.57, p FDR = .002), 80 ms ( t (21) = 6.81, p FDR < .001), 64 ms ( t (21) = 4.50, p FDR = .001), and 32 ms ( t (21) = 3.21, p FDR = .004). The same post hoc t-tests performed when line flankers were presented only revealed a significant difference at 160 ms ( t (21) = 5.68, p FDR < .001), with no significant differences at the other SOA magnitudes (all ps > .15). Correlations Accuracy scores averaged for stimulus duration/SOA level across the two experiments were positively correlated for both line flanker blocks ( r (20) = 0.61, p = .003) and rectangular flanker blocks ( r (20) = 0.48, p = .025), indicating that the two tasks successfully measured related processes ( Figure 1E ). DISCUSSION Perception depends on dynamic grouping and segmentation processes that unfold across both space and time. Here, we extended previous work by examining the time course of spatial segmentation using a Vernier discrimination paradigm known to produce strong crowding and uncrowding effects depending on the flanker configuration. 
Rectangular flankers, in particular, have been shown to alleviate crowding compared to simple vertical lines, as they are perceptually grouped into a single unit under Gestalt principles ( Herzog et al., 2015 ; Manassi et al., 2012 ). While earlier studies have largely focused on how flanker properties influence spatial grouping (see, e.g., Manassi et al., 2012 , 2013 ), our focus was on when these effects emerge during stimulus processing. In our first experiment, we mapped the timeframe of the uncrowding benefit by varying stimulus duration across a broad range (32 to 200 ms) and found that uncrowding emerged only when the stimulus was presented for at least 160 ms. This aligns with recent findings by Morea et al. (2025) , who reported uncrowding at 160 ms but not at 20 ms, though their study included only two durations. By sampling more densely across time, our results confirm and extend their observation, suggesting that spatial segmentation and grouping build up over time, likely via either recurrent or feedback processing ( Herzog et al., 2015 ). However, a difference from previous studies is that in our paradigm, stimulus location was randomized across hemifields, minimizing stimulus expectancy and preparatory spatial attention. Despite this, we observed that the same temporal window was necessary for uncrowding to emerge, indicating that the time course of spatial segmentation is likely not contingent on stimulus location predictability. While our first experiment confirmed that spatial organization unfolds over relatively long timescales, our second experiment demonstrated that when flankers precede the target, the uncrowding effect emerges more rapidly. In this experiment, we systematically varied the SOA between the Vernier and the flankers, both presented for 40 ms, across a broad temporal range. 
First, we showed that even when flankers and Verniers are not presented simultaneously, crowding and uncrowding effects are still observed, demonstrating the temporal extent of spatial segmentation mechanisms. Furthermore, we found uncrowding benefits emerging at SOAs as early as 32 ms and persisting up to 128 ms when flankers preceded the target. Beyond this point, the temporal separation between the two stimuli was large enough that the temporal crowding effect was minimal to begin with. At an SOA of -32 ms, assuming temporal integration between flankers and Vernier, the total visual stimulation amounts to 72 ms, about half the presentation duration expected to elicit uncrowding under the condition of our first experiment. This suggests that Gestalt-based uncrowding can emerge much faster than previously thought when there is a brief temporal offset between the flanker and target. Moreover, while an SOA of -32 ms involved an 8 ms temporal overlap between flankers and the Vernier, similar uncrowding effects were also observed at longer negative SOAs without any overlap (i.e., SOAs ≤ -64 ms). For example, even at an SOA of -128 ms, corresponding to an 88 ms gap between flanker offset and Vernier onset, significant uncrowding still occurred. This highlights the temporal stability of Gestalt grouping, which can alleviate crowding of subsequent targets even after a substantial delay. The task manipulation introduced in this second experiment allows us to investigate Temporal Integration Windows (TIWs) across different perceptual conditions; for example, we show that uncrowding stimuli define a narrower TIW as compared to crowding stimuli (see the width of the curve in Figure 1D ). However, it is important to note that the observed uncrowding benefits cannot be solely attributed to temporal integration mechanisms. 
Indeed, this effect was specific to negative SOAs (i.e., when flankers preceded the target), implicating rapid preview mechanisms that extend beyond simple temporal integration of the two stimuli. If temporal integration were the only mechanism at play, the uncrowding benefit should have been comparable for positive and negative SOAs of equal magnitude. On the other hand, our results are also only partially compatible with masking mechanisms. Asymmetries between forward and backward masking are well-documented, with backward masking typically exerting a stronger disruptive effect on perception ( Enns & Di Lollo, 2000 ). However, our findings show that crowding strength was comparable for positive and negative SOAs of equal magnitude when presenting crowding stimuli (with the exception of the SOA equal to 160 ms). According to the masking account, backward masking effects are often interpreted as arising from temporally delayed feedback from higher- to lower-level visual processes, which can disrupt the perception of the target stimulus ( Di Lollo et al., 2000 ). In line with this idea, Huckauf and Heller (2004) showed that crowding was reduced when targets were followed by letter-like nonletters as opposed to letter flankers. They attributed this effect to reduced top-down activation: since letter-like nonletters engage the letter level more weakly, they generate less feedback to early visual areas, thereby weakening the crowding effect. Additional results investigating backward masking and stimulus configurations come from Sayim et al. (2014) , where the authors reported stronger masking at SOAs around 40-60 ms (i.e., type-B masking) regardless of flanker configuration (i.e., flankers could be either lines or cuboids). 
This lack of uncrowding effect for backward masking is consistent with our results at positive SOAs, further corroborating the idea that Gestalt representations might operate on feedback processes that require additional processing time ( Wagemans et al., 2012 ). However, in our study, performance was maximally impaired at short and zero SOAs, rather than intermediate SOAs as in Sayim et al. (2014). Taken together, we suggest that when flankers form good Gestalts, spatial grouping processes can rapidly segment flankers from targets and do so even in the absence of temporal overlap between the stimuli. It has been previously hypothesized that crowding occurs when stimuli fall within the same processing stage ( Manassi & Whitney, 2018 ). In this view, pre-activating relevant Gestalt structures may engage top-down/lateral spatial segmentation mechanisms that facilitate subsequent target processing. In contrast, when the target preceded the flankers, no such advantage was observed, further arguing against a purely masking-based account. Importantly, our conclusions about the involvement of feedback or recurrent mechanisms are likely to apply specifically to the relatively complex flanker configurations used in our paradigm, which presumably engage higher-level visual areas responsible for spatial grouping across objects and shapes. It remains an open question whether similar temporal dynamics would be observed with simpler stimuli that rely predominantly on early visual processing stages, where crowding might still arise from more purely feedforward mechanisms. Finally, it is possible that exogenous attention contributed to the behavioral improvement observed at negative SOAs compared to their positive counterparts. Previous studies have shown that both endogenous and exogenous attention can modulate the strength of crowding ( Gong et al., 2024 ; Kewan-Khalayly & Yashar, 2022 ; Yeshurun & Carrasco, 1999 ). 
However, the timeline of our fastest stimuli is not entirely compatible with mechanisms of exogenous attention, which tend to emerge around 100 ms after cue onset ( Carrasco, 2011 ; Egeth & Yantis, 1997 ). At any rate, it is reasonable to assume that any potential attentional effects in our paradigm were equally present in the two flanker configurations and therefore cannot fully account for the uncrowding effects observed here. CONCLUSIONS Our results demonstrate that spatial segmentation, though relatively slow under standard uncrowding conditions, can be significantly accelerated when uncrowding flankers are presented prior to the target stimulus. We interpret this finding as evidence that a rapid presentation of the flankers, even for just tens of milliseconds, facilitates the emergence of Gestalt-based benefits by initiating grouping mechanisms that have a sustained impact on subsequent target perception. In turn, these results offer further support for the idea that spatial segmentation and grouping can be mediated by recurrent or feedback processing in the case of relatively complex configurations that likely engage higher-level visual areas. ACKNOWLEDGMENTS We would like to thank Michael Herzog and Martina Morea for the helpful discussions. We also thank Emily Lincoln, Vrishab Nukala and Gaia Minari for their help in data collection. The present work was performed by A.S. in fulfilment of the requirements for obtaining the PhD degree at Vita-Salute San Raffaele University, Milan, Italy. REFERENCES ↵ Benjamini , Y. , & Hochberg , Y. ( 1995 ). Controlling the false discovery rate: A practical and powerful approach to multiple testing . Journal of the Royal statistical society: series B (Methodological) , 57 ( 1 ), 289 – 300 . OpenUrl CrossRef PubMed Web of Science ↵ Bernard , J.-B. , & Chung , S. T. L. ( 2011 ). The dependence of crowding on flanker complexity and target-flanker similarity . Journal of Vision , 11 ( 8 ), 1 – 1 . 
doi: 10.1167/11.8.1 OpenUrl Abstract / FREE Full Text ↵ Brainard , D. H. ( 1997 ). The psychophysics toolbox . Spatial vision , 10 ( 4 ), 433 – 436 . OpenUrl CrossRef PubMed Web of Science ↵ Carrasco , M. ( 2011 ). Visual attention: The past 25 years . Vision Research , 51 ( 13 ), 1484 – 1525 . doi: 10.1016/j.visres.2011.04.012 OpenUrl CrossRef PubMed Web of Science ↵ Di Lollo , V. , Enns , J. T. , & Rensink , R. A. ( 2000 ). Competition for consciousness among visual events: The psychophysics of reentrant visual processes . Journal of Experimental Psychology: General , 129 ( 4 ), 481 – 507 . doi: 10.1037/0096-3445.129.4.481 OpenUrl CrossRef PubMed Web of Science ↵ Egeth , H. E. , & Yantis , S. ( 1997 ). VISUAL ATTENTION: Control, Representation, and Time Course . Annual Review of Psychology , 48 ( 1 ), 269 – 297 . doi: 10.1146/annurev.psych.48.1.269 OpenUrl CrossRef PubMed Web of Science ↵ Enns , J. T. , & Di Lollo , V. ( 2000 ). What’s new in visual masking? Trends in Cognitive Sciences , 4 ( 9 ), 345 – 352 . doi: 10.1016/S1364-6613(00)01520-5 OpenUrl CrossRef PubMed Web of Science ↵ Gong , M. , Liu , T. , Chen , Y. , & Sun , Y. ( 2024 ). Dissociable Effects of Endogenous and Exogenous Attention on Crowding: Evidence from Event-Related Potentials . Brain Sciences , 14 ( 10 ), 956 . doi: 10.3390/brainsci14100956 OpenUrl CrossRef PubMed ↵ Herzog , M. H. , Sayim , B. , Chicherov , V. , & Manassi , M. ( 2015 ). Crowding, grouping, and object recognition: A matter of appearance . Journal of Vision , 15 ( 6 ), 5 . doi: 10.1167/15.6.5 OpenUrl Abstract / FREE Full Text ↵ Huckauf , A. , & Heller , D. ( 2004 ). On the relations between crowding and visual masking . Perception & Psychophysics , 66 ( 4 ), 584 – 595 . doi: 10.3758/BF03194903 OpenUrl CrossRef PubMed ↵ Kewan-Khalayly , B. , & Yashar , A. ( 2022 ). The role of spatial attention in crowding and feature binding . Journal of Vision , 22 ( 13 ), 6 . doi: 10.1167/jov.22.13.6 OpenUrl CrossRef PubMed ↵ Livne , T. 
, & Sagi, D. (2007). Configuration influence on crowding. Journal of Vision, 7(2), 4. doi: 10.1167/7.2.4 OpenUrl Abstract / FREE Full Text ↵ Malania, M., Herzog, M. H., & Westheimer, G. (2007). Grouping of contextual elements that affect vernier thresholds. Journal of Vision, 7(2), 1. doi: 10.1167/7.2.1 OpenUrl Abstract / FREE Full Text ↵ Manassi, M., Sayim, B., & Herzog, M. H. (2012). Grouping, pooling, and when bigger is better in visual crowding. Journal of Vision, 12(10), 13–13. doi: 10.1167/12.10.13 OpenUrl Abstract / FREE Full Text ↵ Manassi, M., Sayim, B., & Herzog, M. H. (2013). When crowding of crowding leads to uncrowding. Journal of Vision, 13(13), 10–10. doi: 10.1167/13.13.10 OpenUrl Abstract / FREE Full Text ↵ Manassi, M., & Whitney, D. (2018). Multi-level Crowding and the Paradox of Object Recognition in Clutter. Current Biology, 28(3), R127–R133. doi: 10.1016/j.cub.2017.12.051 OpenUrl CrossRef PubMed ↵ Morea, M., Herzog, M. H., Francis, G., & Manassi, M. (2025). Dynamics of vision: Grouping takes longer than crowding. [Preprint] doi: 10.31234/osf.io/wd4yj_v2 OpenUrl CrossRef ↵ Pelli, D. G. (2008). Crowding: A cortical constraint on object recognition. Current Opinion in Neurobiology, 18(4), 445–451. OpenUrl CrossRef PubMed Web of Science ↵ Põder, E., & Wagemans, J. (2007). Crowding with conjunctions of simple features. Journal of Vision, 7(2), 23. doi: 10.1167/7.2.23 OpenUrl Abstract / FREE Full Text ↵ Ringer, R. V., Coy, A. M., Larson, A. M., & Loschky, L. C. (2021). Investigating Visual Crowding of Objects in Complex Real-World Scenes. I-Perception, 12(2), 2041669521994150. doi: 10.1177/2041669521994150 OpenUrl CrossRef PubMed ↵ Ronconi, L., Bertoni, S., & Bellacosa Marotti, R. (2016). The neural origins of visual crowding as revealed by event-related potentials and oscillatory dynamics. Cortex, 79, 87–98.
doi: 10.1016/j.cortex.2016.03.005 OpenUrl CrossRef ↵ Saarela, T. P., Westheimer, G., & Herzog, M. H. (2010). The effect of spacing regularity on visual crowding. Journal of Vision, 10(10), 17–17. doi: 10.1167/10.10.17 OpenUrl Abstract / FREE Full Text ↵ Sayim, B., Manassi, M., & Herzog, M. (2014). How color, regularity, and good Gestalt determine backward masking. Journal of Vision, 14(7), 8–8. doi: 10.1167/14.7.8 OpenUrl Abstract / FREE Full Text ↵ Sayim, B., Westheimer, G., & Herzog, M. H. (2010). Gestalt Factors Modulate Basic Spatial Vision. Psychological Science, 21(5), 641–644. doi: 10.1177/0956797610368811 OpenUrl CrossRef PubMed ↵ Tanriverdi, D., & Cornelissen, F. W. (2024). Rapid assessment of peripheral visual crowding. Frontiers in Neuroscience, 18, 1332701. doi: 10.3389/fnins.2024.1332701 OpenUrl CrossRef PubMed ↵ The MathWorks Inc. 2022. MATLAB Version: 9.12.0.1884302 (R2022a). MathWorks Inc. https://www.mathworks.com ↵ Tiurina, N. A., Markov, Y. A., Choung, O.-H., Herzog, M. H., & Pascucci, D. (2022). Unlocking crowding by ensemble statistics. Current Biology, 32(22), 4975–4981.e3. doi: 10.1016/j.cub.2022.10.003 OpenUrl CrossRef PubMed ↵ Wagemans, J., Elder, J. H., Kubovy, M., Palmer, S. E., Peterson, M. A., Singh, M., & Von Der Heydt, R. (2012). A century of Gestalt psychology in visual perception: I. Perceptual grouping and figure–ground organization. Psychological Bulletin, 138(6), 1172–1217. doi: 10.1037/a0029333 OpenUrl CrossRef PubMed ↵ Yeshurun, Y., & Carrasco, M. (1999). Spatial attention improves performance in spatial resolution tasks. Vision Research, 39(2), 293–306. doi: 10.1016/S0042-6989(98)00114-X OpenUrl CrossRef PubMed Web of Science ↵ Zahabi, S., & Arguin, M. (2014). A crowdful of letters: Disentangling the role of similarity, eccentricity and spatial frequencies in letter crowding. Vision Research, 97, 45–51.
doi: 10.1016/j.visres.2014.02.001 OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted July 18, 2025. Download PDF Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Temporal windows of perceptual organization: Evidence from crowding and uncrowding Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Temporal windows of perceptual organization: Evidence from crowding and uncrowding Alessia Santoni , Luca Ronconi , Jason Samaha bioRxiv 2025.07.14.664690; doi: https://doi.org/10.1101/2025.07.14.664690 Share This Article: Copy Citation Tools Temporal windows of perceptual organization: Evidence from crowding and uncrowding Alessia Santoni , Luca Ronconi , Jason Samaha bioRxiv 2025.07.14.664690; doi: https://doi.org/10.1101/2025.07.14.664690 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Neuroscience Subject Areas All Articles Animal Behavior and Cognition (7621) Biochemistry (17645) Bioengineering (13867) Bioinformatics (41872) Biophysics (21416) Cancer Biology (18549) Cell Biology (25443) Clinical Trials (138) Developmental Biology (13360) Ecology (19866) Epidemiology (2067) Evolutionary Biology (24289) Genetics (15587) Genomics (22470) Immunology (17706) Microbiology (40314) Molecular Biology (17142) Neuroscience (88456) Paleontology (666) Pathology (2826) Pharmacology and 
Toxicology (4815) Physiology (7634) Plant Biology (15111) Scientific Communication and Education (2042) Synthetic Biology (4285) Systems Biology (9812) Zoology (2268)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00