A residual memory trace in an accumulator explains serial dependence

doi:10.1101/2025.08.24.671986

A residual memory trace in an accumulator explains serial dependence

2025 · doi:10.1101/2025.08.24.671986

preprint OA: closed

📄 Open PDF Full text JSON View at publisher

Full text 54,579 characters · extracted from preprint-html · click to expand

A residual memory trace in an accumulator explains serial dependence | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var 
i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results A residual memory trace in an accumulator explains serial dependence Hiroshi Higashi doi: https://doi.org/10.1101/2025.08.24.671986 Hiroshi Higashi 1 Graduate School of Engineering, The University of Osaka Find this author on Google Scholar Find this author on PubMed Search for this author on this site Abstract Full Text Info/History Metrics Preview PDF Abstract Human perception is not a series of isolated snapshots; our recent past continuously shapes what we currently see, 
a phenomenon known as serial dependence. While convolutional neural networks (CNNs) excel as models of vision, they are typically static and fail to capture such dynamic, history-dependent effects. Here, we introduce SDNet, a model that explains how serial dependence arises from the mechanics of decision-making. SDNet integrates a standard CNN with a recurrent network that functions as a sequential evidence accumulator. We hypothesize that this bias is not a flaw or a feature for optimality, but a natural byproduct of the accumulator retaining a residual memory trace of past decisions. Without being directly fit to behavioral data, SDNet spontaneously reproduces the characteristic patterns of serial dependence from human orientation and numerosity judgment tasks. The model even captures a key feature of human perception: that the bias grows stronger as task difficulty increases. This work provides a concrete, neurally plausible mechanism for serial dependence, challenging theories that frame it as a purely optimal strategy. By showing how a fundamental perceptual bias emerges from an intrinsic property of a dynamic system, SDNet represents a significant advance in building more biologically realistic models of human vision. 1 Introduction Visual perception is not a passive snapshot of the world. It is a dynamic process, profoundly shaped by our recent past. A wealth of evidence shows that our judgement of a stimulus is robustly pulled toward recently seen ones, a phenomenon termed serial dependence [ 12 , 20 ]. This “attractive” bias is ubiquitous [ 14 , 2 , 40 ], influencing our perception of fundamental features like orientation [ 15 , 25 , 43 , 45 ], spatial position [ 8 , 40 , 44 ], color [ 4 , 5 , 58 ], numerosity [ 14 , 18 , 21 ], and shape [ 39 , 38 ], and extending even to high-level judgement like face identity [ 36 , 55 , 56 ] and expression [ 30 , 37 , 60 , 17 , 41 ]. 
Its prevalence suggests serial dependence is not a mere curiosity but a fundamental feature of visual processing, yet its underlying mechanism remains a subject of intense debate. Computational approaches that search for this mechanism are split between two dominant but incomplete paradigms. On one hand, traditional cognitive models excel at describing the dynamics of decision-making but are abstract and cannot “see”—they do not operate directly on image pixels [ 49 , 50 , 42 , 47 ]. On the other hand, convolutional neural networks (CNNs) have revolutionized our understanding of the brain’s visual pathway and are inherently image-computable [ 33 , 34 , 61 ]. However, they are fundamentally static; unlike humans, a standard CNN’s response to an image is deterministic and unaffected by prior stimuli. This leaves a critical gap between biologically-inspired vision models and dynamic human perception. To bridge this divide, we developed SDNet, an image-computable neural network model that is capable of reproducing sequential effects for image-based inputs. SDNet combines a CNN front-end, functioning as a visual processing system, with a recurrent neural network (RNN) that models the decision process as the accumulation of evidence based on sequential sampling models [ 10 , 11 , 23 , 29 ] ( Figure 1 ). Our central hypothesis is that serial dependence is a natural consequence of this accumulation process [ 44 ]. Specifically, we propose that the accumulator [ 9 , 28 , 59 ] does not fully reset between decisions, but rather retains a residual trace of the previous choice in its internal memory. This inherited residue, carried in the RNN’s hidden state, then biases the accumulation process for the next stimulus. Download figure Open in new tab Figure 1. The SDNet model architecture and its mechanism for serial dependence. SDNet’s operation involves three key stages, illustrated here for an orientation adjustment task. 
(1) Sensory encoding: A CNN processes an input image (a tilted grating) and outputs sensory evidence as a probability distribution over possible orientations. (2) Evidence accumulation: An RNN sequentially samples from this evidence to integrate it over time and form a decision. (3) The causal mechanism: Crucially, the RNN’s hidden state is not reset after each decision. Instead, the final state from the previous trial is carried over to initialize the current trial. This inherited memory trace provides a bias that pulls the current decision toward the previous one, thus generating serial dependence. We tested this hypothesis by presenting SDNet with sequences of images from two classic perceptual tasks: orientation adjustment [ 20 ] and numerosity judgement [ 14 , 22 ]. Without being explicitly trained to do so, SDNet spontaneously reproduced the key signatures of human serial dependence. More impressively, the model also captured the nuanced relationship between task difficulty and the strength of the bias, a hallmark of human behaviour. This study offers three key contributions. First, we introduce the first image-computable model that quantitatively reproduces serial dependence. Second, we provide a neurally plausible mechanism, framing the bias not as an optimized strategy but as an emergent property of a leaky decision accumulator. Finally, SDNet serves as a powerful new tool to forge a more unified understanding of perception, from pixels to dynamic, history-dependent decisions. 2 Results We assessed SDNet’s ability to reproduce core features of human perceptual behaviour by comparing its performance to human participants across two distinct tasks: orientation adjustment and numerosity judgement. We first validated that the model could achieve human-level precision before testing its capacity to spontaneously generate serial dependence. 
2.1 Orientation adjustment task We first analyzed an orientation adjustment task ( Figure 7 ) performed by 83 human participants and 83 SDNet instances. In each trial, participants viewed a grating image of random orientation and adjusted a bar to match it. To mimic the varying sensory evidence available to humans, SDNet’s recurrent accumulator processed either 8 or 16 samples from the CNN, analogous to short (0.3 s) and long (0.6 s) stimulus presentation times. SDNet captures human-like performance and its modulation by task difficulty First, we confirmed that SDNet’s basic performance mirrored that of humans. The average adjustment error was comparable between humans (13.5 ± 14.6 ° ) and SDNet (15.0 ± 17.8 ° ). Critically, both humans and SDNet made larger errors under more challenging stimulus conditions: shorter presentation times and lower spatial frequencies ( Figure 2 ). A repeated-measures analysis of variance (RM ANOVA) confirmed these main effects were significant for both humans (presentation time: F 1,82 = 33.481, p < 0.001, spatial frequency: F 1,82 = 11.023, p < 0.001, ) and SDNet (presentation time: F 1,82 = 60.531, p < 0.001, spatial frequency: F 1,82 = 116.379, p < 0.001, ). This shows that SDNet’s precision is sensitive to stimulus uncertainty in a manner consistent with human perception. Download figure Open in new tab Figure 2. Average adjustment error in the orientation task under different conditions (presentation time and spatial frequency (SF)). Dots represent individual participant/instance means; error bars are standard error of the mean. SDNet spontaneously reproduces the attractive bias of serial dependence Next, we tested our central hypothesis. 
Using a derivative of Gaussian (DoG) fit to quantify the bias (see Section 4 ), we found that both humans and SDNet exhibited a significant attractive pull from the immediately preceding trial (1-back; human: p < 0.001, SDNet: p < 0.001) and the trial before that (2-back; human: p < 0.001, SDNet: p = 0.045), as shown in Figure 3 . This demonstrates that the model’s core mechanism—the inherited hidden state—is sufficient to generate short-term serial dependence. However, the effect diverged for longer histories: the bias remained for humans at 3-back ( p = 0.009) but vanished for SDNet ( p = 0.189), suggesting that the model’s memory trace decays rapidly. Download figure Open in new tab Figure 3. Serial dependence from 1-back, 2-back, and 3-back trials in orientation adjustment. (A) Adjustment errors as a function of relative orientation between the current and preceding stimuli for human participants. Dots represent individual participant means. (B) SD amplitude (|SD|) and peak shift (ΔSD) for human participants. Error bars for |SD| and ΔSD indicate the standard deviation from bootstrap sampling. (C) |SD| and ΔSD for SDNet instances. (D) Adjustment errors for SDNet instances. The asterisks ( ∗ ) below the bars for |SD| denote significant dependence ( p < 0.05, bootstrap test). Task difficulty amplifies serial dependence in both humans and SDNet A key feature of human serial dependence is its modulation by task difficulty. We found a remarkable correspondence between our model and human data. When the current stimulus was harder to perceive (i.e., had a low spatial frequency), the magnitude of serial dependence significantly increased for both humans ( p = 0.010) and SDNet ( p = 0.035), as shown in Figure 4A . This shared pattern supports the principle that when current sensory evidence is unreliable, both the human brain and SDNet rely more heavily on the residual memory of the past. 
A similar trend was observed for short presentation times ( Figure 4B ), though it only reached significance for SDNet ( p = 0.001) and not humans ( p = 0.682). Download figure Open in new tab Figure 4. Modulation of serial dependence by stimulus uncertainty. The strength of the 1-back serial dependence bias was conditioned on the properties of the current and previous stimulus. (A, D) Adjustment errors for humans and SDNet as a function of relative orientation. (B, C) SD amplitude |SD| and peak shift ΔSD for humans and SDNet. Previous trial uncertainty similarly attenuates the bias We also investigated how the reliability of the previous stimulus affected the current bias. Both humans and SDNet showed an identical pattern: when the previous stimulus had low spatial frequency (high uncertainty), it exerted a significantly weaker pull on the current trial (human: p = 0.016, SDNet: p = 0.001), as shown in Figure 4C . The presentation time of the previous trial had no significant effect for either group ( Figure 4D ). This demonstrates that both human perception and SDNet dynamically weight past information, discounting it when it originates from a less reliable source. 2.2 Numerosity judgement task To test the generality of our model, we compared it against a public dataset from a numerosity judgement task [ 22 ]. In this task, 32 participants judged whether a “probe” image had more dots than a “reference” image, after being primed by an “inducer” image. We likewise trained 32 SDNet instances on the same task. SDNet matches human precision but not all task-specific biases SD-Net’s overall task precision was indistinguishable from that of humans ( Z 31 = 158.000, p = 0.238; two-sided Wilcoxon signed-rank test with Bonferroni correction; Figure 5A ). 
However, SDNet did not capture a specific recency bias observed in humans ( Z 31 = 60.000, p < 0.001; Figure 5B ), who tended to respond “more” when the probe and reference were physically identical, a nuance our general-purpose accumulator architecture does not account for. Although this bias led to a slight difference in their psychometric functions ( Figure 5C ), the points of subjective equality (PSEs) derived from these functions were not significantly different between human and SDNet ( p = 0.053; bootstrap test (see Section 4.2.3 ); Figure 5D ). Download figure Open in new tab Figure 5. Behavioural performance in numerosity judgement task. (A) Percentage of correct responses for the judgement task. The three horizontal bars represents maximum, average, minimum of PSEs, respectively. (B) Percentage of responses indicating “probe stimulus had more dots” when the reference and probe stimuli had equal numerosity (16 dots). (C) Psychometric functions, plotting the proportion of “probe has more dots” responses as a function of probe numerosity. Dots represent the grand average, and error bars show the standard deviation across participants/instances. (D) PSEs. Download figure Open in new tab Figure 6. Serial dependence modulated by inducer numerosity in numerosity judgement task. (A, D) Psychometric functions for humans and SDNet, split by low (12 dots) versus high (24 dots) inducer numerosity. (B, C) PSEs for human and SDNet. Download figure Open in new tab Figure 7. Trial structure of the orientation adjustment task. Participants first viewed a central fixation cross, followed by a brief presentation of sinusoidal grating. After a mask, a response bar appeared, which participants rotated to match the orientation of the grating they had just seen. SDNet robustly reproduces serial dependence Despite the minor difference in bias, SDNet robustly reproduced the core serial dependence effect. 
For both humans and SDNet, the judgement of the reference stimulus was significantly biased by the numerosity of the preceding inducer stimulus. A low-numerosity inducer caused the subsequent reference to be perceived as having fewer dots (shifting the psychometric curve left), while a high-numerosity inducer did the opposite (human: p = 0.001; SDNet: p < 0.001; Figure 6 ). This successful replication in a different task and stimulus domain strongly supports our central claim that serial dependence is an emergent property of evidence accumulation with a leaky memory trace. 3 Discussion Neural networks are powerful tools for modeling vision, but they have largely overlooked the brain’s dynamic nature, where past experiences continuously influence current decisions. In this study, we addressed this gap by developing SDNet, an image-computable model that spontaneously reproduces serial dependence, a hallmark of human perception. By testing it on orientation and numerosity tasks, we demonstrated that SDNet not only matches human-level performance but also captures the core attractive bias of serial dependence and, critically, how its strength is modulated by task difficulty. A mechanistic alternative to optimality Our work offers a new perspective on the very nature of serial dependence. Prevailing computational theories often frame this bias as an optimal strategy derived from Bayesian inference or predictive coding, designed to enhance perceptual stability and efficiency in a noisy world [ 18 , 16 , 42 ]. SDNet challenges this view. We propose that serial dependence is not a dedicated feature for optimization, but rather an emergent property—a natural side effect of how the brain makes decisions. Our model’s architecture is built on the well-established principle of sequential evidence accumulation [ 51 , 23 , 48 , 13 , 19 ]. We hypothesized that the neural accumulators responsible for this process are not perfectly reset after each choice. 
Instead, a residual memory trace of the previous decision, carried in the accumulator’s internal state, persists and biases the next one [ 44 , 4 ]. Our results validate this hypothesis, showing that this simple mechanism is sufficient to generate human-like serial dependence. This reframes a key question: instead of asking why the brain evolved an optimal strategy for serial dependence, we can ask why its decision accumulators are not fully reset. The answer may lie in biological constraints, such as the metabolic cost of a hard reset, or functional benefits, like faster processing by starting from a non-zero baseline. Bridging models and neurophysiology SDNet also provides a concrete framework for investigating the neural underpinnings of serial dependence. Neurophysiological studies have found correlates of past stimuli in both early visual areas like V1 [ 54 , 53 ] and higher-level frontoparietal regions [ 1 , 7 , 57 ]. This has fueled debate about where in the processing hierarchy the bias originates. Our model, with its CNN-to-RNN structure, maps onto this hierarchy. While the CNN “sees” the stimulus (like V1), the bias originates in the RNN “accumulator” (like higher-level cortex). This aligns with findings that decision-related accumulation processes are observed in parietal and frontal cortices [ 32 , 31 , 3 , 27 ] and that these regions are causally involved in serial dependence. The influence of these higher areas could then feed back to early visual cortex. SDNet thus provides a powerful tool to test such hypotheses by correlating its internal layer activations with neural recordings from different brain regions [ 61 ]. Limitations and future directions While SDNet captures core phenomena, its simplicity also highlights clear avenues for future work. SDNet’s bias decays rapidly, failing to reproduce the weaker but significant dependence observed from 3-back trials in humans. 
The longer-term dependence likely suggests the involvement of other cognitive systems [ 52 ] not included in SDNet, such as working memory [ 6 ] or episodic memory. This points to a critical avenue for future research: investigating the interplay of multiple memory systems in human perception [ 25 ]. Our model only accounts for attractive biases. However, under certain conditions, perception is repulsed from a prior stimulus [ 24 , 26 , 2 , 47 ]. These repulsive effects are often considered a signature of distinct neural mechanisms and represent an important phenomenon for future models to explain. Serial dependence in human is strongly modulated by the spatial location of stimuli. The current version of SDNet is not spatially organized. A natural next step is to develop an architecture with multiple, spatially-tuned accumulators to investigate these critical spatial dynamics. Conclusion We introduced SDNet, an image-computable neural network that explains serial dependence as an emergent property of evidence accumulation with a leaky memory. This work provides a neurally plausible, mechanistic alternative to optimality-based theories and represents a critical step toward building more comprehensive, dynamic models of human vision that bridge the gap from pixels to perception and decision. 4 Methods This study investigated serial dependence by comparing the performance of human participants with that of a novel neural network, SDNet, across two perceptual tasks. All analyses were conducted in Python, and the model was implemented in PyTorch. 4.1 Orientation adjustment task To validate SDNet’s ability to reproduce human serial dependence, we collected human behavioural data through an online experiment. 4.1.1 Human behavioural experiment Participants One hundred participants were recruited via Prolific ( www.prolific.com ). All provided informed consent before the experiment. 
The study protocol was approved by the Committee for Human Research at the Graduate School of Engineering, The University of Osaka, and adhered to the Declaration of Helsinki. Participants received a base compensation of £3 for completing the experiment, with an additional performance-based bonus ranging from £0 to £1 (average: £0.5) based on their accuracy in orientation adjustment. Stimulus and procedure Each trial consisted of a sequence: fixation, stimulus presentation, mask, and adjustment phase ( Figure 7 ). Stimuli were sinusoidal gratings using the GratingStim module in PsychoPy [ 46 ]. For each trial, the grating’s spatial frequency ( sf ) was randomly selected from {2, 3, 4} Hz, orientation ( ori ) from {0, 1, 2, …, 179} degrees, and phase ( phase ) from {0, 0.1, 0.2, …, 0.9} (in steps of 0.1). Stimuli were presented at the center of the browser window, masked by a Gaussian function ( mask: gauss ), and scaled to half the window size. Stimulus presentation duration was either 0.3 s or 0.6 s. A mask image was presented for 0.5 seconds immediately after the stimulus to prevent visual aftereffects. Participants were instructed to adjust a keyboard-controllable bar to match the orientation of the previously presented grating stimulus. The bar’s initial orientation was randomized. Participants used the left and right cursor keys for counter-clockwise and clockwise rotations, respectively. There was no time limit for the adjustment, and participants finalized their response by pressing the space bar. Each participant completed 200 trials, separated into 4 blocks of 50 trials each, with a mandatory break of at least 30 s between blocks.. The average experiment duration was 27 minutes. Data screening Initial participant screening excluded data from participants whose average absolute orientation error exceeded 39.2 ° (calculated as 1.5 × (interquartile range) + (first quantile)). This criterion led to the exclusion of 17 participants (17%). 
Subsequently, trial-level screening excluded individual trials with an absolute orientation error above 37.5 ° (1.5 × (interquartile range)+ (first quantile)). This excluded 488 samples (approximately 2.9%). The final dataset for analysis comprised 16,112 samples from 83 participants. 4.1.2 SDNet Architecture SDNet consists of two primary modules ( Figure 1 ): a CNN for visual feature extraction and an RNN for sequential evidence accumulation and decision-making. The CNN is an AlexNet [ 35 ] that takes a 128 × 128 pixel image and outputs a 180-dimensional probability vector representing sensory evidence for each orientation. The RNN is a gated recurrent unit (GRU) with 16 hidden cells. At each time step t , it receives a one-hot vector k [ t ] (sampled from the CNN’s evidence) and updates its hidden state h [ t − 1] to produce h [ t ]. The final hidden state is passed through a dense layer to produce the model’s perceptual report. Training Training was a two-stage process. First, the CNN module was trained on a large dataset of generated grating images to predict the correct orientation. The dataset of 5,400 grating images (128 × 128 pixels) was generated using PsychoPy’s GratingStim module, with parameters matching those used in the human experiment (spatial frequency ( sf ): 2, 3, 4, orientation ( ori ): 0, 1, 2, …, 179, phase ( phase ): 0, 0.1, 0.2, …, 0.9). These images were split into training (3,240 images), validation (1,080 images), and test (1,080 images) sets with a 6:2:2 proportion. The CNN was trained to minimize the cross-entropy loss between one-of- K coded ground-truth orientation y n and its predicted probability distribution e n . Early stopping was employed: training was terminated when the average absolute error of the CNN module on the validation dataset reached below the human-averaged orientation error ( ). Following CNN training, the RNN module was trained with the CNN module’s weights frozen. 
For each training sample, the CNN’s output evidence e n was repeatedly sampled (16 times) to generate a sequence of 180-dimensional one-hot vectors k [ t ], t = 0, 1, … 15. The RNN module was trained to minimize the cross-entropy loss between the true orientation y n and the RNN’s final output evidence ϵ n . Crucially, to model serial dependence, the initial hidden state h n [0] for the current image x n was set to the final hidden state h m [ T ] of a randomly chosen previous image x m from the training set. Early stopping for the RNN training was similarly applied based on reaching the human-averaged orientation error on the validation dataset. Generating behavioural responses To simulate human behavioural data, SDNet processed sequences of images. For a given trial n with input image x n and a previous trial n − 1 with image x n− 1 , the CNN module first computed evidence e n for x n . The RNN module then made a final decision by accumulating T n samples ({ k n [0], k n [ 1 ], …, k n [ T n ]}) from e n , where T n (e.g., 8 or 16) simulated presentation time. A key aspect of SDNet is that the initial hidden state for processing x n ( h n [0]) was inherited from the final hidden state of the n − 1th image ( h n− 1 [ T n− 1 ]). The deterministic orientation was sampled from the RNN module’s final output evidence ϵ n . Behavioural data generation For comparative analysis, 83 instances of SDNet were created, each trained with different random splits of the image dataset. For each instance, four sequences of 50 test stimulus images (total 200 images per instance) were generated, mimicking the block structure of the human experiment. No instance-level screening was applied, as the instances were already designed to reproduce human-level precision. However, trial-level screening was performed, excluding samples with an orientation error exceeding 37.5 ° , consistent with the human data screening. 
This resulted in 15,717 samples (883 samples (approximately 5.3%) were excluded) from 83 SDNet instances for analysis. 4.1.3 Analysis of serial dependence Adjustment error and relative orientation For each trial n , the stimulus properties (orientation y n , spatial frequency f n , phase p n , and presentation time t n ) and the human participant’s /model instance’s response ( z n ) were recorded. The adjustment error e n was calculated as the shortest angular distance between the stimulus and response orientation: where min(· · ·) is an operator that outputs the minimum value of the input elements. The relative orientation from m -back trial, , was defined as the shortest angular distance between the current stimulus orientation y n and the stimulus orientation from m trials back y n−m : For each participant/instance, adjustment errors were averaged within bins defined by relative orientation θ , and other stimulus conditions ( f, t, f − 1 , t − 1 for spatial frequency, presentation time, and their 1-back counterparts): for m = 1, 2, 3. Here, Ω( m, θ, f, t, f − 1 , t − 1 ) represents the set of trial indices satisfying the given conditions within a bin of width 10 ° centered at θ given . Derivative of Gaussian (DoG) Fitting To quantify the amplitude of serial dependence, the averaged error plot ( θ versus ϕ ( −m ) ( θ, f, t, f − 1 , t − 1 )) was fitted to a derivative of Gaussian (DoG) curve [ 20 ] for a given conditions { m, f, t, f − 1 , t − 1 }. The DoG function is defined as: where a is the amplitude of the curve, representing the strength and direction of serial dependence, w is the width parameter describing the range of relative orientations over which the effect occurs, and is a constant. 
Omitting the condition variables, m, f, t, f − 1 , t − 1 from ϕ ( −m ) ( θ, f, t, f − 1 , t − 1 ) for notational simplicity, the parameters a and w were optimized by minimizing the squared error between the empirical adjustment errors ϕ ( θ ) and the DoG function across all participants/instances: where 𝒮 is a set of pairs of a relative orientation error θ and corresponding adjustment error ϕ ( θ ) for all participants/instances. A sequential least squares programming method, implemented via scipy.optimize.minimize in Python, was used for this minimization. SD amplitude quantification Serial dependence was quantified by the SD amplitude (|SD|) and peak relative orientation (ΔSD) derived from the fitted DoG curve. The peak relative orientation is given by and the corresponding SD amplitude is Here, Θ is the range of possible relative orientations, {−90.0, −89.9, −89.8, …, 89.8, 89.9} degrees. A positive amplitude indicates an attractive bias, while a negative amplitude would indicate a repulsive bias. Statistical testing via bootstrap method Statistical significance for the presence of serial dependence and for comparisons between conditions was assessed using a bootstrap method. To test for the presence of serial dependence in a given dataset 𝒮: We generated 100,000 bootstrap samples , m = 1, …, 100000 by resampling with replacement from 𝒮. For each , we performed DoG fitting to obtain loss . To establish a null distribution, we randomly permuted the adjustment error values ϕ ( θ ) within each bin of (while keeping θ fixed) to create 100,000 permuted sample sets . For each , we obtained . The p -value for the null hypothesis (i.e., the DoG function does not fit the data better than chance) was calculated as p = K/ 100000, where K is the number of bootstrap samples where . To compare the strengths of serial dependence between two datasets, 𝒮 1 and 𝒮 2 : We generated 100,000 bootstrap samples and by resampling with replacement from 𝒮 1 and 𝒮 2 , respectively. 
DoG fitting was performed on each bootstrapped sample to obtain the SD amplitude $|\mathrm{SD}|_{1,m}$ for the m -th bootstrap sample of 𝒮 1 and $|\mathrm{SD}|_{2,m}$ for the m -th bootstrap sample of 𝒮 2 . For a one-sided test (e.g., whether 𝒮 1 has stronger serial dependence than 𝒮 2 ), the p -value was calculated as p = K/ 100000, where K is the count of samples where $|\mathrm{SD}|_{1,m} \le |\mathrm{SD}|_{2,m}$ . 4.2 Numerosity judgement task In addition to the orientation adjustment task, we evaluated SDNet using a public dataset from a numerosity judgement task. 4.2.1 Human behavioral dataset We utilized a previously recorded dataset of 32 human participants who performed a numerosity judgement task [ 22 ]. In each trial, participants were sequentially presented with three images (inducer, reference, and probe) that varied in dot numerosity (8, 12, 16, 24, 32 dots), dot size (4, 6, 8 pixels), and presentation duration (140, 200, 280 ms). Participants’ task was to determine whether the probe stimulus had more dots than the reference stimulus 1 . Each participant completed 10 blocks of 40 trials, with breaks between the blocks, totaling 400 trials. Unlike the original study, no participants were excluded based on EEG signal quality for this behavioral analysis. 4.2.2 SDNet Architecture The SDNet model for the numerosity judgement task ( Figure 8 ) also consists of CNN and RNN modules. The CNN architecture was identical to that used for the orientation adjustment task (AlexNet-based). However, its output was a 37-dimensional probability distribution over dot numerosities (from 0 to 36). The RNN module was implemented with a GRU of Q = 8 hidden cells, accumulating samples from the CNN’s output evidence. Download figure Open in new tab Figure 8. SDNet architecture for the numerosity judgement task. The model processes three sequential images (inducer, reference, probe) using a shared-weight CNN-RNN pathway. Each image is initially processed by a CNN module for feature extraction, and its evidence is accumulated by an RNN module. 
Crucially, the RNN’s hidden state for the reference image is initialized with the final hidden state from the inducer image, and similarly, the RNN’s hidden state for the probe image is initialized with the final hidden state from the reference image. The final hidden states from the reference and probe RNNs are then concatenated and fed into a judgement module (a dense layer followed by a softmax layer) that determines whether the probe image has more dots than the reference. Since the task involved comparing two images (reference and probe), these were independently processed by separate CNN-RNN pathways. The final hidden states for the reference ( h ref ) and probe ( h probe ) images were concatenated to form a 16-dimensional feature vector (as Q = 8, so 8 × 2 = 16). This vector was then fed into a judgement module, consisting of a single dense layer (reducing to 2 dimensions) and a softmax layer, to output the likelihood that the probe image had more dots. Training Training data consisted of 32,400 images of random dots, generated using the original script from [ 22 ]. Dot numerosities ranged from 1 to 36, and dot sizes from 2 to 10 pixels, covering the settings of the human experiment. Images were generated at 1080 × 1080 pixel resolution and then scaled to 128 × 128 for SDNet input, preserving dot size ratios. The dataset was split 6:4 into training (19,440 images) and validation (12,960 images) sets. The CNN module was trained first to predict dot numerosity by minimizing cross-entropy loss. Early stopping was applied when the CNN’s average absolute numerosity error on the validation set reached below 3. This threshold was empirically determined to achieve human-level final judgement precision. The RNN and judgement modules were then trained with the CNN weights fixed. The CNN’s output evidence e was sampled 16 times to generate sequences k [ t ] ( t = 0, …, 16) for RNN input. The RNN’s hidden state was updated as h [ t ] = GRU( k [ t ], h [ t − 1]). 
For each training trial, inducer, reference, and probe images were randomly selected. Crucially, the initial hidden state for the reference image’s RNN was set to the final hidden state of the inducer image’s RNN, and the initial hidden state for the probe image’s RNN was set to the final hidden state of the reference image’s RNN. The RNN and judgement modules were trained to minimize the binary cross-entropy loss for the target variable γ , where γ = 1 if probe numerosity was greater than reference, and γ = 0 otherwise. Early stopping was applied when SDNet’s average judgement error (excluding equal numerosity trials) on the validation set reached below the human-averaged error ( ). Generating behavioural response To generate SDNet behavioural data for comparison, 32 instances were trained using different dataset splits. For each trained instance, 400 trial sequences were generated using images from a separate test set, randomly combining inducer, reference, and probe images with parameters matching the human experiment (dot numerosity: 8, 12, 16, 24, 32; dot size: 4, 6, 8). This resulted in 400 responses per SDNet instance, matching the human dataset’s sample size. 4.2.3 Analysis of serial dependence Point of subjective equality (PSE) For each participant/instance, behavioural data consisted of inducer ( a n ), reference ( b n ), probe ( c n ) dot numerosities, and the binary response r n ∈ {0, 1} (0: reference had more dots, 1: probe had more dots) for trial n . For specific inducer and reference numerosities (reference was fixed at 16 dots in this dataset), the proportion of “probe has more dots” responses, ψ ( c ), was calculated for each probe numerosity c : $\psi(c) = \frac{1}{|\Omega(c)|} \sum_{n \in \Omega(c)} r_n$ where Ω( c ) = { n | c n = c, ∀n } defines the set of trials for a given probe numerosity. 
A psychometric function (Weibull function) F ( c ; α, β ) was fitted to these proportions across all participants/instances by minimizing the squared error: $(\hat{\alpha}, \hat{\beta}) = \arg\min_{\alpha, \beta} \sum_{i} \sum_{c} \left( \psi_i(c) - F(c; \alpha, \beta) \right)^2$ where ψ i ( c ) is the proportion for the i th participant/instance. PSE was defined as the probe numerosity c at which the psychometric function yielded a 0.5 probability of responding “probe has more dots”: $F(\mathrm{PSE}; \hat{\alpha}, \hat{\beta}) = 0.5$ . Serial dependence strength was quantified by analyzing shifts in PSE across different inducer numerosities. Statistical testing via bootstrap method Similar to the orientation adjustment task, a bootstrap method was employed for statistical testing of PSE differences. To compare PSEs between two conditions (e.g., different inducer numerosities for 𝒮 1 and 𝒮 2 ): We generated 100,000 bootstrap samples $\mathcal{S}^{*}_{1,m}$ and $\mathcal{S}^{*}_{2,m}$ ( m = 1, …, 100000) by resampling with replacement from 𝒮 1 and 𝒮 2 , respectively. For each bootstrapped sample, PSEs were computed as $\mathrm{PSE}_{1,m}$ from $\mathcal{S}^{*}_{1,m}$ and $\mathrm{PSE}_{2,m}$ from $\mathcal{S}^{*}_{2,m}$ . For a one-sided test (e.g., whether the PSE from 𝒮 1 is larger than that from 𝒮 2 ), the p -value for testing whether PSEs from 𝒮 1 and 𝒮 2 are significantly different was calculated as p = K/ 100000, where K is the count of samples where $\mathrm{PSE}_{1,m} \le \mathrm{PSE}_{2,m}$ . Author contributions H.H. and K.H. designed and performed the research, collected and analyzed the data. H.H. drafted the paper. H.H., K.H., and Y.T. edited the paper. Competing interests The authors declare no competing interests. Acknowledgements This work was supported in part by the Japan Society for the Promotion of Science (JSPS) KAKENHI, grant numbers 22H05163 and 24K15047, and Japan Science and Technology Agency (JST) Advanced International Collaborative Research Program (AdCORP), grant number JPMJKB2307. Funder Information Declared Japan Society for the Promotion of Science, https://ror.org/00hhkn466 , 22H05163 , 24K15047 Japan Science and Technology Agency, https://ror.org/00097mb19 , JPMJKB2307 Footnotes 1 The experiments also included two other tasks. One of the participants’ tasks was to determine whether the probe stimulus had bigger dots than the reference stimulus. 
The other was to determine whether the probe stimulus had longer presentation time than the reference stimulus. In our experiment, we did not use these data. References [1]. ↵ A. Akrami , C. D. Kopec , M. E. Diamond , and C. D. Brody . Posterior parietal cortex represents sensory history and mediates its effects on behaviour . Nature , 554 ( 7692 ): 368 – 372 , 2 2018 . OpenUrl CrossRef PubMed [2]. ↵ D. Alais , J. Leung , and E. Van der Burg . Linear summation of repulsive and attractive serial dependencies: Orientation and motion dependencies sum in motion perception . Journal of Neuroscience , 37 ( 16 ): 4381 – 4390 , 4 2017 . OpenUrl Abstract / FREE Full Text [3]. ↵ A. Bahl and F. Engert . Neural circuits for evidence accumulation and decision making in larval zebrafish . Nature Neuroscience , 23 ( 1 ): 94 – 102 , 1 2020 . OpenUrl CrossRef PubMed [4]. ↵ J. Barbosa and A. Compte . Build-up of serial dependence in color working memory . Scientific Reports , 10 ( 1 ): 10959 , 7 2020 . OpenUrl PubMed [5]. ↵ P. M. Bays , R. F. G. Catalao , and M. Husain . The precision of visual working memory is set by allocation of a shared resource . Journal of Vision , 9 ( 10 ): 7 – 7 , 9 2009 . OpenUrl Abstract / FREE Full Text [6]. ↵ P. M. Bays and M. Husain . Dynamic shifts of limited working memory resources in human vision . Science , 321 ( 5890 ): 851 – 854 , 8 2008 . OpenUrl Abstract / FREE Full Text [7]. ↵ D. P. Bliss , D. Rahnev , W. E. Mackey , C. E. Curtis , and M. D’Esposito . Stimulation along the anterior-posterior axis of lateral frontal cortex reduces visual serial dependence . Journal of Vision , 23 ( 7 ): 1 , 7 2023 . OpenUrl CrossRef PubMed [8]. ↵ D. P. Bliss , J. J. Sun , and M. D’Esposito . Serial dependence is absent at the time of perception but increases in visual working memory . Scientific Reports , 7 ( 1 ): 14739 , 11 2017 . OpenUrl PubMed [9]. ↵ R. Bogacz , E. Brown , J. Moehlis , P. Holmes , and J. D. Cohen . 
The physics of optimal decision making: A formal analysis of models of performance in two-alternative forced-choice tasks . Psychological Review , 113 ( 4 ): 700 – 765 , 10 2006 . OpenUrl CrossRef PubMed Web of Science [10]. ↵ S. Brown and A. Heathcote . A ballistic model of choice response time . Psychological Review , 112 ( 1 ): 117 – 128 , 1 2005 . OpenUrl CrossRef PubMed Web of Science [11]. ↵ S. D. Brown and A. Heathcote . The simplest complete model of choice response time: Linear ballistic accumulation . Cognitive Psychology , 57 ( 3 ): 153 – 178 , 11 2008 . OpenUrl CrossRef PubMed Web of Science [12]. ↵ D. Burr and G. Cicchini . Vision: Efficient adaptive coding . Current Biology , 24 ( 22 ): R1096 – R1098 , 11 2014 . OpenUrl CrossRef PubMed [13]. ↵ Y.-A. Cheng , I. Felipe Rodriguez , S. Chen , K. Kar , T. Watanabe , and T. Serre . RTify: Aligning deep neural networks with human behavioral decisions . In Advances in Neural Information Processing Systems , 2024 . [14]. ↵ G. M. Cicchini , G. Anobile , and D. C. Burr . Compressive mapping of number to space reflects dynamic encoding mechanisms, not static logarithmic transform . Proceedings of the National Academy of Sciences , 111 ( 21 ): 7867 – 7872 , 5 2014 . OpenUrl Abstract / FREE Full Text [15]. ↵ G. M. Cicchini , K. Mikellidou , and D. Burr . Serial dependencies act directly on perception . Journal of Vision , 17 ( 14 ): 6 , 12 2017 . OpenUrl CrossRef PubMed [16]. ↵ G. M. Cicchini , K. Mikellidou , and D. C. Burr . Serial Dependence in Perception . Annual Review of Psychology , 75 ( 1 ), 1 2024 . [17]. ↵ C. W. G. Clifford , T. L. Watson , and D. White . Two sources of bias explain errors in facial age estimation . Royal Society Open Science , 5 ( 10 ): 180841 , 10 2018 . OpenUrl CrossRef PubMed [18]. ↵ J. E. Corbett , J. Fischer , and D. Whitney . Facilitating stable representations: serial dependence in vision . PLoS ONE , 6 ( 1 ): e16701 , 1 2011 . OpenUrl CrossRef PubMed [19]. ↵ J. S. Duffy , M. A. 
Bellgrove , P. R. Murphy , and R.G. O’Connell . Disentangling sources of variability in decision-making . Nature Reviews Neuroscience , 3 2025 . [20]. ↵ J. Fischer and D. Whitney . Serial dependence in visual perception . Nature Neuroscience , 17 ( 5 ): 738 – 743 , 2014 . OpenUrl CrossRef PubMed [21]. ↵ M. Fornaciai and J. Park . Attractive serial dependence in the absence of an explicit task . Psychological Science , 29 ( 3 ): 437 – 446 , 3 2018 . OpenUrl CrossRef PubMed [22]. ↵ M. Fornaciai , I. Togoli , and D. Bueti . Perceptual history biases are predicted by early visual-evoked activity . The Journal of Neuroscience , 43 ( 21 ): 3860 – 3875 , 5 2023 . OpenUrl Abstract / FREE Full Text [23]. ↵ B. Forstmann , R. Ratcliff , and E.-J. Wagenmakers . Sequential sampling models in cognitive neuroscience: Advantages, applications, and extensions . Annual Review of Psychology , 67 ( 1 ): 641 – 666 , 1 2016 . OpenUrl CrossRef PubMed [24]. ↵ M. Fritsche and F. P. de Lange . The role of feature-based attention in visual serial dependence . Journal of Vision , 19 ( 13 ), 11 2019 . [25]. ↵ M. Fritsche , P. Mostert , and F. P. de Lange . Opposite effects of recent history on perception and decision . Current Biology , 27 ( 4 ): 590 – 595 , 2 2017 . OpenUrl CrossRef PubMed [26]. ↵ M. Fritsche , E. Spaak , and F. P. de Lange . A Bayesian and efficient observer model explains concurrent attractive and repulsive history biases in visual perception . eLife , 9 ( e55389 ): 1 – 32 , 6 2020 . OpenUrl CrossRef PubMed [27]. ↵ T. Hanks , R. Kiani , and M. N. Shadlen . A neural mechanism of speed-accuracy tradeoff in macaque area LIP . eLife , 3 ( e02260 ), 5 2014 . [28]. ↵ A. Heathcote and D. Matzke . Winner takes all! What are race models, and why and how should psychologists use them? Current Directions in Psychological Science , 31 ( 5 ): 383 – 394 , 10 2022 . OpenUrl CrossRef [29]. ↵ H. Higashi . Individuality transfer: Predicting human decision-making across tasks . 
eLife , 14 ( RP107163 ), 6 2025 . [30]. ↵ S.-M. Hsu and Z.-R. Wu . The roles of preceding stimuli and preceding responses on assimilative and contrastive sequential effects during facial expression perception . Cognition and Emotion , 34 ( 5 ): 890 – 905 , 7 2020 . OpenUrl [31]. ↵ A. C. Huk , L. N. Katz , and J. L. Yates . The role of the lateral intraparietal area in (the study of) decision making . Annual Review of Neuroscience , 40 ( 1 ): 349 – 372 , 7 2017 . OpenUrl CrossRef PubMed [32]. ↵ A. C. Huk and M. N. Shadlen . Neural activity in macaque parietal cortex reflects temporal integration of visual motion signals during perceptual decision making . The Journal of Neuroscience , 25 ( 45 ): 10420 – 10436 , 11 2005 . OpenUrl Abstract / FREE Full Text [33]. ↵ N. Kriegeskorte . Deep neural networks: A new framework for modeling biological vision and brain information processing . Annual Review of Vision Science , 1 ( 1 ): 417 – 446 , 11 2015 . OpenUrl CrossRef PubMed [34]. ↵ N. Kriegeskorte and T. Golan . Neural network models and deep learning . Current Biology , 29 ( 7 ): R231 – R236 , 4 2019 . OpenUrl CrossRef PubMed [35]. ↵ A. Krizhevsky , I. Sutskever , and G. E. Hinton . ImageNet classification with deep convolutional neural networks . In Advances in Neural Information Processing Systems , 2012 . [36]. ↵ Liberman , J. Fischer , and D. Whitney . Serial dependence in the perception of faces . Current Biology , 24 ( 21 ): 2569 – 2574 , 11 2014 . OpenUrl CrossRef PubMed [37]. ↵ Liberman , M. Manassi , and D. Whitney . Serial dependence promotes the stability of perceived emotional expression depending on face similarity . Attention, Perception, & Psychophysics , 80 ( 6 ): 1461 – 1473 , 8 2018 . OpenUrl PubMed [38]. ↵ M. Manassi , C. Ghirardo , T. Canas-Bajo , Z. Ren , W. Prinzmetal , and D. Whitney . Serial dependence in the perceptual judgments of radiologists . Cognitive Research: Principles and Implications , 6 ( 1 ): 65 , 10 2021 . OpenUrl [39]. ↵ M. 
Manassi , A. Kristjansson , and D. Whitney . Serial dependence in a simulated clinical visual search task . Scientific Reports , 9 ( 1 ): 19937 , 12 2019 . OpenUrl PubMed [40]. ↵ M. Manassi , A. Liberman , A. Kosovicheva , K. Zhang , and D. Whitney . Serial dependence in position occurs at the time of perception . Psychonomic Bulletin & Review , 25 ( 6 ): 2245 – 2253 , 12 2018 . OpenUrl PubMed [41]. ↵ M. Manassi and D. Whitney . Illusion of visual stability through active perceptual serial dependence . Science Advances , 8 ( 2 ): 2480 , 1 2022 . OpenUrl [42]. ↵ M. Manassi and D. Whitney . Continuity fields enhance visual perception through positive serial dependence . Nature Reviews Psychology , 3 ( 5 ): 352 – 366 , 4 2024 . OpenUrl [43]. ↵ Y. Murai and D. Whitney . Serial dependence revealed in history-dependent perceptual templates . Current Biology , 31 ( 14 ): 3185 – 3191 , 7 2021 . OpenUrl CrossRef PubMed [44]. ↵ C. Papadimitriou , A. Ferdoash , and L. H. Snyder . Ghosts in the machine: Memory interference from the previous trial . Journal of Neurophysiology , 113 ( 2 ): 567 – 577 , 1 2015 . OpenUrl CrossRef PubMed [45]. ↵ D. Pascucci , G. Mancuso , E. Santandrea , C. Della Libera , G. Plomp , and L. Chelazzi . Laws of concatenated perception: Vision goes for novelty, decisions for perseverance . PLOS Biology , 17 ( 3 ): e3000144 , 3 2019 . OpenUrl CrossRef PubMed [46]. ↵ J. Peirce , J. R. Gray , S. Simpson , M. MacAskill , R. Höchenberger , H. Sogo , E. Kastman , and J. K. Lindeløv . PsychoPy2: Experiments in behavior made easy . Behavior Research Methods , 51 ( 1 ): 195 – 203 , 2019 . OpenUrl CrossRef PubMed [47]. ↵ A. Prat-Carrabin , F. Meyniel , and R. Azeredo da Silveira . Resource-rational account of sequential effects in human prediction . eLife , 13 ( e81256 ), 1 2024 . [48]. ↵ F. Rafiei , M. Shekhar , and D. Rahnev . The neural network RTNet exhibits the signatures of human perceptual decision-making . Nature Human Behaviour , 8 ( 9 ): 1752 – 1770 , 7 2024 . 
OpenUrl PubMed [49]. ↵ R. Ratcliff . A theory of memory retrieval . Psychological Review , 85 ( 2 ): 59 – 108 , 3 1978 . OpenUrl CrossRef Web of Science [50]. ↵ R. Ratcliff and G. McKoon . The diffusion decision model: Theory and data for two-choice decision tasks . Neural Computation , 20 ( 4 ): 873 – 922 , 4 2008 . OpenUrl CrossRef PubMed Web of Science [51]. ↵ R. Ratcliff , P. L. Smith , S. D. Brown , and G. McKoon . Diffusion decision model: Current issues and history . Trends in Cognitive Sciences , 20 ( 4 ): 260 – 281 , 4 2016 . OpenUrl CrossRef PubMed [52]. ↵ M. Schwiedrzik , C. C. Ruff , A. Lazar , F. C. Leitner , W. Singer , and L. Melloni . Untangling perceptual memory: Hysteresis and adaptation map into separate cortical networks . Cerebral Cortex , 24 ( 5 ): 1152 – 1164 , 5 2014 . OpenUrl CrossRef PubMed [53]. ↵ T. C. Sheehan and J. T. Serences . Attractive serial dependence overcomes repulsive neuronal adaptation . PLOS Biology , 20 ( 9 ): e3001711 , 9 2022 . OpenUrl CrossRef PubMed [54]. ↵ St. John-Saaltink , P. Kok , H. C. Lau , and F. P. de Lange . Serial dependence in perceptual decisions is reflected in activity patterns in primary visual cortex . The Journal of Neuroscience , 36 ( 23 ): 6186 – 6192 , 6 2016 . OpenUrl Abstract / FREE Full Text [55]. ↵ J. Taubert , D. Alais , and D. Burr . Different coding strategies for the perception of stable and changeable facial attributes . Scientific Reports , 6 ( 1 ): 32239 , 9 2016 . OpenUrl PubMed [56]. ↵ K. Turbett , R. Palermo , J. Bell , D. A. Hanran-Smith , and L. Jeffery . Serial dependence of facial identity reflects high-level face coding . Vision Research , 182 : 9 – 19 , 5 2021 . OpenUrl CrossRef PubMed [57]. ↵ A. E. Urai and T. H. Donner . Persistent activity in human parietal cortex mediates perceptual choice repetition bias . Nature Communications , 13 ( 1 ): 6015 , 10 2022 . OpenUrl PubMed [58]. ↵ R. van den Berg , H. Shin , W.-C. Chou , R. George , and W. J. Ma . 
Variability in encoding precision accounts for visual short-term memory limitations . Proceedings of the National Academy of Sciences , 109 ( 22 ): 8780 – 8785 , 5 2012 . OpenUrl Abstract / FREE Full Text [59]. ↵ Vickers . Evidence for an accumulator model of psychophysical discrimination . Ergonomics , 13 ( 1 ): 37 – 58 , 4 2007 . OpenUrl [60]. ↵ Y. Xia , A. Y. Leib , and D. Whitney . Serial dependence in the perception of attractiveness . Journal of Vision , 16 ( 15 ): 28 , 12 2016 . OpenUrl CrossRef [61]. ↵ L. K. Yamins and J. J. DiCarlo . Using goal-driven deep learning models to understand sensory cortex . Nature Neuroscience , 19 ( 3 ): 356 – 365 , 3 2016 . OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted August 27, 2025. Download PDF Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following A residual memory trace in an accumulator explains serial dependence Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. 
Share A residual memory trace in an accumulator explains serial dependence Hiroshi Higashi bioRxiv 2025.08.24.671986; doi: https://doi.org/10.1101/2025.08.24.671986 Share This Article: Copy Citation Tools A residual memory trace in an accumulator explains serial dependence Hiroshi Higashi bioRxiv 2025.08.24.671986; doi: https://doi.org/10.1101/2025.08.24.671986 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Animal Behavior and Cognition Subject Areas All Articles Animal Behavior and Cognition (7629) Biochemistry (17660) Bioengineering (13881) Bioinformatics (41911) Biophysics (21436) Cancer Biology (18578) Cell Biology (25482) Clinical Trials (138) Developmental Biology (13371) Ecology (19887) Epidemiology (2067) Evolutionary Biology (24302) Genetics (15599) Genomics (22483) Immunology (17728) Microbiology (40364) Molecular Biology (17163) Neuroscience (88537) Paleontology (666) Pathology (2830) Pharmacology and Toxicology (4821) Physiology (7637) Plant Biology (15129) Scientific Communication and Education (2045) Synthetic Biology (4290) Systems Biology (9817) Zoology (2269)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00