Impact of Task Similarity and Training Regimes on Cognitive Transfer and Interference

doi:10.1101/2025.09.22.677779

Impact of Task Similarity and Training Regimes on Cognitive Transfer and Interference

2025 · doi:10.1101/2025.09.22.677779

preprint OA: gold CC-BY-NC-ND-4.0

📄 Open PDF Full text JSON View at publisher

Full text 66,163 characters · extracted from preprint-html · click to expand

Impact of Task Similarity and Training Regimes on Cognitive Transfer and Interference | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Impact of Task Similarity and Training Regimes on Cognitive Transfer and Interference View ORCID Profile N. Menghi , S. Vigano’ , View ORCID Profile W. J. Johnston , S. Elnagar , View ORCID Profile S. Fusi , F. C. Doeller doi: https://doi.org/10.1101/2025.09.22.677779 N. Menghi 1 Max Planck Institute for Human Cognitive and Brain Sciences, Department of Psychology , Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for N. Menghi For correspondence: menghi{at}cbs.mpg.de S. Vigano’ 1 Max Planck Institute for Human Cognitive and Brain Sciences, Department of Psychology , Germany 2 Center for Mind/Brain Sciences, University of Trento , Rovereto 38068, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site W. J. Johnston 3 Center for Theoretical Neuroscience Columbia University , New York, NY, USA Mortimer B. Zuckerman Mind, Brain and Behavior Institute, Columbia University , New York, NY, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for W. J. Johnston S. Elnagar 1 Max Planck Institute for Human Cognitive and Brain Sciences, Department of Psychology , Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site S. Fusi 3 Center for Theoretical Neuroscience Columbia University , New York, NY, USA Mortimer B. Zuckerman Mind, Brain and Behavior Institute, Columbia University , New York, NY, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for S. Fusi F. C. Doeller 1 Max Planck Institute for Human Cognitive and Brain Sciences, Department of Psychology , Germany 4 Kavli Institute for Systems Neuroscience, Center for Neural Computation, Jebsen Center for Alzheimer’s Disease, Norwegian University of Science and Technology , Trondheim 7491, Norway Find this author on Google Scholar Find this author on PubMed Search for this author on this site Abstract Full Text Info/History Metrics Preview PDF Abstract Learning depends not only on the content of what we learn, but also on how we learn and on how experiences are structured over time. To investigate how task similarity and training regime interact during learning, we trained participants on spatial and conceptual learning tasks that shared either similar or distinct underlying structures, using either interleaved or blocked regimes. Interleaving the two tasks hindered performance when their structures were similar, compared to when they were different. In contrast, blocked training produced the opposite effect: it improved performance and facilitated transfer across similar tasks. This effect, however, emerged only when participants first learned the conceptual task, followed by the spatial task, suggesting an asymmetric interaction between task order and structural similarity. We also replicated our results using a neural network model, providing converging evidence for the computational principles governing the interplay between training regime and structural similarity in multi-task learning. 1 Introduction Unlike machines, humans exhibit an extraordinary capacity for learning and adapting to a wide range of tasks, demonstrating resilience against interference and forgetting. We can effortlessly learn to navigate through vast cities in the United States while retaining our spatial memory and orientation of smaller, irregular towns in Italy. Similarly, we can acquire new languages without forgetting our native tongue. Unraveling the principles of how “continual learning” ( Parisi, Kemker, Part, Kanan, & Wermter, 2019 ; Flesch, Balaguer, Dekker, Nili, & Summerfield, 2018 ; Hadsell, Rao, Rusu, & Pascanu, 2020 ; Kirkpatrick et al., 2017 ; Fusi, 2021 ; Flesch, Saxe, & Summerfield, 2023 ) works is crucial not only for comprehending our own cognitive processes but also for guiding contemporary artificial intelligence research, especially in the face of the “catastrophic forgetting” artificial neural networks suffer from. Despite its significance, however, the precise mechanisms responsible for driving this ability remain unresolved ( Kudithipudi et al., 2022 ). Studies exploring the neurocognitive principles governing the organization and representation of knowledge in humans propose that the brain is equipped with processing principles supporting the extraction of structural regularities from the environment, informing models of the world and guiding decision-making ( Behrens et al., 2018 ; Bellmund, Gärdenfors, Moser, & Doeller, 2018 ; Kaplan, Schuck, & Doeller, 2017 ; Whittington et al., 2020 ). Within this framework, items, concepts, or “states” can be organized in relational maps where their relative positions are determined by a set of relevant features, dimensions, or outcomes ( Shepard & Metzler, 1971 ; Gardenfors, 2004 ; Bellmund et al., 2018 ), and distances in these maps code for similarity, placing similar inputs closer than dissimilar ones ( Viganò, Rubino, Di Soccio, Buiatti, & Piazza, 2021 ; Viganò, Bayramova, Doeller, & Bottini, 2023 ; Theves, Fernandez, & Doeller, 2019 ; Theves, Fernández, & Doeller, 2020 ; Nitsch, Garvert, Bellmund, Schuck, & Doeller, 2024 ; Barnaveli, Viganò, Reznik, Haggard, & Doeller, 2025 ). Extracting these models not only facilitates storage and memorization but also promotes generalization and the transfer of acquired knowledge to similar situations ( Mark, Moran, Parr, Kennerley, & Behrens, 2020 ; Aho, Roads, & Love, 2022 ; Dekker, Otto, & Summerfield, 2022 ). For example, after learning the water and light requirements for one plant in our garden, this information can be easily applied to new exemplars or species that share sufficient similarities, avoiding the need to (re)learn from scratch. Inspired also by intuitions from machine learning (e.g., ( Caruana, 1997 )), prior studies have indeed demonstrated that humans exploit structural similarities between tasks, and that this can enhance knowledge transfer and generalization ( Menghi, Kacar, & Penny, 2021 ; Wu, Schulz, Garvert, Meder, & Schuck, 2020 ; K. Garner, Lynch, & Dux, 2016 ; Holton, Braun, Thompson, Grohn, & Summerfield, 2025 ). Directly comparing humans and machines, Flesch and colleagues (2018) observed that humans, but not machines, benefit from learning different, orthogonal, classification tasks in separated and temporally autocorrelated contexts. This blocked training regime prevented interference between tasks even on later generalization tests, demonstrating humans’ ability to decompose complex tasks into non-interfering subcomponents. According to their perspective, this approach might support continual learning by facilitating participants to create separated and non-overlapping low-dimensional embeddings of the stimulus space, which thus align with the behaviorally relevant orthogonal rules. In other words, a blocked training regime helps to differentiate what needs to be differentiated, efficiently meeting the requirements of a “continual learning” system. Following this logic, one might interpret the factorization/separation proposed by Flesch and colleagues as a mechanism employed by the brain to specifically protect against the interference that very different tasks might produce. In other words, to ensure that the system is not overloaded by contrasting information, contextual dissociation proves beneficial, making a blocked regime favorable for decorrelation/differentiation compared to an interleaved one. If this is the case, then the effect should reverse when the subspaces are not orthogonal but rather similar. In such instances, the system should have better performance when presented with multiple tasks of similar structure in an interleaved fashion, or at least it should remain unchanged: we might get confused if, in our garden, we constantly alternate taking care of plants with very different light or water requirements, but if they all share the same needs, our cost should be highly reduced. In a previous study, we tested the above hypothesis by designing an experiment with two tasks from different domains — spatial and conceptual — each featuring either similar or distinct structures, under an interleaved training regime. Contrary to our expectations, the interleaved regime did not facilitate transfer; instead, it caused significant interference between tasks with similar structures during learning ( Menghi et al., 2025 ). These results highlighted a more complex interplay between task similarities and training regime than previously assumed. To further characterize this interplay, in the current study, we test both human participants and a neural network model under a blocked training regime, and compare the results to those we previously obtained under an interleaved training regime. Specifically, we reuse the same neural network architecture and task design from our prior study ( Menghi et al., 2025 ), but modify the training regime to present tasks in separate blocks rather than in an interleaved fashion. Crucially, our goal is not only to examine the individual effects of task structure similarity and training regime, but to understand how these two factors interact to shape learning dynamics. While prior work has often treated task similarity and training regime as independent variables, their interaction may be key to understanding when generalization is facilitated and when interference occurs. Investigating this interaction will provide insight into the conditions under which shared structure is beneficial versus detrimental, offering a more comprehensive account of how humans and machines build internal representations for continual learning. We predict that participants trained under a blocked regime will perform better during the learning phase compared to those trained interleaved, although this advantage may not persist during the subsequent testing phase (see also ( Flesch et al., 2018 )). Furthermore, we expect both the neural network and participants to transfer knowledge between tasks during blocked training when structures are shared. In our behavioral data, we find evidence of transfer between tasks under blocked training. Interestingly, and in contrast to previous findings ( Wu, Schulz, Garvert, Meder, & Schuck, 2018 ; Wu et al., 2020 ; Lerousseau & Summerfield, 2024 ), this transfer appears to be directional, from conceptual to spatial tasks. We discuss the reason for this unexpected asymmetry in the Discussion. Consistent with our predictions, the neural network simulations also exhibit transfer between blocked consecutive tasks, but only when the tasks share the same underlying structure, reinforcing the idea that structural similarity facilitates generalization under specific training regimes. 2 Results We trained participants to perform an associative learning task across two contexts in either an interleaved regime or a blocked one; data for the interleaved training regime were collected as part of a different experiment (see ( Menghi et al., 2025 )). They had to predict if a seed was going to “grow” or “die” based on two distinct sets of features, where the relevant features were determined by the identity of the seed (See Fig. 1A-B ). Decisions about the first seed relied on what we called the “conceptual features”: participants had to learn the association between configurations of the opacity of a sun and a drop of water images and the outcome (grow or die). Decisions about the second seed relied on “spatial features”: participants had to learn the association between configurations of position in space in which the seed was planted and an outcome (grow or die). The different contexts were cued by two different seeds (See Fig. 1A ). Download figure Open in new tab Figure 1: Stimuli, Task Structures and Trial Structure Panel A Shows the experimental stimuli and cues. Two seeds were used to cue for the two different tasks, spatial and conceptual. In the conceptual task, we used a sun and a water drop symbol as features composing a stimulus configuration. In the spatial task, we used a position (x,y) on a square map as a stimulus. Panel B shows the different structures used. In the conceptual task, each vertical (sun opacity) and horizontal (a drop of water opacity) position can be combined, creating a continuous map, or structure, from which we draw stimuli. In these structures, black colour is associated with the outcome “die” and white colour is associated with the outcome “grow”. The structures of the two tasks were the same in one group and orthogonal in the other group of participants. Panel C shows the different phases of the experiment. In each phase, conceptual and spatial tasks were organized in either an interleaved or a blocked regime. Blocked regimes were further divided into two groups, one starting with the conceptual task, the other with the spatial one. Panel D shows the schematic of a trial structure during the training phase. A fixation cross was shown for 0.5 seconds, and then the seed cueing the task domain appeared for 1 second. Brown seed cued participants to pay attention to the conceptual features and ignore the spatial ones, and vice-versa, the grey seed cued participants to pay attention to the spatial features and ignore the conceptual ones. Afterwards, both spatial and conceptual configurations appeared on screen and stayed there for 2.5 seconds maximum, or until response. This is when participants used a button box to predict if, based on the relevant features presented, the seed was associated with “grow” or “die”. Finally, feedback appeared and stayed on screen for 1 second. Panel E shows the schematic of a trial structure during the testing phase. A fixation cross was shown for 0.5 seconds, and then the seed cueing the task domain appeared for 1 second. Afterwards, spatial and conceptual configurations appeared on screen and stayed there for 2.5 seconds maximum, or until response. Unlike the training phase, no feedback was provided. Participants were randomly assigned to different groups, see table 1 in the methods section for a breakdown of the groups and participants assignments. Half of the participants were assigned to either a “Same structure” (SaSt) or a “Different structure” (DiSt) group, which differed based on the similarity between the feature to outcome mappings (see Fig.1B ). Participants in the SaSt group had the same feature-outcome structure in both contexts, while participants in the DiSt group had a flipped structure across the two contexts ( Fig.1B ). 60 participants were assigned to the interleaved condition and 120 to the blocked condition. Participants in the interleaved group were trained and tested with an interleaved regime: trials from the conceptual and spatial task were sampled randomly (see Fig.1C ). Participants in the blocked group were trained with a blocked regime: 144 trials in one task followed by 144 trials in the other one, followed by a testing session with an interleaved regime. Finally, we divided participants in the blocked condition into two groups, one starting with the spatial task, and one beginning with the conceptual one (see Table 1 for a breakdown of the experimental design). Each participant was first trained via feedback learning (see Fig.1D ), and then tested (see Fig.1E ) during two separate sessions, on the same day, separated by a navigation task that pertained to a different question and will be analysed separately (See Methods). View this table: View inline View popup Download powerpoint Table 1: Subjects and groups Subjects were assigned to either the SaSt/DiSt or to blocked/Interleaved conditions. Numbers between brackets are the number of participants discarded. To assess the effect of task similarity and training regime on representation learning, we divided the analysis into three parts. First, we compared participant accuracies between the interleaved and the blocked group by assessing their learning and generalization performance. Second, we looked at the effect of task similarity and its interaction with the training regime. Finally, we checked if there was a directionality of the effect by looking at the learning performance between participants who either started with the spatial or the conceptual tasks in the blocked training regime. 2.1 Training Regime We operationalized learning accuracy as the proportion of correct responses over all trials in the training and test phases. We then quantified generalization during the test session by computing the proportion of correct responses for novel configurations that, contrary to old ones, were not presented during training. First, we performed two between-subject t-tests to see if general performance during training and test was different between the two training regime groups. We found that participants belonging to the blocked group performed better compared to those in the interleaved regime during both the training phase (t(168) = 6.693, p < 0.001) and test phase (t(168) = 3.488, p < 0.001), as shown in Figure 2 A and B . To look at the difference in performance between old and new stimuli, during the testing phase, we performed a 2x2 mixed-design ANOVA, with training regime as between factor and novelty of stimuli (new or old) as within factor. We found both main effects and the interaction to be statistically significant (Regime: F(1,168) = 14.109, p < 0.001; Novelty: F(1,168) = 204.16, p < 0.001; Interaction: F(1,168) = 16.395, p < 0.001). This indicates that, overall, participants performed better for the old stimuli compared to the new, unseen ones and that they had a better performance when trained with a blocked regime, but that this group difference was mostly led by their performance for the old stimuli, as shown in Figure 2 C . Indeed, despite being numerically different, the performance of the two groups for the new configurations during the test phase did not diverge in a statistically significant way ( p = 0.113), suggesting that generalization happened under both training regimes, as both groups performed above chance (Blocked: p < 0.001; Interleaved: p < 0.001). Download figure Open in new tab Figure 2: General performance and Generalization Panel A shows participants’ mean accuracies during the training blocks and Panel B during test phases. Panel C shows participants’ performance for old and new stimuli during the testing phase. Participants are divided into the different training regimes. All the error bars show standard error of the mean. 2.2 Task Similarity and Training Regime To examine the interaction between training regime and task similarity in more detail, we ran separate analyses for blocked and interleaved regimes, looking at the difference in performance between SaSt and DiSt groups. 2.2.1 Interleaved We performed two between-subject t-tests to see if general performance in the two task similarity groups was different. We found that participants belonging to the DiSt group performed better compared to those in the SaSt group during the training phase (t(52) = 2.908, p = 0.005), as shown in Figure 3 A . Their performance, however, was not statistically different during the test phase (t(52) = 1.426, p = 0.159). We performed two 2x2 mixed-design ANOVAs, with between factor the group and within factor the novelty of the stimuli in the test phase (For a comparison of performance between the two testing sessions, see the supplementary materials). We found a significant main effect of novelty (F(1,52) = 37.141, p < 0.001) and interaction (F(1,52) = 5.240, p = 0.026), indicating that participants performed better with old stimuli compared to new ones, but no group main effect (F(1,52) = 2.497, p = 0.12) (See Figure 3C ). Download figure Open in new tab Figure 3: General performance and Generalization for SaSt and DiSt groups Panel A shows participants’ mean accuracies during the training blocks and Panel B during test phases. Participants are divided into SaSt and DiSt group conditions and into the different training regimes groups. Panel C shows participants’ performance for old and new stimuli during the testing phase. Participants are divided into the different training regimes and into the different training regimes groups. All the error bars show the standard error of the mean. 2.2.2 Blocked We performed two between-subject t-tests to see if general performance in the two task similarity groups was different. We found no differences in performance between DiSt group and the SaSt group during the training phase (t(114) = 0.387, p = 0.699), nor during the testing phase (t(114) = 0.387, p = 0.699) as shown in Figure 3 A and B . We performed two 2x2 mixed-design ANOVAs, with between factor being the group (DiSt Vs SaSt) and within factor the novelty of the stimuli on the test phase. We found only the novelty main effect (F(1,114) = 284.9, p < 0.001) but no significant group effect nor interaction (Task Similarity F(1,114) = 0.346, p = 0.557; Interaction F(1,114) = 2.766, p = 0.099), indicating that participants performed better with old stimuli compared to new ones (See Figure 3C ). 2.3 Directionality of transfer learning in blocked regime Next, we focused our analysis on the blocked group to see whether there is a directionality in the way task similarity influenced transfer during the training phase, specifically when switching from one task to the next. One possibility is that transfer is stronger when switching from a conceptual task to a spatial one, indicating that conceptual representations may support performance in more concrete spatial contexts. Conversely, it could be that transfer is more effective in the opposite direction—from spatial to conceptual—indicating that grounding in (more concrete) spatial representations may scaffold the acquisition of (more abstract) conceptual ones. For the spatial-first group, we compared performance on the conceptual task between the SaSt and DiSt conditions. Similarly, for the conceptual-first group, we compared performance on the spatial task between the SaSt and DiSt conditions. We performed two between-subject t-tests and found that participants in the SaSt performed significantly better in the spatial task for participants starting with the conceptual one (t(56) = 2.162, p = 0.034), but no differences in the conceptual task for participants starting with the spatial one (t(56) = 0.352, p = 0.726). The direction of transfer appears to be asymmetric, with a significant effect when transferring from conceptual to spatial tasks, but not the other way around. 2.4 Artificial neural networks offer insight into the difference in learning performance To investigate how different training regimes influence learning under shared versus distinct task structures, we employed the same neural network architecture used in our previous work( Menghi et al., 2025 ). In the current study, however, the tasks were presented in a blocked fashion rather than interleaved as in the previous study. The networks received input variables specific to each task, along with additional inputs that signaled the context of each trial—analogous to the seed identity cues used in the behavioral experiment (see Methods). Some networks were trained on sequential tasks that shared the same underlying structure across, while others were trained on sequential tasks with different structures. We then assessed the learning speed for both the first and second tasks in the sequence. We first tested the network using input variables assigned to perfectly orthogonal dimensions. We observed no difference in learning speed between networks trained on same-structure and different-structure tasks, for both the first and second tasks ( Figure 5 , panel D, left). This is because, from the network’s perspective, same- and different-structure conditions are indistinguishable: the orthogonality of the input variables prevents any shared representational overlap between the two task contexts, eliminating any potential for transfer or interference. To introduce a representational bias in the network, we manipulated the similarity between task features by representing the different features in the input along semi-orthogonal dimensions ( Figure 5 , panel C, middle), with similarity quantified using the cosine similarity between the vectors defining each feature. For instance, under high feature similarity manipulation, the amount of water in context 1 might be aligned with the x-position of seeds in context 2. This alignment encourages the network to treat different features with different levels of similarity. Networks trained on tasks with higher feature similarity and the same task structure across contexts exhibited faster learning for the second task ( Figure 5 , panel E, middle). This pattern qualitatively mirrors the behavioral effect observed in our participants. Finally, we examined an extreme version of this similarity manipulation in which the network received only two task-relevant features, perfectly aligned across contexts ( Figure 5 , panel C, right). In this scenario, the same-structure task becomes non-contextual: the network—or, by analogy, the participant—can ignore the contextual variable (e.g., seed identity) and still perform the task accurately. In contrast, for the different-structure condition, context remains essential for correct task execution. As a result, networks trained on the same-structure task learned the second task substantially faster than those trained on different-structure tasks ( Figure 5 , panel E, right). Overall, the neural networks revealed that increasing similarity between relevant features enhances learning in tasks with the same underlying structure, which is consistent with our behavioral results. Interestingly, in the intermediate feature similarity regime ( Figure 5 , panels C, D, E, middle), this pattern depends on whether the network was trained in a block or interleaved manner. In particular, blocked training produces faster learning in the same structure condition, while interleaved training produces faster learning in the different structure condition – just as in our human participants. 3 Discussion We investigated how training regime, task similarity, and their interaction influence representation learning. Participants learned two tasks under different training regimes, where stimulus–outcome associations were defined by a low-dimensional manifold that was either shared or distinct across tasks (see Fig. 1 ). Our behavioral analyses revealed that a blocked training regime benefited learning during the training phase (see Fig. 2 ). Although test performance was also higher in the blocked condition, participants performed better on previously encountered configurations than on novel ones, indicating that this advantage was led by improved memorization rather than enhanced generalization. Supporting this, performance on novel stimuli did not differ between training regimes, suggesting no difference in generalization ability. During training, participants exposed to interleaved regime with similar structures showed worse performance compared to participants trained with tasks with different structures, consistent with interference from overlapping representations (see ( Menghi et al., 2025 )). Importantly, this interference effect diminished over time, and group differences disappeared during the testing phase (see Fig. 3 ). Additionally, we observed a directional transfer effect in the blocked condition. Participants who began with the conceptual task and trained on structurally similar tasks performed better on the second, spatial, task compared to those trained on dissimilar structures (see Fig. 4 ). However, no such benefit was observed when participants started with the spatial task, suggesting an asymmetric transfer from conceptual to spatial domains. These results highlight the critical role of both training regime and task structure in shaping representation learning, demonstrating how blocked training can facilitate transfer when task structures align, while interleaved training may lead to interference, particularly when tasks share similarities. Download figure Open in new tab Figure 4: Transfer benefit during training The figure shows participants’ mean accuracies, during blocked training regime, for the second task, which appears in the third and fourth blocks of the study. Participants are divided into SaSt and DiSt groups. Error bars show the standard error of the mean. The neural network model offered additional insight into the nature of the shared representations (see Fig. 5 ). When the two tasks involved orthogonal dimensions, task structure had no impact on the network’s performance—the same and different conditions were functionally indistinguishable from the network’s perspective. In contrast, as the similarity between task dimensions increased, the network learned more efficiently when the task structures were aligned, mirroring the effect observed in human participants. This pattern differed under an interleaved training regime, where the network experienced interference due to overlapping representations, consistent with our previous findings ( Menghi et al., 2025 ). These results highlight an interaction between the training regime and task structure. Our human and network findings align with Holton et al. ( Holton et al., 2025 ), who showed that both biological and artificial learners benefit from shared representations during learning. However, they also revealed the flip side of this effect: reusing existing representations can lead to interference with previously acquired knowledge (See also (K. G. Garner & Dux, 2023 ; Musslick & Cohen, 2021 ). Download figure Open in new tab Figure 5: Blocked training in an RNN with aligned latent variables replicates our behavioral finding. Panel A Schematic of the neural network. There are two latent variables (LVs) relevant to the first context (cLV1 and cLV2), two relevant to the second (sLV1, sLV2), and two variables that signal the context (i.e., the seed identity in the experiment). There is a single hidden layer and one output unit. Panel B The tasks the network is trained to perform in two contexts (conceptual and spatial, left and right). The tasks are a coarser version of the experimental task and also have the same structure and different structure conditions. Panel C Schematic of the three input conditions for the network: (left) the latent variables are all orthogonal to each other; (middle) pairs of latent variables across the two contexts are encoded along semi-orthogonal directions; (right) there are only two, rather than four, total latent variables, and the latent variables across the different contexts are identical in the input to the network. Panel D The learning trajectories across 50 training epochs for each input structure, averaged over n = 50 random initializations of the model parameters. The error bars are the standard error of the mean (SEM), but are smaller than the line width. Panel E The average total difference in learning trajectory across the networks above for orthogonal inputs (left), a range of semi-orthogonal inputs (middle), and identical inputs (right). Each point shows a different initialization of the network. 3.1 Training Regime Our results align with those of Flesch and colleagues (2018) , showing that participants in the blocked regime perform better than those in the interleaved regime. This performance advantage persists into the testing phase. We found that the performance difference during testing is driven by improved memorization of old stimuli rather than by a benefit generalization to new stimuli. The literature on the benefits of different training regimes presents mixed evidence ( Rohrer, Dedrick, & Stershic, 2015 ; Carvalho & Goldstone, 2014 ; Zhou, Singh, Tandoc, & Schapiro, 2023 ). These discrepancies may stem from differences in what is being blocked or interleaved—specifically, whether the manipulation occurs at the level of entire tasks or within a single task at the level of individual stimulus configurations. In our study, tasks were blocked or interleaved, but it is possible that the effect would reverse if the manipulation were applied to the stimuli instead. That is, interleaving different stimulus configurations within a single task—rather than switching between different tasks—might encourage the integration of overlapping features and promote generalization in humans. However, interleaving two tasks might create interference between representations that would otherwise be separated. 3.2 Transfer Learning in blocked training regime Consistent with findings by Wu et al. (2020) and Lerousseau and Summerfield (2024) , we observed a directional transfer effect in the blocked training regime, with performance on the second task influenced by the first. However, the direction of transfer in our study was reversed: whereas previous studies reported transfer from a spatial to a conceptual task, we found transfer from a conceptual to a spatial task. We suggest this discrepancy stems from differences in task nature. Wu et al.’s tasks involved navigation in spatial and conceptual spaces—that is, participants had to search for rewards by systematically exploring options based on two varying features, effectively navigating through a structured space of possibilities. These paradigms are likely grounded in spatial cognition. In such cases, spatial navigation may scaffold conceptual navigation, whereas spatial tasks may rely on more hardwired neural mechanisms hence remain unaffected by prior conceptual navigation. In contrast, our tasks involved classification, arguably more rooted in conceptual processing, as participants had to group stimuli based on abstract feature relationships rather than explore a physical or feature-based layout. This may have enabled knowledge acquired in the conceptual task to support learning in the spatial classification task, but not the reverse. Lerousseau and Summerfield (2024) further showed that their spatial task promoted learning of a low-dimensional rule transferable to a conceptual context. In our case, learning the conceptual rule (e.g., “if light and water levels are similar, the seed grows”) required compressing a two-dimensional feature space into a one-dimensional rule space. Spatial classification, by contrast, may remain intrinsically two-dimensional, hence less generalizable. This asymmetry in representational complexity may account for the reversed direction of transfer observed in our study. 3.3 Cognitive control: Compositionality or Conjunctive Representation Our findings also contribute to the cognitive control literature, which has long debated the nature of task representations, specifically whether they are compositional or conjunctive ( Badre, 2024 ). Compositional representations are built from reusable components that transfer across tasks, enabling flexible behavior but at the cost of increased interference ( Musslick & Cohen, 2019 ; Badre, Bhandari, Keglovits, & Kikumoto, 2021 ; Fusi, Miller, & Rigotti, 2016 ; Schwartenbeck et al., 2023 ; Bakermans, Warren, Whittington, & Behrens, 2025 ; Johnston, Fine, Yoo, Ebitz, & Hayden, 2024 ). In contrast, conjunctive representations bind task elements into task-specific codes, limiting generalizability but protecting from interference ( Kikumoto & Mayr, 2020 ; Duncan, Doll, Daw, & Shohamy, 2018 ; Bhandari, Keglovits, & Badre, 2024 ). The pattern of interference we observed under interleaved training regime, particularly when tasks shared structural similarity, suggests that early in learning, representations may be compositional, allowing shared task features to overlap while being subject to interference. Over time, however, this interference diminishes, pointing toward a shift toward more conjunctive, task-specific representations. This learning-dependent transformation from compositional to conjunctive coding may reflect a mechanism by which the cognitive system balances generalization and interference as task demands and experience evolve (see also ( Kikumoto & Mayr, 2020 ; O’Reilly & Rudy, 2001 ; Franklin & Frank, 2020 ; Boyle, Posani, Irfan, Siegelbaum, & Fusi, 2024 )). 3.4 Consolidation theory and Cognitive Maps: Interference and Transfer A similar dynamic is proposed in consolidation theories, which suggest that there is a critical window in which newly formed memories or knowledge are susceptible to interference from newly learned information ( Lechner, Squire, & Byrne, 1999 ; Robertson, Pascual-Leone, & Miall, 2004 ; Zaki & Cai, 2024 ; Mutanen, Bracco, & Robertson, 2020 ). This period of instability allows the encoding of different knowledge to interact, potentially resulting in transfer and formation of high-level representations ( Robertson, 2012 ; Mosha & Robertson, 2016 ; Robertson, 2018 ). Once knowledge is fully consolidated, transfer becomes less likely ( Mosha & Robertson, 2016 ; Lu, Hummos, & Norman, 2024 ). Our results align with and expand upon this framework. Our study suggests the existence of an additional layer of instability. Participants learning with an interleaved training regime experienced interference between tasks with similar structures, indicating the need for this knowledge to be stabilized. In contrast, participants in the blocked regime, who had more time for training on a single task, demonstrated knowledge transfer when the structures between tasks were similar. We propose a new relationship between the instability of newly learned information and transferability: high levels of instability of knowledge may be associated with interference, whereas some instability is necessary for knowledge transfer between tasks. On the other hand, full stabilization results in neither transfer nor interference ( Mosha & Robertson, 2016 ). Furthermore, our findings provide additional evidence of the brain’s ability to abstract relationships between tasks in different domains into a higher-level representation. This representation is compatible with the concept of an amodal cognitive map—meaning a flexible, domain-general representation of structural relationships across various types of information, independent of the specific sensory or conceptual modalities involved ( Behrens et al., 2018 ). 3.5 Conclusion In conclusion, our study shows that the interaction between training regime and task structure similarity critically shapes representation learning. Participants trained under a blocked regime outperformed those in an interleaved regime during both training and testing. Crucially, when task structures were similar, the blocked regime facilitated knowledge transfer across tasks, though asymmetrically, with transfer occurring from the conceptual to the spatial task but not the reverse. In contrast, the same structural similarity impaired learning under the interleaved regime, where shared representations led to interference and reduced performance. This interference, however, decreased with practice, suggesting partial resolution over time. These findings underscore that similar task structures can either support (transfer) or hinder (interference) learning, depending on the training regime. 4 Methods 4.1 Participants A total of 180 volunteers participated in the experiment (mean age = 28.9, SD = 4.4, 77 identified as males and 103 as females). All the participants were naive to the purpose of the experiment. 60 participants, belonging to interleaved group condition, completed the experiment while we recorded MEG. The remaining 120 participants completed the experiment in the behavioural lab. Data from ten participants were discarded because their performance was below the chance level (56%) in both the spatial and the conceptual tasks. We performed analyses on the remaining 170 participants. All participants gave informed written consent, and the study procedure was approved by the local institutional review board of the University of Leipzig (Ethics Reference Number: 045/22-ek). At the end of the experiment, participants received reimbursement for their participation. 4.2 Apparatus and Stimuli Participants completed the experiments inside a sound-attenuated, dimly lit, and magnetically shielded room. Stimuli were displayed on a monitor with a screen resolution 1920 x 1080 pixels and a refresh rate of 60 Hz using the Psychophysics Toolbox ( http://psychtoolbox.org/ ) ( Brainard, 1997 ) for Matlab (Mathworks). Two images of seeds were used as cues to which kind of task (spatial or conceptual tasks) participants had to do. In the conceptual task, the opacity of a sun and a drop of water images governed the simulated amount of water and light received by the seed. Participants were instructed that greater opacity indicated higher levels of water or sunlight. Literature suggests that lower magnitudes are represented to the left and downward, while higher magnitudes are represented to the right and upward ( Viganò, Bayramova, Doeller, & Bottini, 2024 ; Loetscher, Bockisch, Nicholls, & Brugger, 2010 ; Hesse & Bremmer, 2017 ). The spatial task involved a black dot positioned on a white square, with the vertical and horizontal placements of the dot dictating the virtual planting location for the seed. We sampled a subset of these two dimensional spaces to create the stimuli; see the supplementary materials for a breakdown of all the feature combinations that were used to create the stimuli. 4.2.1 Task Structures We used two different feature-outcome maps, which we refer to as structure (see Fig. 1 ). These structures can be approximated by two different “diagonal” rules, allowing participants to learn the value of different spatial or conceptual combinations without sampling them first. Both task structures were defined using a deterministic mapping where the rounded value of the log-odds of the outcome was a quadratic function of stimulus characteristics, either the opacity of the two images or the position in space. u t here defines all the combinations of the feature of the task at hand. Water and light opacity for the conceptual task, and x and y positions for the spatial task. Flipping the sign of the wd parameter in this mapping produced the two structures depicted in Figure 1 . 4.3 Experimental Design Each participant was trained to do two tasks in either a blocked or an interleaved fashion. In the first task, the conceptual task, they had to learn the association between the opacity of a sun and a drop of water images and an outcome (grow or die); in the second one, they had to learn the association between a position in space and an outcome (grow or die). Importantly, spatial positions did not affect the conceptual task and conceptual features did not affect the spatial one. Participant trained in an interleaved fashion, during both training and test phases were presented with the two tasks interleaved. Participants trained with the blocked design were trained either with the spatial task first or with the conceptual one. Tasks were interleaved during the testing phase. Participants were randomly assigned to either a “Same structure” (SaSt) or a “Different structure” group (DiSt) and to either the blocked or the interleaved design. The features-outcome mappings for the SaSt group were generated using wd = 0.71 for both spatial and conceptual tasks (See previous paragraph and equation 1 ). The features-outcome mappings for the DiSt group were generated using wd = 0.71 for the conceptual task and wd = − 0.71 for the spatial task. 4.4 Procedure The experiment comprises four distinct phases, as illustrated in the C panel of Figure 1 and lasted about 2 hours. Throughout these phases, participants engage in a computerized task where they assume the roles of scientists within a biology laboratory. In this simulated scenario, the laboratory has successfully cultivated two novel plant species, and participants are tasked with acquiring knowledge about the specific environmental conditions required for the successful germination of these plant seeds. 4.4.1 Training As illustrated on the right part of Fig. 1 , during the first phase, the training task, in each trial participants will first be prompted with one of two seeds cueing which task to focus on and then the stimuli appeared and stayed on screen for 2500 ms maximum or until a response was made. Responses were made on a standard button box, one button indicating a prediction of ‘grow’ and another predicting “die”. Responses not given within the required time constitute “missed trials”. Right after the button press feedback was provided, saying “correct” if the prediction was correct, “incorrect” if it was not and “too slow” if they missed the trial (no response within 2500 ms). By making predictions and receiving feedback, participants learned the association between relevant features and the outcome “grow” or “die” as in a classic associative learning task. During the training phase, participants were exposed to 18 different configurations in both spatial and conceptual tasks. Each configuration was repeated 8 times, with a different irrelevant configuration. For example, in the spatial condition, each spatial configuration was paired with 8 conceptual configurations (4 associated with “grow” and 4 with “die”). The total number of trials in the training phase was thus 288 (18 configurations × 8 repetitions x 2 tasks). It’s important to note that some stimuli (i.e., coordinates in the two-dimensional feature spaces) were common between the two contexts, while others were unique to each context, providing a multifaceted learning experience for the participants. 4.4.2 Test During the second phase, the test tasks, we tested participants’ knowledge about the structures learned during the training. We presented old and new stimuli to test for differences in memorization, transfer and generalization. Some of the new stimuli were new in both contexts and some were previously encountered (old) in one context but entirely new in the other context. During the testing phase, participants were exposed to 28 different configurations in both spatial and conceptual tasks. Like during the training session, each configuration was repeated 8 times, with a different irrelevant configuration. For example, in the spatial condition, each spatial configuration was paired with 8 conceptual configurations (4 associated with “grow” and 4 with “die”). The total number of trials in the training phase was thus 896 (28 configurations × 8 repetitions x 2 tasks). This phase is divided into “first testing session” and “second testing session” with 8 repetition each, separated by a navigation task that will be analysed separately. 4.4.3 Navigation The navigation task addresses a distinct question that will be analyzed separately. Here we provide a short description of the task. Participants were presented with one of the two seeds and an expected outcome: “grow” or “die”. Participants were then asked to navigate the appropriate (spatial or conceptual) space, by varying the two features (x and y for the spatial seed, amount of sun and rain for the conceptual seed), locate a position on the map and “plant” the seed according to the outcome requested. Data and Code Availability The code for the neural network was written in python, using TensorFlow and numpy. The code is freely available on https://github.com/wj2/modularity/tree/master . Behavioural data and analyses implemented in Matlab software are available from https://github.com/Nich0Me/ . Acknowledgments We thank Yvonne Wolf-Rosier, Anna Krauspe and Dareen Darwish for their invaluable assistance with participant recruitment and data collection, Kerstin Schumer for her exceptional management of the project. C.F.D.’s research is supported by the Max Planck Society, the European Research Council (ERC-CoG GEOCOG 724836), the Kavli Foundation, the Jebsen Foundation, the Centre of Excellence scheme of the Research Council of Norway—Centre for Neural Computation (223262/F50), The Egil and Pauline Braathen and Fred Kavli Centre for Cortical Microcircuits, and the National Infrastructure scheme of the Research Council of Norway—NORBRAIN (197467/F50). Funder Information Declared European Research Council, https://ror.org/0472cxd90 , ERC-CoG GEOCOG 724836 Kavli Institute , 223262/F50 References ↵ Aho , K. , Roads , B. D. , & Love , B. C. ( 2022 ). System alignment supports cross-domain learning and zero-shot generalisation . Cognition , 227 , 105200 . OpenUrl PubMed ↵ Badre , D. ( 2024 ). Cognitive control . Annual Review of Psychology , 76 . ↵ Badre , D. , Bhandari , A. , Keglovits , H. , & Kikumoto , A. ( 2021 ). The dimensionality of neural representations for control . Current Opinion in Behavioral Sciences , 38 , 20 – 28 . OpenUrl PubMed ↵ Bakermans , J. J. , Warren , J. , Whittington , J. C. , & Behrens , T. E. ( 2025 ). Constructing future behavior in the hippocampal formation through composition and replay . Nature neuroscience , 1 – 12 . ↵ Barnaveli , I. , Viganò , S. , Reznik , D. , Haggard , P. , & Doeller , C. F. ( 2025 ). Hippocampal-entorhinal cognitive maps and cortical motor system represent action plans and their outcomes . Nature Communications , 16 ( 1 ), 4139 . OpenUrl PubMed ↵ Behrens , T. E. , Muller , T. H. , Whittington , J. C. , Mark , S. , Baram , A. B. , Stachenfeld , K. L. , & Kurth-Nelson , Z. ( 2018 ). What is a cognitive map? organizing knowledge for flexible behavior . Neuron , 100 ( 2 ), 490 – 509 . OpenUrl CrossRef PubMed ↵ Bellmund , J. L. , Gärdenfors , P. , Moser , E. I. , & Doeller , C. F. ( 2018 ). Navigating cognition: Spatial codes for human thinking . Science , 362 ( 6415 ), eaat6766 . OpenUrl Abstract / FREE Full Text ↵ Bhandari , A. , Keglovits , H. , & Badre , D. ( 2024 ). Task structure tailors the geometry of neural representations in human lateral prefrontal cortex . bioRxiv . ↵ Boyle , L. M. , Posani , L. , Irfan , S. , Siegelbaum , S. A. , & Fusi , S. ( 2024 ). Tuned geometries of hippocampal representations meet the computational demands of social memory . Neuron , 112 ( 8 ), 1358 – 1371 . OpenUrl CrossRef PubMed ↵ Brainard , D. H. ( 1997 ). The psychophysics toolbox . Spatial Vision , 10 , 433 – 436 . OpenUrl CrossRef PubMed Web of Science ↵ Caruana , R. ( 1997 ). Multitask learning . Machine learning , 28 , 41 – 75 . OpenUrl ↵ Carvalho , P. F. , & Goldstone , R. L. ( 2014 ). Putting category learning in order: Category structure and temporal arrangement affect the benefit of interleaved over blocked study . Memory & cognition , 42 , 481 – 495 . OpenUrl CrossRef PubMed ↵ Dekker , R. B. , Otto , F. , & Summerfield , C. ( 2022 ). Curriculum learning for human compositional generalization . Proceedings of the National Academy of Sciences , 119 ( 41 ), e2205582119 . OpenUrl CrossRef PubMed ↵ Duncan , K. , Doll , B. B. , Daw , N. D. , & Shohamy , D. ( 2018 ). More than the sum of its parts: a role for the hippocampus in configural reinforcement learning . Neuron , 98 ( 3 ), 645 – 657 . OpenUrl CrossRef PubMed ↵ Flesch , T. , Balaguer , J. , Dekker , R. , Nili , H. , & Summerfield , C. ( 2018 ). Comparing continual task learning in minds and machines . Proceedings of the National Academy of Sciences , 115 ( 44 ), E10313 – E10322 . OpenUrl Abstract / FREE Full Text ↵ Flesch , T. , Saxe , A. , & Summerfield , C. ( 2023 ). Continual task learning in natural and artificial agents . Trends in neurosciences , 46 ( 3 ), 199 – 210 . OpenUrl CrossRef PubMed ↵ Franklin , N. T. , & Frank , M. J. ( 2020 ). Generalizing to generalize: Humans flexibly switch between compositional and conjunctive structures during reinforcement learning . PLoS computational biology , 16 ( 4 ), e1007720 . OpenUrl ↵ Fusi , S. ( 2021 ). Memory capacity of neural network models . arXiv preprint arxiv: 2108.07839 . ↵ Fusi , S. , Miller , E. K. , & Rigotti , M. ( 2016 ). Why neurons mix: high dimensionality for higher cognition . Current opinion in neurobiology , 37 , 66 – 74 . OpenUrl CrossRef PubMed ↵ Gardenfors , P. ( 2004 ). Conceptual spaces: The geometry of thought . MIT press . ↵ Garner , K. , Lynch , C. R. , & Dux , P. E. ( 2016 ). Transfer of training benefits requires rules we cannot see (or hear) . Journal of Experimental Psychology: Human Perception and Performance , 42 ( 8 ), 1148 . OpenUrl CrossRef PubMed ↵ Garner , K. G. , & Dux , P. E. ( 2023 ). Knowledge generalization and the costs of multitasking . Nature Reviews Neuroscience , 24 ( 2 ), 98 – 112 . OpenUrl CrossRef PubMed ↵ Hadsell , R. , Rao , D. , Rusu , A. A. , & Pascanu , R. ( 2020 ). Embracing change: Continual learning in deep neural networks . Trends in cognitive sciences , 24 ( 12 ), 1028 – 1040 . OpenUrl CrossRef PubMed ↵ Hesse , P. N. , & Bremmer , F. ( 2017 ). The snarc effect in two dimensions: Evidence for a frontoparallel mental number plane . Vision research , 130 , 85 – 96 . OpenUrl CrossRef PubMed ↵ Holton , E. , Braun , L. , Thompson , J. , Grohn , J. , & Summerfield , C. ( 2025 ). Humans and neural networks show similar patterns of transfer and interference during continual learning . ↵ Johnston , W. J. , Fine , J. M. , Yoo , S. B. M. , Ebitz , R. B. , & Hayden , B. Y. ( 2024 ). Semi-orthogonal subspaces for value mediate a binding and generalization trade-off . Nature Neuroscience , 27 ( 11 ), 2218 – 2230 . OpenUrl CrossRef PubMed ↵ Kaplan , R. , Schuck , N. W. , & Doeller , C. F. ( 2017 ). The role of mental maps in decision-making . Trends in Neurosciences , 40 ( 5 ), 256 – 259 . OpenUrl CrossRef PubMed ↵ Kikumoto , A. , & Mayr , U. ( 2020 ). Conjunctive representations that integrate stimuli, responses, and rules are critical for action selection . Proceedings of the National Academy of Sciences , 117 ( 19 ), 10603 – 10608 . OpenUrl Abstract / FREE Full Text ↵ Kirkpatrick , J. , Pascanu , R. , Rabinowitz , N. , Veness , J. , Desjardins , G. , Rusu , A. A. , … others ( 2017 ). Overcoming catastrophic forgetting in neural networks . Proceedings of the national academy of sciences , 114 ( 13 ), 3521 – 3526 . OpenUrl Abstract / FREE Full Text ↵ Kudithipudi , D. , Aguilar-Simon , M. , Babb , J. , Bazhenov , M. , Blackiston , D. , Bongard , J. , … others ( 2022 ). Biological underpinnings for lifelong learning machines . Nature Machine Intelligence , 4 ( 3 ), 196 – 210 . OpenUrl ↵ Lechner , H. A. , Squire , L. R. , & Byrne , J. H. ( 1999 ). 100 years of consolidation—remembering müller and pilzecker . Learning & memory , 6 ( 2 ), 77 – 87 . OpenUrl FREE Full Text ↵ Lerousseau , J. P. , & Summerfield , C. ( 2024 ). Space as a scaffold for rotational generalisation of abstract concepts . Elife , 13 , RP93636 . OpenUrl PubMed ↵ Loetscher , T. , Bockisch , C. J. , Nicholls , M. E. , & Brugger , P. ( 2010 ). Eye position predicts what number you have in mind . Current Biology , 20 ( 6 ), R264 – R265 . OpenUrl CrossRef PubMed ↵ Lu , Q. , Hummos , A. , & Norman , K. A. ( 2024 ). Episodic memory supports the acquisition of structured task representations . bioRxiv , 2024 – 05 . ↵ Mark , S. , Moran , R. , Parr , T. , Kennerley , S. W. , & Behrens , T. E. ( 2020 ). Transferring structural knowledge across cognitive maps in humans and models . Nature communications , 11 ( 1 ), 4783 . OpenUrl PubMed ↵ Menghi , N. , Johnston , W. , Vigano’ , S. , Hinrichs , M. , Maess , B. , Fusi , S. , & Doeller , C. ( 2025 ). The effects of task similarity during representation learning in brains and neural networks . bioRxiv , 2025 – 01 . ↵ Menghi , N. , Kacar , K. , & Penny , W. ( 2021 ). Multitask learning over shared subspaces . PLoS Computational Biology . ↵ Mosha , N. , & Robertson , E. M. ( 2016 ). Unstable memories create a high-level representation that enables learning transfer . Current Biology , 26 ( 1 ), 100 – 105 . OpenUrl CrossRef PubMed ↵ Musslick , S. , & Cohen , J. D. ( 2019 ). A mechanistic account of constraints on control-dependent processing: Shared representation, conflict and persistence . In Proceedings of the annual meeting of the cognitive science society (Vol. 41 ). ↵ Musslick , S. , & Cohen , J. D. ( 2021 ). Rationalizing constraints on the capacity for cognitive control . Trends in cognitive sciences , 25 ( 9 ), 757 – 775 . OpenUrl CrossRef PubMed ↵ Mutanen , T. P. , Bracco , M. , & Robertson , E. M. ( 2020 ). A common task structure links together the fate of different types of memories . Current Biology , 30 ( 11 ), 2139 – 2145 . OpenUrl PubMed ↵ Nitsch , A. , Garvert , M. M. , Bellmund , J. L. , Schuck , N. W. , & Doeller , C. F. ( 2024 ). Grid-like entorhinal representation of an abstract value space during prospective decision making . Nature Communications , 15 ( 1 ), 1198 . OpenUrl PubMed ↵ O’Reilly , R. C. , & Rudy , J. W. ( 2001 ). Conjunctive representations in learning and memory: principles of cortical and hippocampal function . Psychological review , 108 ( 2 ), 311 . OpenUrl CrossRef PubMed Web of Science ↵ Parisi , G. I. , Kemker , R. , Part , J. L. , Kanan , C. , & Wermter , S. ( 2019 ). Continual lifelong learning with neural networks: A review . Neural networks , 113 , 54 – 71 . OpenUrl CrossRef PubMed ↵ Robertson , E. M. ( 2012 ). New insights in human memory interference and consolidation . Current Biology , 22 ( 2 ), R66 – R71 . OpenUrl CrossRef PubMed ↵ Robertson , E. M. ( 2018 ). Memory instability as a gateway to generalization . PLoS biology , 16 ( 3 ), e2004633 . OpenUrl CrossRef PubMed ↵ Robertson , E. M. , Pascual-Leone , A. , & Miall , R. C. ( 2004 ). Current concepts in procedural consolidation . Nature Reviews Neuroscience , 5 ( 7 ), 576 – 582 . OpenUrl CrossRef PubMed Web of Science ↵ Rohrer , D. , Dedrick , R. F. , & Stershic , S. ( 2015 ). Interleaved practice improves mathematics learning . Journal of Educational Psychology , 107 ( 3 ), 900 . OpenUrl CrossRef ↵ Schwartenbeck , P. , Baram , A. , Liu , Y. , Mark , S. , Muller , T. , Dolan , R. , … Behrens , T. ( 2023 ). Generative replay underlies compositional inference in the hippocampal-prefrontal circuit . Cell , 186 ( 22 ), 4885 – 4897 . OpenUrl CrossRef PubMed ↵ Shepard , R. N. , & Metzler , J. ( 1971 ). Mental rotation of three-dimensional objects . Science , 171 ( 3972 ), 701 – 703 . OpenUrl Abstract / FREE Full Text ↵ Theves , S. , Fernandez , G. , & Doeller , C. F. ( 2019 ). The hippocampus encodes distances in multidimensional feature space . Current Biology , 29 ( 7 ), 1226 – 1231 . OpenUrl CrossRef PubMed ↵ Theves , S. , Fernández , G. , & Doeller , C. F. ( 2020 ). The hippocampus maps concept space, not feature space . Journal of Neuroscience , 40 ( 38 ), 7318 – 7325 . OpenUrl Abstract / FREE Full Text ↵ Viganò , S. , Bayramova , R. , Doeller , C. F. , & Bottini , R. ( 2023 ). Mental search of concepts is supported by egocentric vector representations and restructured grid maps . Nature Communications , 14 ( 1 ), 8132 . OpenUrl PubMed ↵ Viganò , S. , Bayramova , R. , Doeller , C. F. , & Bottini , R. ( 2024 ). Spontaneous eye movements reflect the representational geometries of conceptual spaces . Proceedings of the National Academy of Sciences , 121 ( 17 ), e2403858121 . OpenUrl CrossRef PubMed ↵ Viganò , S. , Rubino , V. , Di Soccio , A. , Buiatti , M. , & Piazza , M. ( 2021 ). Grid-like and distance codes for representing word meaning in the human brain . NeuroImage , 232 , 117876 . OpenUrl CrossRef PubMed ↵ Whittington , J. C. , Muller , T. H. , Mark , S. , Chen , G. , Barry , C. , Burgess , N. , & Behrens , T. E. ( 2020 ). The tolman-eichenbaum machine: unifying space and relational memory through generalization in the hippocampal formation . Cell , 183 ( 5 ), 1249 – 1263 . OpenUrl CrossRef PubMed ↵ Wu , C. M. , Schulz , E. , Garvert , M. M. , Meder , B. , & Schuck , N. W. ( 2018 ). Connecting conceptual and spatial search via a model of generalization . bioRxiv , 258665 . ↵ Wu , C. M. , Schulz , E. , Garvert , M. M. , Meder , B. , & Schuck , N. W. ( 2020 ). Similarities and differences in spatial and non-spatial cognitive maps . PLoS computational biology , 16 ( 9 ), e1008149 . OpenUrl PubMed ↵ Zaki , Y. , & Cai , D. J. ( 2024 ). Memory engram stability and flexibility . Neuropsychopharmacology , 1 – 9 . ↵ Zhou , Z. , Singh , D. , Tandoc , M. C. , & Schapiro , A. C. ( 2023 ). Building integrated representations through interleaved learning . Journal of Experimental Psychology: General , 152 ( 9 ), 2666 . OpenUrl PubMed View the discussion thread. Back to top Previous Next Posted September 22, 2025. Download PDF Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Impact of Task Similarity and Training Regimes on Cognitive Transfer and Interference Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Impact of Task Similarity and Training Regimes on Cognitive Transfer and Interference N. Menghi , S. Vigano’ , W. J. Johnston , S. Elnagar , S. Fusi , F. C. Doeller bioRxiv 2025.09.22.677779; doi: https://doi.org/10.1101/2025.09.22.677779 Share This Article: Copy Citation Tools Impact of Task Similarity and Training Regimes on Cognitive Transfer and Interference N. Menghi , S. Vigano’ , W. J. Johnston , S. Elnagar , S. Fusi , F. C. Doeller bioRxiv 2025.09.22.677779; doi: https://doi.org/10.1101/2025.09.22.677779 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Neuroscience Subject Areas All Articles Animal Behavior and Cognition (7635) Biochemistry (17691) Bioengineering (13892) Bioinformatics (41937) Biophysics (21452) Cancer Biology (18588) Cell Biology (25504) Clinical Trials (138) Developmental Biology (13378) Ecology (19899) Epidemiology (2067) Evolutionary Biology (24320) Genetics (15609) Genomics (22506) Immunology (17736) Microbiology (40394) Molecular Biology (17181) Neuroscience (88605) Paleontology (666) Pathology (2832) Pharmacology and Toxicology (4824) Physiology (7641) Plant Biology (15156) Scientific Communication and Education (2045) Synthetic Biology (4294) Systems Biology (9825) Zoology (2271)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall: last seen: 2026-05-21T05:10:58.409756+00:00

License: CC-BY-NC-ND-4.0