Full text
97,402 characters
· extracted from
preprint-html
· click to expand
Unfolding the Black Box of Recurrent Neural Networks for Path Integration | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Unfolding the Black Box of Recurrent Neural Networks for Path Integration Tianhao Chu , Yuling Wu , Neil Burgess , View ORCID Profile Zilong Ji , Si Wu doi: https://doi.org/10.1101/2025.10.25.684492 Tianhao Chu 1 School of Psychological and Cognitive Sciences, Key Laboratory of Machine Perception (Ministry of Education), Peking University , China Find this author on Google Scholar Find this author on PubMed Search for this author on this site Yuling Wu 2 Peking-Tsinghua Center for Life Sciences, Academy for Advanced Interdisciplinary Studies, Peking University , China Find this author on Google Scholar Find this author on PubMed Search for this author on this site Neil Burgess 3 Institute of Cognitive Neuroscience, Department of Neuroscience, Physiology and Pharmacology, University College London , UK 4 UCL Queen Square Institute of Neurology, University College London , UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site Zilong Ji 1 School of Psychological and Cognitive Sciences, Key Laboratory of Machine Perception (Ministry of Education), Peking University , China 3 Institute of Cognitive Neuroscience, Department of Neuroscience, Physiology and Pharmacology, University College London , UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Zilong Ji Si Wu 1 School of Psychological and Cognitive Sciences, Key Laboratory of Machine Perception (Ministry of Education), Peking University , China 2 Peking-Tsinghua Center for Life Sciences, Academy for Advanced Interdisciplinary Studies, Peking University , China 5 Beijing Key Laboratory of Behavior and Mental Health, IDG/McGovern Institute for Brain Research, Center of Quantitative Biology, Peking University , China Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: siwu{at}pku.edu.cn Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract Path integration is essential for spatial navigation. Experimental studies have identified neural correlates for path integration, but exactly how the neural system accomplishes this computation remains unresolved. Here, we adopt recurrent neural networks (RNNs) trained to perform a path integration task to explore this issue. After training, we borrow neuroscience prior knowledge and methods to unfold the black box of the trained model, including: clarifying neuron types based on their receptive fields, dissecting information flows between neuron groups by pruning their connections, and analyzing internal dynamics of neuron groups using the attractor framework. Intriguingly, we uncover a hierarchical information processing pathway embedded in the RNN model, along which velocity information of an agent is first forwarded to band cells, band and grid cells then coordinate to carry out path integration, and finally grid cells output the agent location. Inspired by the RNN-based study, we construct a neural circuit model, in which band cells form one-dimensional (1D) continuous attractor neural networks (CANNs) and serve as upstream neurons to support downstream grid cells to carry out path integration in the 2D space. Our study challenges the conventional view of considering grid cells as the principal velocity integrator, and supports a neural circuit model with the hierarchy of band and grid cells. Introduction Path integration refers to the process of computing the position of an agent by continuously integrating self-motion information of the agent over time [ 1 ]. It is fundamental for spatial navigation in both humans and rodents, and also plays an important role in robot control [ 2 ]. Experimental studies have shown that grid cells in the medial entorhinal cortex (MEC) are deeply involved in path integration [ 3 ]. These cells exhibit periodic hexagonal firing patterns in the two-dimensional space, providing a metric representation for implementing path integration [ 1 , 4 ]. Disruption of grid cells through medial septal inactivation or entorhinal lesions impairs spatial memory and navigation based on path integration [ 3 , 5 ]. Despite these experimental evidence, exactly how the neural system performs path integration remains largely unknown, and there are unresolved issues. First, in addition to grid cells, experimental data has shown that there exists a rich diversity of spatially modulated cell types in the MEC [ 6 , 7 , 8 , 9 ]. In particular, band cells, found in parasubiculum (an upstream region of MEC), exhibit periodic firing patterns that can be modeled as a superposition of bands, and they are hypothesized to perform path integration in a 1D space [ 9 , 10 ]. However, the functional relationship between grid and band cells remains to be clarified. Second, neural circuit models have been proposed to implement path integration. The conventional models consider only grid cells, and in order to implement 2D path integration, these models either consider a large amount of direction-conjunctive grid cells [ 11 , 12 , 13 ] or assume that the recurrent connections between grid cells are tuned instantly by the velocity signal [ 14 ]. A different model considering the hierarchy of band and grid cells for implementing path integration was proposed [ 15 , 16 ]. The question of which model is biologically more plausible remains debated. Related RNN-based navigated studies Recently, AI approaches have been used to study the association between path integration and grid cells. Specifically, recurrent neural networks (RNNs) were trained to perform spatial navigation to ascertain the involvement of grid cells in path integration, and inconclusive results have been reported so far. In one line of works, it was found that training an RNN based solely on motion velocity in a supervised way (i.e., reconstructing the place cell activity at the given location from pure velocity input) can lead to the emergence of grid-cell-like activity pattern in the RNN, especially under the biological constraints such as non-negative firing rate [ 17 , 18 ]. This result implies that grid cells are associated with path integration. Building on this work, subsequent studies have extended the supervised training paradigm to more unsupervised-guided ones, using objective functions derived from group theory, information efficiency, and actionability, emphasizing the isometric structure, high coding capacity, and integrative functionality of grid cells [ 19 , 14 , 20 ]. These studies have systematically explored the conditions under which grid-like representations emerge in RNNs, examining how the network structure, the training objective, and biological priors jointly shape grid-like representations. In the other line of works, the necessity of grid cells for path integration is challenged. For instance, [ 21 ] demonstrated that grid-like firing patterns can arise as the principal components of place cell activities under the non-negativity constraint, without path integration involved. More recently, [ 22 ] argued that grid cells may emerge from a principle of efficient pattern formation for reconstructing place fields, rather than from the demand of path integration. Supporting this view, ablation studies of trained RNNs have shown that removing velocity inputs to high grid-score units has negligible impact on the path integration performance [ 23 , 24 ]. Overall, current RNN-based studies have primarily focused on exploring the conditions under which grid cells emerge and on the necessity of grid cells for path integration. However, they have not addressed the question of how a trained RNN implements path integration, nor examined the functional role of band cells in this process [ 18 , 25 ]. The internal mechanisms of the trained RNN model thus remain a black box. In this work, we take the same approach of training RNNs to perform path integration, but our goal is different, that is, we aim to unveil the detailed mechanism concealed in the trained RNNs, and from which, to ascertain the neural mechanism of path integration. To achieve this goal, we will borrow neuroscience prior knowledge and methods to unfold the black box of the trained RNNs in much more detail than in previous studies. These include: clarifying neuron types based on their receptive fields, dissecting information flows between neuron groups by pruning their connections, and analyzing internal dynamics of neuron groups in the attractor framework. It turns out that there exists a hierarchical information processing pathway embedded in the RNN model, along which velocity information is first forwarded to band cells, band and grid cells then coordinate to carry out path integration, and finally grid cells output the location of the agent. Inspired by the RNN-based study and previous mechanistic models [ 16 , 26 ], we construct a hierarchical neural circuit model for path integration in the brain, in which band and grid cells form 1D and 2D continuous attractor neural networks (CANNs), respectively, and they coordinate to accomplish path integration. Contemporary models often assume that grid cells are primarily responsible for path integration [ 11 , 12 , 13 ]. Our study challenges this view and suggests that the hierarchy of band and grid cells is necessary. Our model also makes predictions testable in neuroscience experiments. 2 Neuroscience for AI: unfolding the black box 2.1 An RNN model for path integration We adopt a well-established paradigm to train RNNs for path integration [ 17 , 22 ], obtaining the key results as reported here, which are further validated by consistent results from other modeling frameworks (see Supplement Information (SI) E). As illustrated in Fig. 1a , an agent is moving in a square environment with velocity v t ∈ R 2 . Mimicking place cells’ position encoding in the neural system, the agent’s location x t is represented by a bump vector in the 2D space centered at x t , with N p the number of place cells. The task of path integration is formulated as: given the initial location x 0 of the agent, the RNN model infers its subsequent positions x 1: T by using only the self-motion information of the agent, i.e., the sequence of velocity vectors v 0: T − 1 ; no other position cue is available. Within the conceptual framework of the MEC-HPC loop, the model’s information flow can be interpreted as follows: the initial state of the RNN (representing a nascent MEC population) is set by a projection from the place cell population (representing hippocampus, HPC), i.e., r 0 = M 0 p 0 , where p 0 corresponds to the initial location x 0 and the matrix , with N R the number of neurons in the RNN ( Fig. 1b ). This initialization embodies a critical HPC → MEC projection signal that anchors the path-integration process to an environmental cue. Download figure Open in new tab Figure 1. (a) Illustration of the path integration task. (b) The structure of the RNN model. (c) Examples of band cell, grid cell and undefined cell found in MEC (middle panel, adapted from [ 9 ]) and in the trained RNN (right panel). At each time step, the RNN receives the agent’s instantaneous velocity signal v t and updates its internal state following the recurrent dynamics, which is written as, where is the recurrent connection matrix between neurons in the RNN, the matrix , and σ ( · ) is the ReLU function, enforcing non-negative firing rates of neurons. At each time step, the agent’s location is read out by, where the read-out matrix . The free parameters of a RNN, including J, M, W , and M 0 , are optimized using BPTT through minimizing the cross-entropy loss between the network outputs and the ground truth p t for all time steps t = 1, …, T and for all randomly generated motion trajectories. The details of the model training and fixed parameters are given in SI A. The trained RNN model effectively implements path integration, with quantitative results (SI D) indicating that it achieved competent performance on the task. 2.2 Interpreting the trained RNN model with neuroscience It is straightforward to train the RNN model well to achieve a good path integration performance, but unveiling the underlying computational mechanism is challenging, which is known as the black box problem of AI-trained models. Without prior knowledge, we have no clue to interpret the data. Here, we borrow neuroscience prior knowledge and methods to unfold the black box. 2.2.1 Clarifying neuron types Our first step is to clarify neuron types in the trained RNN based on their receptive fields. Following the common practice in neuroscience, we first compute the spatial tuning maps of neurons in the trained RNN. Specifically, we consider that the agent performs random walks in the environment, covering the whole arena, and the corresponding velocity signals are used as inputs to stimulate neuronal responses in the RNN. We record the activities of each neuron at all locations, which gives a 2D heatmap for each neuron, reflecting their spatial tuning characteristics. Inspired by the spatial tuning properties of grid and band cells observed in the neural system, we search for analogous unit types in the trained RNN. To classify neuron types quantitatively, we adopt established criteria from neuroscience (see SI B). We have identified three mutually exclusive types based on neuronal receptive fields ( Fig. 1c , right panel), which are: 1) Grid cell, which exhibits the hexagonally patterned firing field; 2) Band cell, whose receptive field consists of multiple equally spaced parallel lines (the so-called bands) (see more details below); and 3) Undefined cell, which displays neither grid-like nor band-like spatial tuning. All three cell types emerge robustly in the trained RNNs (see SI E). For example, in one trained RNN with N R = 4096 units, we identify 764 grid cells, 764 band cells, and 2568 undefined cells). 2.2.2 Dissecting information flows between neuron groups After identifying neuron groups, we further investigate how information is propagated between them by applying pruning studies. We carry out four step-by-step pruning operations (see SI C), with each of them building upon the previous one and aiming to probe one aspect of path integration. See SI E for reproducibility results. Step 1: Pruning velocity inputs To identify which cell types are primarily responsible for receiving and processing velocity inputs, we selectively prune the afferent velocity inputs to each cell group one-by-one ( Fig. 2a , upper panel). We find that pruning velocity inputs to band cells leads to a significant increase in the path integration error, while pruning velocity inputs to other groups has little effect ( Fig. 2a , lower panel). This indicates that the velocity information is predominantly processed by band cells, and we remove velocity inputs to other cell types in the followed pruning. Download figure Open in new tab Figure 2. Results of pruning the RNN model. Four pruning operations are carried out step-by-step, with each step building upon the previous one. Upper panels: (a) Pruning velocity inputs to each cell group one-by-one; (b) Pruning read-out connections from each cell group one-by-one; (c) Pruning each cell type one-by-one; (d) Pruning the connections from band to grid and the connections from grid to band cells, respectively. Lower panels: Path integration error vs. the number of connections/cells pruned in each step. The path integration error is measured by the standard division of location prediction errors divided by the arena size. For calculation details, see SI C, E. Step 2: Pruning read-out connections To identify which cell types are primarily responsible for outputting the path integration result, we selectively prune the read-out connections from each cell group one-by-one ( Fig. 2b , upper panel), and find that pruning the read-out connections from grid cells have the largest effect on increasing the path integration error ( Fig. 2b , lower panel). This indicates that grid cells are predominately responsible for outputting the path integration result, and we remove the read-out connections from other cell types in the followed pruning. Step 3: Pruning cell types To evaluate the relative contributions of different cell types on path integration, we compare the model performances after pruning one of them in equal numbers ( Fig. 2c , upper panel). We find that pruning band or grid cells causes a substantial drop in the model performance, whereas pruning undefined cells has a much less effect ( Fig. 2c , lower panel). This suggests that band and grid cells play much more important roles than undefined cells in path integration, and we remove them in the followed pruning. Step 4: Pruning connections between band and grid cells To probe the functional relationship between band and grid cells in path integration, we separately prune the connections from band to grid cells and the connections from grid to band cells ( Fig. 2d , upper panel). We find that pruning either type of connections has a big impact on the model performance ( Fig. 2d , lower panel), indicating that the bidirectional, cooperative interactions between two cell types are critical for path integration. 2.3 A hierarchical path integration pathway embedded in the RNN Combining pruning results while discarding less relevant components, we identify a hierarchical path integration pathway embedded in the trained RNN ( Fig. 3a ), along which velocity information is first received and processed by band cells; band and grid cells then interact via reciprocal connections to integrate movement information; finally grid cells output the agent location in the 2D space. Download figure Open in new tab Figure 3. (a) The hierarchical path integration pathway embedded in trained RNNs. (b) A new RNN model taking the hierarchical pathway as a prior. (c) Neuron types found in the newly trained RNN. (d) An RNN model for a location reconstruction task. For simulation details, see SI C. It is surprising that such a well-organized pathway naturally emerges in training a RNN for a path integration task. To further validate that this hierarchical pathway constitutes the functional core structure, we conduct two additional experiments. In one experiment, we construct a new RNN model which takes the hierarchical pathway as a prior ( Fig. 3b ), that is, the first module receives velocity inputs, intending to play the role of band cells; the second module outputs the agent location, intending to play the role of grid cells; the two modules are reciprocally connected, intending to mimic the interactions between band and grid cells. We train this new model with the same path integration task and have two key observations as expected, which are: 1) the new model achieves a performance comparable to the original model; 2) band and grid cells emerge naturally as the dominant neuron types in the first and second modules, respectively ( Fig. 3c ). In the other experiment, we change the task from path integration to pure location reconstruction ( Fig. 3d ), i.e., the RNN receives the agent’s location inputs and reconstruct them; no velocity information is available. After training the RNN with the new task, we observe only grid cells without band cells (see SI C), indicating the necessity of path integration for the emergence of band cells. Together, these two additional experiments further reinforce our finding that the hierarchical pathway, characterized by the hierarchy of band and grid cells, and their reciprocal interactions, is the core structure for path integration. 2.3.1 Continuous attractor dynamics of band cells We now delve deeper into the internal structure and dynamics of band cells in the trained RNN. Fig. 4a displays the receptive field of an idealized band cell, which consists of multiple equally spaced parallel lines (bands), on which the cell’s response is invariant. A band cell can be characterized by three parameters: 1) spacing λ , which is the distance between adjacent bands; 2) orientation θ , which is the orientation of bands in the 2D space; 3) phase ϕ , which defines the positional separation between band cells having the same spacing and orientation. Denote Δ ∈ ( −λ/ 2, λ/ 2) the offset between the adjacent bands of two band cells, their phase difference is given by ϕ = (Δ /λ ) × π ∈ ( −π, π ). Download figure Open in new tab Figure 4. Properties of band cells in the trained RNN. (a) Illustration of the receptive field of an idealized band cells. Left panel: the receptive field consists of parallel bands, which are equally spaced with spacing λ and have the same orientation θ . Right panel: the positional separation between two band cells having the same spacing and orientation (blue and yellow) is quantified by a phase ϕ , whose value is given by ϕ = (Δ /λ ) × 2 π , with Δ the offset between the adjacent bands of two band cells. (b) Band cells in the trained RNN are grouped into four clusters according to their spacing λ and orientation θ . (c) An example band cell with direction-tuning at π . (d) Distribution of directional scores (a measurement of the direction-tuning level) of band cells in an example cluster. (e) Histograms of preferred directions of band cells in two example clusters, which have a bimodal shape peaked at either the cluster orientation θ or its opposite direction θ + π . (f) A 3D isomap embedding of the population activities of band cells in an example group with the same spacing and direction tuning. Coloured by time steps 5–20 of 200 trajectories. (g) The averaged connection profile of band cells as a function of their phase difference. For detail calculations, see SI B. First, we inspect the clustering property of band cells in the trained RNN. Using Fourier analysis, we extract the dominant spatial frequency of the receptive field of each band cell and obtain the cell’s spacing and orientation (see SI B for details). We find that band cells can be grouped into four well-separated clusters based on their spacing and orientation ( Fig. 4b ). For each cluster, we further differentiate cells’ direction-tuning by calculating how the averaged response of a band cell varies with motion direction of the agent. Interestingly, we find that in each cluster, the majority of band cells exhibit clear direction-tuning ( Fig. 4c-d ), and they constitute two sub-groups with preferred directions along either the cluster orientation θ or its opposite θ + π ( Fig. 4e ). Second, inspired by recent successes in modeling spatially tuned neurons in the hippocampal-entorhinal system using Continuous Attractor Neural Networks (CANNs) [ 27 , 28 , 29 , 11 ], we set out to investigate whether the low-dimensional manifold of neural activity and its underlying connectivity conform to CANN principles. Second, to uncover the latent structure and dynamics of band cells in each group having the same spacing and direction-tuni ng, we performed dimensionality reduction dimensionality reduction analysis (Isomap, details shown in SI B) on the activity trajectories of the group during path integration. Strikingly, we observed that the low-dimensional embedding of neural trajectories in each group forms a continuous ring ( Fig. 4f ), consistent with the dynamics of a 1D CANN with periodicity. We also inspected the recurrent connectivity pattern between band cells, looking for the signature of the CANN structure. For each band cell group having the same spacing and direction-tuning, we calculated the averaged connection weights between cell pairs as a function of their phase differences. The result shows that the connectivity profile exhibits an approximately symmetric shape with weight decreasing with phase difference ( Fig. 4g ), reminiscent of the center-surround connection pattern in a 1D CANN [ 30 ]. In summary, the above study reveals that band cells in the trained RNN constitute modules of different spacing and direction-tuning, and each module displays the 1D CANN-like structure and dynamics. 3 AI for neuroscience: the neural mechanism for path integration The above RNN-based navigation study also gives us insight into the path integration mechanism in the neural system. Band cells were reported in a neuroscience experiment [ 9 ], and an early computational model [ 15 , 16 ] (in which band cells were called Velocity-Controled-Oscillator (VCO)) was also proposed, which considered that band cells are responsible for 1D path integration, and multiple modules of band cells of different orientations jointly support grid cells to execute path integration in the 2D space. Our RNN-based study tends to support this view, and challenges the conventional models of relying only on grid cells for path integration. 3.1 A neural circuit model for path integration Inspired by the findings in the trained RNN, we construct a neural circuit model for path integration. It has the similar idea as that in [ 15 , 16 ], but have different mathematical formulations. In the below, we introduce the main structure of the model, with details presented in SI F. 3.1.1 The modules of band cells Motivated by the properties of band cells found in the trained RNN and the 1D head-direction system in Drosophila [ 31 , 32 ], we propose a theoretical model for band cells. Specifically, we consider that band cells are clustered into multiple modules with varying spacing λ and orientation θ . Each module consists of three sub-populations ( Fig. 5a ), which are: 1) pure band cells, 2) direction-conjunctive band cells v + , and 3) direction-conjunctive band cells v − , and they are aligned on a 1D manifold according to their preferred phases ϕ ∈ ( −π, π ]. Each module of band cells implements path integration in a 1D direction, along either the module orientation v + = θ or the opposite direction v − = θ + π . Download figure Open in new tab Figure 5. A neural circuit model for path integration. (a) The structure of a band cell module, which consists of three sub-populations: pure band cells, direction-conjunctive band cells v + , and direction-conjunctive band cells v − . A band cell module performs 1D path integration in the form of continuous attractor dynamics, along either the module orientation v + = θ or the opposite direction v − = θ + π . (b) Two band cells modules with different orientations support the grid cell module of the 2D CANN structure to accomplish path integration in the 2D space. (c) Examples of band and grid cells in the neural circuit model. (d) Inferred trajectory of the neural circuit model closely matches the ground-truth trajectory, demonstrating the path integration capability of the model. The pure band cell population forms a 1D CANN, whose dynamics is given by, where u b ( ϕ, t ) and r b ( ϕ, t ) denote the synaptic input and firing rate of pure band cells at ϕ , respectively. J b ( ϕ, ϕ ′ ) denotes the recurrent connections between band cells, and W m , with m = ±, denotes the connections from direction-conjunctive cells v m to pure band cells. I g denotes the input from grid cells (to be defined below). The firing rate of pure band cells is given by , with k b regulating the global inhibitory strength to ensure a stable bump activity of band cells. Conjunctive band cells v ± receive excitatory inputs from pure band cells and are tuned by the moving direction of the agent, whose dynamics are written as, where u ± ( ϕ, t ) and r ± ( ϕ, t ) denote the synaptic input and firing rate of conjunctive cells at phase ϕ , respectively. w b denotes the connection from pure band to conjunctive cells at the same phase. k = (sin θ/λ , cos θ/λ ) denotes a module-specific vector, and the projection of the agent velocity v ( t ) on it, v ( t ) · k , defines the moving speed of the agent along the orientation θ. g 0 is a baseline constant. [·] + denotes rectification. Eq.5 reflects that the firing rates of conjunctive cells contain the projected 1D speed information of the agent along the module orientation [ 31 ]. Importantly, we set the recurrent connections between pure band cells to be symmetric and translation-invariant, i.e., , while the connections from conjunctive cells to pure band cells are offset with a constant value δ , i.e., . Together, three populations of band cells in a module achieve 1D path integration along the module orientation [ 31 ]. 3.1.2 The module of grid cells A single band cell module supports path integration in two directions θ and θ + π . To realize 2D path integration, grid cells integrate the outputs of band cell modules of different orientations. With loss of generality, we consider only two band cell modules in the present study ( Fig. 5b ). The orientations of two modules are denoted as θ 1 and θ 2 , respectively, and they are 60 ? apart. Grid cells are aligned on a 2D toroidal manifold with a phase vector ϕ = ( ϕ 1 , ϕ 1 ). They form a 2D CANN with dynamics given by, [where u g ( ϕ, t ) and r g ( ϕ, t ) are the synaptic input and firing rate of grid cells at phase ϕ . The recurrent connections between grid cells are symmetric and translation-invariant, i.e., , with || · || g denotes circular distance on the torus and σ g controlling the bump activity size. The firing rate of grid cells also follows divisive normalization, i.e., . I 1 ( ϕ 1 , t ) and I 2 ( ϕ 2 , t ) represent the inputs from two band cell modules having orientations θ 1 and θ 2 , respectively (to be defined below). 3.1.3 Interactions between band and grid cells We set the reciprocal connections between band and grid cells to be symmetric, which are written as, where k = 1, 2 indexes the band cell module. Thus, the inputs from grid cells to each band cell module are given by, and the inputs from each band module to grid cells are given by The forward connections from band to grid cells enable the grid cell module to integrate 1D motion trajectories into 2D, while the feedback connections from grid to band cells enable the circuit to amend errors. They jointly support accurate path integration in the 2D space. 3.2 Simulation results We carry out simulations to test the performance of the neural circuit model (for details, see SI F). We observe that band and grid cells of varying spacings and orientations appear in the hand-designed model ( Fig. 5c ). The moving trajectory inferred by the model agrees well with ground truth, demonstrating the path integration capacity of the model ( Fig. 5d ). It should be noted that the path integration capability demonstrated here builds upon well-established computational frameworks [ 11 , 31 ], and thus we do not perform additional tests on its robustness in this regard. Furthermore, the absence of accumulated error in this simulation is due to the idealized setting where neither input signals nor the model contain any random noise. In more realistic scenarios where noise is present, small errors would accumulate over time, leading to gradual drift in the estimated position; corresponding results under noisy conditions are provided in SI F. 4 Discussion In the present study, by using neuroscience prior knowledge and methods, we unfold the black box of RNNs trained to perform a path integration task, and we identify a hierarchical path integration pathway embedded in trained RNNs. Using a combination of analyses (neuron type classification, connection pruning, attractor dynamics inspection et al.), we uncover that along this hierarchical pathway, velocity information of an agent is first conveyed to band cells, band and grid cells then coordinate to carry out path integration, and finally grid cells output the agent location. Furthermore, we reveal that band cells form multiple modules of varying spacing and orientation, and each module constitutes a 1D CANN-like structure. Inspired by the RNN-based study and other neuroscience evidence, we formulate a neural circuit model for path integration. In this model, band cells form multiple functional modules in the form of 1D CANNs, and each of them is responsible for path integration along the module orientation; grid cells form a 2D CANN, which integrates the 1D results of band cell modules to carry out 2D path integration and meanwhile provides feedback to band cells to correct errors. We demonstrate that this computational model works well. Related neural circuit models Previous neural circuit models for path integration based only on grid cells require a large amount of direction-conjunctive grid cells, whereby these conjunctive cells receive velocity inputs and shift the activity of the downstream pure grid cells along the same direction to perform location updating [ 11 ]. Compared to this model, which requires N 2 pure grid cells and at least 4 N 2 conjunctive grid cells to represent four allocentric directions (north, south, east, and west), the hierarchical model we propose requires only 2 N pure band cells, 4 N conjunctive band cells (2 N per each module), and N 2 grid cells. Thus, the total number of neurons required to perform path integration is significantly reduced from 5 N 2 to 6 N + N 2 , without sacrificing the performance. This computational efficiency offers new insight for the advantage of employing the combination of band and grid cells. To reduce the neuron number, another neural circuit model based only on grid cells considers that the recurrent connection weights between grid cells are velocity-dependent [ 14 ]. This requires that neuronal connections are instantly tuned by the agent’ velocity and is hence unlikely biologically feasible. Our neural circuit model has the similar structure as that in [ 15 , 16 ], but has different mathematical formulations. Model predictions This body of work also generates predictions testable in experiments, including: 1) band cells should be organized into clusters based on their orientation and spacing in the brain, analogous to the way grid cells are organized along the dorsal-ventral axis in MEC [ 33 ]; 2) band cells in the same module should further be organized into attractor networks, similar to head-direction cells in the thalamic nuclei and postsubiculum [ 34 ]; 3) disruption of band cells should lead to deficits in path integration in downstream grid cells, potentially offering insights into the mechanisms underlying navigation impairments observed in the early stages of Alzheimer’s disease [ 35 ]. Investigating these computationally derived predictions using experiments will not only prompt a re-evaluation of the functional role of grid cells in providing a spatial metric for the environment, but also advance our understanding of the computational contribution of band cells in neural circuits. Limitation and future works Several important aspects remain to be explored in future studies. For example, it is not fully clear whether undefined cells in the trained RNN hold certain spatial tuning properties, such as those seen in head direction cells [ 36 ] or boundary vector cells [ 37 ], and whether they play a role in path integration; and if so, at which point along the hierarchical pathway they contribute. Additionally, the nature of interactions between band and grid cells in the trained RNN remains not fully solved, and it needs to be inspected more thoroughly whether these interactions correspond directly to the connectivity profile in our proposed mechanistic neural model. Finally, the current training paradigm is restricted to path integration in physical space. It will be valuable to explore whether this framework is generalizable to path integration in abstract spaces (e.g., social network, value space in decision making) and whether the same hierarchical pathway is preserved [ 38 ]. Cross-talk between AI and neuroscience AI approaches are a powerful tool to train network models for executing tasks, but they also face the challenge that the trained networks are often hard to interpret. Without prior knowledge, one has no cue to open up the black box. Here, we demonstrate that by using neuroscience prior knowledge and methods, we can uncover the detailed hierarchical pathway embedded in the trained RNNs for path integration. On the other hand, the RNN-based findings can advance our understanding of the neural circuit mechanism underlying path integration in the brain. This study presents an example of using cross-field knowledge to facilitate AI interpretation and neuroscience research. A Training details of RNN To train RNNs on path integration tasks, we implemente an established computational framework adapted from the open-source repository developed by Ganguli Lab ( https://github.com/ganguli-lab/grid-pattern-formation ). Code used for this paper is publicly available at https://github.com/yuling-wu/band_grid_hierarchy . Vanilla RNN architectures are trained using the hyperparameters specified in Table S1 . Our weight matrices are initialized randomly using PyTorch’s default scheme and there are no hand-crafted or localized initialization tricks. The trajectory used to train each iteration or test is sampled randomly from a distribution. The training loss is presented in Fig. S1 . Download figure Open in new tab Figure S1. Training loss for the vanilla RNN. Place cell activity The receptive field centers of place cells are randomly distributed across the square environment. Each place cell’s firing activity is modeled using a difference-of-softmax tuning curve, analogous to the difference-of-Gaussians function: where x is the current location of the agent, c i denotes the center of the i th place cell’s receptive field, and σ 1 and σ 2 parameterize the width of the center and surround, respectively. The network received velocity inputs derived from the simulated trajectory and was trained to produce the simulated place cell activities as output. Path integration error Locations of the agent are decoded from the place cell activities by considering three maximally active place cells and averaging the x and y coordinates of their place field centers. We quantified decoding accuracy using the mean Euclidean distance between the decoded positions and ground truth locations: where ( x i , y i ) denotes the true position and represents the decoded position for the i-th sample. B Using neuroscience knowledge to analyse RNN B.1 Rate map construction Rate mapping—a fundamental technique in systems neuroscience—quantifies how neuronal firing rates vary with spatial location, providing crucial insights into neural representations of space. When applied to RNNs trained on path integration, this approach has revealed the spontaneous emergence of functionally specialized units analogous to biological grid cells, and band cells observed in biological navigation systems. To do this, we generate a test batch ( n = 200 trajectories) as inputs to the RNN and record the activation states of all recurrent layer units, the agent’s current position and head direction at each step. To construct spatial rate maps, we partition the environment into an m × m grid, resulting in m 2 spatial bins, and compute the mean activation for each unit within each bin. Here we set m = 20 to compute a set of low resolution maps to use for evaluating grid score and set m = 50 to compute a set of high resolution maps to plot the resulting tuning curves and visualize the spatial firing patterns. To construct angular activation profiles, we partition the head direction ranging from − π to π into 100 bins, and compute the mean activation for each unit within each bin. B.2 Neuron type classification Band cell Ideal band cells exhibit a defining electrophysiological signature characterized by spatially periodic firing fields that form bands across the environment [ 9 ]. To quantify this, we developed a spectral analysis method. We first compute the 2D Fourier transform of the spatial rate map, suppressing negative frequencies. The resulting power spectrum is fitted with a 2D Gaussian model parameterized by amplitude (A), spatial frequency (k), orientation angle ( θ ), and bandwidth ( σ ) using constrained nonlinear optimization. The band score is calculated as the normalized correlation between the actual spectral power distribution and the Gaussian model, weighted by σ : where: F is the spectral power matrix obtained from the 2D Fourier transform of the rate map: with negative frequencies suppressed ( F ( u, v ) = 0 for ) G is the fitted 2D Gaussian model: Parameters are optimized via: subject to k ∈ [0.2, 1], ϕ ∈ [0, π ], σ ∈ [0.05, 0.5] The spatial frequency components are derived as: where Δ x is the spatial bin size. Band score distribution is show in Fig. S2a and cells with a band score of over 5.8 are classified as band cells. Example band cells are shown in Fig. S2b . Download figure Open in new tab Figure S2. (a) Band score distribution. (b) The top 128 band cells with the highest scores. Grid cell Ideal grid cells exhibit a defining electrophysiological signature characterized by spatially periodic firing fields that form a hexagonal lattice tessellation across the environment [ 4 ]. Grid score was quantified through a rotational analysis of the autocorrelogram derived from the spatial rate map. Specifically, the autocorrelogram underwent circular rotations in 30° increments, followed by computation of Pearson correlations between each rotated version and the original map. The final grid score metric was calculated as: where ρ ( θ ) represents the correlation coefficient after θ -degree rotation. This measure captures the hexagonal periodicity signature by comparing correlations at the theoretical peaks (60° and 120°) versus troughs (30°, 90°, and 150°) of an ideal grid pattern. Finally, cells with a grid score of over 0.88 are classified as grid cells. Undefined cell Any cells that are neither band nor grid cells are classified as undefined cells. B.3 Properties of band cells tuning Spatial tuning To quantitatively characterize band cell activity patterns, we derive three key spatial parameters from the spatial rate maps: Spacing λ , the distance between adjacent bands, calculated by , where k x and k y are the same as in Eq.16; Orientation θ , the orientation of bands in the 2D space, computed through the following spectral analysis procedure: where θ ( ω ) = tan − 1 ( f y /f x ) is the orientation of frequency component ω (constrained to [0, π ]), P ( ω ) is the spectral power at frequency ω , the angle(·) handles the π -periodicity of band patterns, the π − (·) − π/ 2 sequence performs the requested axis transformation, and the modulo π operation ensures angular continuity; Phase ϕ , the positional separation between band cells having the same spacing and orientation. Denote Δ ∈ ( −λ/ 2, λ/ 2) the offset between the adjacent bands of two band cells, their phase difference is given by ϕ = (Δ /λ ) × π ∈ ( −π, π ). As illustrated in Fig. S3a , the connection weight of band cells varies with their phase difference, reminiscent to the center-surround connection pattern. Download figure Open in new tab Figure S3. (a) The averaged connection profile of band cells as a function of their phase difference. In figures a and c, colors indicate distinct band cell clusters, and each cluster has the same spacing and orientation. (b) Example band cells with opposite preferred direction. (c) Histograms of preferred directions of band cells in three clusters, which have a bimodal shape peaked at either the cluster orientation θ or its opposite direction θ + π . (d) 3D isomap embedding population activity from a band cell cluster. Directional tuning To quantitatively characterize band cell direction, we calculate two parameters from the angular activation profiles: The direction score quantifies directional tuning by fitting angular activation patterns y i ( ψ ) with a circular Gaussian function: where d ( ψ, µ ) = min(| ψ − µ |, 2 π −| ψ − µ |) is the circular distance between angle ϕ and preferred direction µ , and σ determines tuning width. Parameters ( A, µ, σ ) are estimated via nonlinear least-squares fitting initialized at [1, 0, 1]. The direction score is computed as the normalized projection between observed ( y data ) and fitted ( y model ) activation patterns: The preferred direction ξ i ∈ [− π, π ) for each band cell i is derived from its angular activation profile y i ( ψ k ) through circular moment analysis, computed as: where ψ k = − π + 2 πk/N ψ ( k = 0, …, N ψ − 1) defines N ψ equally spaced angular bins, represents the unit vector in complex space, and arg(·) extracts the phase of the resultant vector. We find that, for each cluster with the same spacing and direction tuning, the majority of band cells form two subgroups with opposite preferred directions ( Fig. S3b-c ). B.4 Population activity analysis Neural population dynamics were analyzed using the following pipeline: Data extraction : A test batch ( n = 200 trajectories) was generated as inputs to the RNN to generate the network’s corresponding latent representations. Then neuron subset X raw was extracted (shape: T × N , where T is timepoints and N is neurons to be analyzed). Preprocessing : Neural activity was standardized using z-score normalization: Dimensionality reduction : – PCA projected data to 15 principal components – Isomap further reduced to 3D ( k = 8 neighbors, geodesic distance metric) Visualization : The 3D neural manifold was plotted against animal trajectory (5-frame offset corrected) using time-indexed coloring (viridis colormap). Fig. S3d displays an alternative Isomap embedding for a distinct band cell group not analyzed in the main text. C Dissecting information flows in RNN C.1 Pruning experiments To systematically investigate the computational roles of recurrent layer units in path integration, we performed four distinct pruning experiments with rigorous controls: Pruning velocity inputs : For each pruning level n ∈ {1, …, 700}, we randomly selecte n units across cell types and nullify their velocity input weights: where 𝒮 n denotes a size- n random subset of units, and encodes velocity-to-recurrent layer weights. Pruning read-out connections : We prune output projections from n randomly selected units by zeroing their readout weights: with representing the recurrent-to-output weight matrix. Pruning cell types : For comprehensive cell inactivation, we simultaneously nullified all incoming and outgoing connections of selected units: where is the recurrent weight matrix. Pruning connections between band and grid cells : For the cell-type specific pruning analysis, we conducted bidirectional connection pruning between band (A) and grid (B) cell populations: – A → B Pruning : Nullified all forward connections from a random subset of n band cells to every grid cell: – B → A Pruning : Symmetrically ablated all feedback connections from a random subset of n grid cells to every band cell: Error bars represent standard deviation across n = 30 independent repetitions, reflecting the variability in individual measurements. C.2 RNN with predefined hierarchical structure We implement a hierarchical RNN architecture that takes the hierarchical pathway as a prior ( Fig. 4b ). The model consists of two reciprocally connected modules: First module (RNN1) : Processes velocity inputs ( v t ) combined with feedback from the second module, designed to emulate the properties of band cells: where represents the feedback from RNN2, J 1 and J 2 represent the recurrent weights of RNN1 and RNN2 respectively. Second module (RNN2) : Receives inputs from RNN1 and generates spatial representations, mimicking grid cell functionality: We train this hierarchical RNN model on the standard path integration task using the same hyperparameters specified in Table S1 . The training loss is presented in Fig. S4 a . Download figure Open in new tab Figure S4. (a) Training loss for the RNN with predefined hierarchical structure. (b) Training loss for RNN for location reconstruction. (c) Example grid cells found in the newly trained RNN for location reconstruction. (d) The number of band cells found in the Vanilla RNN (Baseline) and newly trained RNN (Reconstruction). View this table: View inline View popup Download powerpoint Table S1. Parameters used to train Vanilla RNNs C.3 RNN trained for location reconstruction We modify the task from path integration to pure location reconstruction by replacing velocity inputs of the vanilla RNN with place cell activations at each timestep, expressed as: where denotes the ground truth place cell activation pattern corresponding to the current position. All hyperparameters are the same as in Table S1 . The training loss is presented in Fig. S4 b . After training the RNN on this modified task, we observe the emergence of grid-like activity patterns while notably lacking band cell representations ( Fig. S4 c-d ). D Quantitative Performance Analysis D.1 Error Distribution Analysis We quantified path integration performance across 30 independent trials for each of 10 different RNN implementations (Seeds 0–9). The results demonstrate consistent performance, with errors (normalized by arena size) reported as mean ± standard deviation (units: %): D.2 Computational Complexity Scaling We analyzed the relationship between hidden layer size ( N R ) and path integration error, with errors (normalized by arena size) reported as mean ± standard deviation (units: %): This analysis demonstrates that our model achieves stable performance ( < 2.19% error) with N ≥ 4096 neurons, suggesting our approach provides computationally efficient spatial representation. D.3 Pruning Baseline For each pruning condition, we prune connections selected from random groups as baseline to assess the relative importance of our specific pruning choices. The key results are presented in Table S2 , which demonstrates that pruning specific functional connections (input-to-band or grid-read-out) produces significantly larger errors compared to random pruning, suggesting specialized functional roles for these specific cell groups. View this table: View inline View popup Download powerpoint Table S2. Path integration error increase (mean SD across 30 trials when 750 connections are pruned). Error is measured by the standard deviation of location prediction errors divided by the arena size (unit: %). E Reproducibility E.1 Experiments Across Different Seeds we repeat the experiments across 10 random seeds for Vanilla RNN. Our results robustly demonstrate that band cells consistently serve as the primary recipients of velocity inputs and grid cells reliably encode spatial location information. The additional results are: Neuron Counts and Pruned Connections: View this table: View inline View popup Download powerpoint Pruning Performance (mean ± SD): Velocity Input Pruning: View this table: View inline View popup Download powerpoint Read-out Connection Pruning: View this table: View inline View popup Download powerpoint E.2 Different Training Paragram To check the flexibility of our results, we trained three additional path-integration RNN variants: Vanilla RNN → LSTM transition (different in net structure). Xu et al. (2022) [ 19 ] training paradigm (different in net structure (RNN and LSTM), place field (Gaussian), and loss function (conformal isometry and path integration loss)). Petterson et al. (2024) [ 24 ] training paradigm (different in initial state (MLP), loss function (distance preservation and capacity loss), and decoder (none)). The quantitative analysis of path integration performance across the three RNN variants are presented below, which demonstrates that velocity inputs are preferentially processed by band cells across all three RNN variants, as evidenced by their greater sensitivity to velocity pruning. However, the absence of decoder modules in some variants prevented systematic pruning read-out experiments, limiting direct comparisons of read-out performance. E.2.1 Vanilla RNN→LSTM transition The pruning experiments show that models degrade severely when velocity inputs to band cells are pruned, but remain relatively stable when inputs to grid cells or undefined cells are pruned under the same conditions: Neuron Counts and Pruned Connections: View this table: View inline View popup Download powerpoint Velocity Input Pruning Performance (mean ± SD): View this table: View inline View popup Download powerpoint E.2.2 Xu et al. (2022) The pruning experiments reveal that band cells exhibit significantly greater sensitivity to input manipulation compared to grid or undefined cells, which is consistently observed across all experimental seeds except seed 1: Neuron Counts and Pruned Connections: View this table: View inline View popup Download powerpoint Velocity Input Pruning Performance (mean ± SD): View this table: View inline View popup Download powerpoint E.2.3 Petterson et al. (2024) Our 10-seed replication of Petterson et al. (2024) demonstrates robust preferential processing of velocity inputs by band cells. The additional results are: Neuron Counts and Pruned Connections: View this table: View inline View popup Download powerpoint Pruning Performance (mean ± SD): View this table: View inline View popup Download powerpoint F Neural circuit model details F.1 Overview of the model architecture We provide a mathematical overview of the neural circuit model for 2D path integration, consisting of band cell modules and a grid cell module. Each component performs specific computations described below. 1. Pure band cell dynamics (1D CANN) Each band cell module maintains a bump of activity along a 1D phase space ϕ ∈ (− π, π ], via recurrent dynamics: where u b and r b are synaptic input and firing rate of pure band cells. The recurrent connectivity is symmetric and translation-invariant: Their firing rates are normalized to stabilize the bump: 2. Direction-conjunctive band cells These cells receive excitatory input from pure band cells and encode the agent’s projected velocity along the module’s preferred orientation θ and its opposite direction θ + π . Their dynamics are defined as: where u ± ( ϕ, t ) and r ± ( ϕ, t ) are the synaptic input and firing rate of the conjunctive cells. The velocity projection vector is k = (sin θ/λ , cos θ/λ ), determining the speed component along the module’s axis. The firing rates reflect the movement direction and strength of the agent. Feedback to pure band cells Direction-conjunctive cells modulate the activity bump in pure band cells via asymmetric projections. The connection weights from conjunctive to pure band cells are: These connections are offset by ± δ along the phase axis and thus induce a translation of the activity bump, driving 1D path integration along the module orientation. Specifically, W + promotes bump motion in the forward direction ( θ ), and W − in the opposite direction ( θ + π ). 3. Grid cells Grid cells are organized on a 2D toroidal manifold and integrate inputs from two band cell modules with orientations θ 1 and θ 2 , which are 60 ° apart. They form a 2D continuous attractor neural network (CANN) with the following dynamic where u g ( ϕ, t ) and r g ( ϕ, t ) are the synaptic input and firing rate of a grid cell at phase ϕ = ( ϕ 1 , ϕ 2 ). The recurrent connectivity J g is translation-invariant and shaped to support hexagonal grid patterns: with firing rates given by a divisive normalization: The distance metric || · || g between grid cell phases is defined to produce a hexagonal pattern. Specifically, letting Δ ϕ = ϕ − ϕ ′ , we apply periodic wrapping and a linear transformation: where wrap(·) maps values to (− π, π ] to account for periodic boundary conditions. The linear transformation aligns the phase coordinates with the axes of a hexagonal lattice. This design ensures that the bump activity on the grid cell manifold has a hexagonal structure rather than a square one, consistent with biological grid cell tuning. 4. Reciprocal connections between grid and band modules Bidirectional connections allow information exchange between grid and band cells. From grid cells to band cells: From band cells to grid cells: The weights are symmetric and phase-aligned: F.2 Parameters The model is composed of multiple path integration modules , each responsible for encoding spatial location at a specific scale. Each module consists of two band cell modules and one grid cell module . The two band modules within a path integration module differ only in their preferred orientation (offset by 60 ° ), but share all other dynamic and connectivity parameters. The five modules operate at distinct spatial scales λ ( i ) , which influence their velocity projection vectors k ( i ) and resulting grid periodicity. Within each module, band cells perform velocity integration using directionally tuned input, coupled through asymmetric recurrent and cross-module connections. Their outputs drive the activity of grid cells, which integrate spatial phase across the two orientations to generate hexagonal grid patterns. The grid cell dynamics are shaped by their own recurrent connectivity and normalization mechanisms. All modules share a common set of parameters for band and grid dynamics, except for the spatial scale λ and the orientation θ , which define the velocity-to-phase projection. These design choices allow for a consistent multi-scale encoding of space, which is later used for spatial decoding via a grid-to-place projection. The table below summarizes all parameters used in the model and their hierarchical roles. F.3 Simulation details We performed two simulations to evaluate the functionality of the proposed neural circuit model for path integration. Simulation 1: Activity mapping in full environment We simulated a freely foraging rat in a square box environment, generating a trajectory of 100,000 time steps with a fixed time step size Δ t = 0.05. The simulated trajectory densely covers the entire spatial environment. At each time step, we recorded the activity of different neural populations in the model, including band cells (from each module) and grid cells. We then computed the average firing rate at each spatial location to obtain the spatial tuning maps (i.e., heatmaps) for different cells. Simulation 2: Decoding trajectory from neural activity In this simulation, we generated a continuous trajectory of 1,000 time steps, again with Δ t = 0.05. Using the spatial tuning maps (heatmaps) of grid cells obtained from Simulation 1, we decoded the animal’s position at each time step from the instantaneous population activity of grid cells. The decoding procedure was carried out in two stages: View this table: View inline View popup Download powerpoint Table S3. Parameters of the path integration model. Each path integration module consists of two band cell modules (offset by 60 ° in orientation) and one grid cell module, with shared dynamics and connectivity parameters. Grid-to-place cell transformation: The grid cell activity vector at each time step was linearly projected onto a population of place cells. Each place cell was assigned a spatial location ( x, y ) on a uniform 2D grid. To define the synaptic connection between a grid cell and a place cell, we first projected the place cell’s spatial location into the phase space ( ϕ 1 , ϕ 2 ) of the two band cell modules used to construct grid cells. This projection was done by computing the inner product of the place field center ( x, y ) with the two module wave vectors k 1 and k 2 , i.e., This yields the wrapped phases ( ϕ 1 , ϕ 2 ) corresponding to the grid cell’s toroidal phase space. The connection strength between each grid cell (with preferred phase ϕ g ) and a place cell (located at ( x, y ) with corresponding ϕ pc = ( ϕ 1 , ϕ 2 )) is then defined by a Gaussian kernel on the torus: where the toroidal phase distance ∥ · ∥ g is computed using the same hexagonal metric as in the grid cell CANN. Specifically, for d = ϕ pc − ϕ g (wrapped to [ −π, π ]), with δ x = d 1 and δ y = d 2 . This construction ensures that the grid-to-place connection matrix respects the periodic and hexagonal structure of the underlying grid cell code. Population vector decoding: After obtaining the activity of place cells from the grid cell input, we decoded the position by computing a population vector (center-of-mass) over place field centers, weighted by the activity of each place cell at each time step. We then evaluated the model’s path integration accuracy by comparing the decoded positions with the true trajectory. Results obtained under idealized conditions—where both the input signals and the model were free of random noise—are presented in Fig. 5 . In more realistic noisy scenarios, small errors accumulate over time, resulting in a gradual drift in the estimated position, as illustrated in Fig. S5 . Download figure Open in new tab Figure S5. Inferred trajectory of the noisy neural circuit model compared with the ground-truth trajectory. (b) Decoding error of the neural circuit under noisy conditions. NeurIPS Paper Checklist 1. Claims Question: Do the main claims made in the abstract and introduction accurately reflect the paper’s contributions and scope? Answer: [Yes] Justification: The main claims made in the abstract and introduction truthfully summarize the paper’s contributions and scope. Guidelines: The answer NA means that the abstract and introduction do not include the claims made in the paper. The abstract and/or introduction should clearly state the claims made, including the contributions made in the paper and important assumptions and limitations. A No or NA answer to this question will not be perceived well by the reviewers. The claims made should match theoretical and experimental results, and reflect how much the results can be expected to generalize to other settings. It is fine to include aspirational goals as motivation as long as it is clear that these goals are not attained by the paper. 2. Limitations Question: Does the paper discuss the limitations of the work performed by the authors? Answer: [Yes] Justification: The discussion section explicitly examines the study’s limitations, ensuring transparent acknowledgment of the work’s boundaries. Guidelines: The answer NA means that the paper has no limitation while the answer No means that the paper has limitations, but those are not discussed in the paper. The authors are encouraged to create a separate “Limitations” section in their paper. The paper should point out any strong assumptions and how robust the results are to violations of these assumptions (e.g., independence assumptions, noiseless settings, model well-specification, asymptotic approximations only holding locally). The authors should reflect on how these assumptions might be violated in practice and what the implications would be. The authors should reflect on the scope of the claims made, e.g., if the approach was only tested on a few datasets or with a few runs. In general, empirical results often depend on implicit assumptions, which should be articulated. The authors should reflect on the factors that influence the performance of the approach. For example, a facial recognition algorithm may perform poorly when image resolution is low or images are taken in low lighting. Or a speech-to-text system might not be used reliably to provide closed captions for online lectures because it fails to handle technical jargon. The authors should discuss the computational efficiency of the proposed algorithms and how they scale with dataset size. If applicable, the authors should discuss possible limitations of their approach to address problems of privacy and fairness. While the authors might fear that complete honesty about limitations might be used by reviewers as grounds for rejection, a worse outcome might be that reviewers discover limitations that aren’t acknowledged in the paper. The authors should use their best judgment and recognize that individual actions in favor of transparency play an important role in developing norms that preserve the integrity of the community. Reviewers will be specifically instructed to not penalize honesty concerning limitations. 3. Theory assumptions and proofs Question: For each theoretical result, does the paper provide the full set of assumptions and a complete (and correct) proof? Answer: [NA] Justification: The paper does not include theoretical results. Guidelines: The answer NA means that the paper does not include theoretical results. All the theorems, formulas, and proofs in the paper should be numbered and cross-referenced. All assumptions should be clearly stated or referenced in the statement of any theorems. The proofs can either appear in the main paper or the supplemental material, but if they appear in the supplemental material, the authors are encouraged to provide a short proof sketch to provide intuition. Inversely, any informal proof provided in the core of the paper should be complemented by formal proofs provided in appendix or supplemental material. Theorems and Lemmas that the proof relies upon should be properly referenced. 4. Experimental result reproducibility Question: Does the paper fully disclose all the information needed to reproduce the main experimental results of the paper to the extent that it affects the main claims and/or conclusions of the paper (regardless of whether the code and data are provided or not)? Answer: [Yes] Justification: The paper provides sufficient methodological details, hyperparameters, and experimental setups to allow reproduction of the key results supporting its claims. Details are presented in Sec. 2, 3 and SI. Guidelines: The answer NA means that the paper does not include experiments. If the paper includes experiments, a No answer to this question will not be perceived well by the reviewers: Making the paper reproducible is important, regardless of whether the code and data are provided or not. If the contribution is a dataset and/or model, the authors should describe the steps taken to make their results reproducible or verifiable. Depending on the contribution, reproducibility can be accomplished in various ways. For example, if the contribution is a novel architecture, describing the architecture fully might suffice, or if the contribution is a specific model and empirical evaluation, it may be necessary to either make it possible for others to replicate the model with the same dataset, or provide access to the model. In general. releasing code and data is often one good way to accomplish this, but reproducibility can also be provided via detailed instructions for how to replicate the results, access to a hosted model (e.g., in the case of a large language model), releasing of a model checkpoint, or other means that are appropriate to the research performed. While NeurIPS does not require releasing code, the conference does require all submissions to provide some reasonable avenue for reproducibility, which may depend on the nature of the contribution. For example If the contribution is primarily a new algorithm, the paper should make it clear how to reproduce that algorithm. If the contribution is primarily a new model architecture, the paper should describe the architecture clearly and fully. If the contribution is a new model (e.g., a large language model), then there should either be a way to access this model for reproducing the results or a way to reproduce the model (e.g., with an open-source dataset or instructions for how to construct the dataset). We recognize that reproducibility may be tricky in some cases, in which case authors are welcome to describe the particular way they provide for reproducibility. In the case of closed-source models, it may be that access to the model is limited in some way (e.g., to registered users), but it should be possible for other researchers to have some path to reproducing or verifying the results. 5. Open access to data and code Question: Does the paper provide open access to the data and code, with sufficient instructions to faithfully reproduce the main experimental results, as described in supplemental material? Answer: [Yes] Justification: We provide the link to our publicly available Github repository in the SI. Guidelines: The answer NA means that paper does not include experiments requiring code. Please see the NeurIPS code and data submission guidelines ( https://nips.cc/public/guides/CodeSubmissionPolicy ) for more details. While we encourage the release of code and data, we understand that this might not be possible, so “No” is an acceptable answer. Papers cannot be rejected simply for not including code, unless this is central to the contribution (e.g., for a new open-source benchmark). The instructions should contain the exact command and environment needed to run to reproduce the results. See the NeurIPS code and data submission guidelines ( https://nips.cc/public/guides/CodeSubmissionPolicy ) for more details. The authors should provide instructions on data access and preparation, including how to access the raw data, preprocessed data, intermediate data, and generated data, etc. The authors should provide scripts to reproduce all experimental results for the new proposed method and baselines. If only a subset of experiments are reproducible, they should state which ones are omitted from the script and why. At submission time, to preserve anonymity, the authors should release anonymized versions (if applicable). Providing as much information as possible in supplemental material (appended to the paper) is recommended, but including URLs to data and code is permitted. 6. Experimental setting/details Question: Does the paper specify all the training and test details (e.g., data splits, hyper-parameters, how they were chosen, type of optimizer, etc.) necessary to understand the results? Answer: [Yes] Justification: The paper thoroughly documents all the training and test details required to comprehend and replicate the reported findings in SI. Guidelines: The answer NA means that the paper does not include experiments. The experimental setting should be presented in the core of the paper to a level of detail that is necessary to appreciate the results and make sense of them. The full details can be provided either with the code, in appendix, or as supplemental material. 7. Experiment statistical significance Question: Does the paper report error bars suitably and correctly defined or other appropriate information about the statistical significance of the experiments? Answer: [Yes] Justification: The paper reports error bars and provides appropriate information about the statistical significance of the experiments, as evidenced in the presented figures and SI. Guidelines: The answer NA means that the paper does not include experiments. The authors should answer “Yes” if the results are accompanied by error bars, confidence intervals, or statistical significance tests, at least for the experiments that support the main claims of the paper. The factors of variability that the error bars are capturing should be clearly stated (for example, train/test split, initialization, random drawing of some parameter, or overall run with given experimental conditions). The method for calculating the error bars should be explained (closed form formula, call to a library function, bootstrap, etc.) The assumptions made should be given (e.g., Normally distributed errors). It should be clear whether the error bar is the standard deviation or the standard error of the mean. It is OK to report 1-sigma error bars, but one should state it. The authors should preferably report a 2-sigma error bar than state that they have a 96% CI, if the hypothesis of Normality of errors is not verified. For asymmetric distributions, the authors should be careful not to show in tables or figures symmetric error bars that would yield results that are out of range (e.g. negative error rates). If error bars are reported in tables or plots, The authors should explain in the text how they were calculated and reference the corresponding figures or tables in the text. 8. Experiments compute resources Question: For each experiment, does the paper provide sufficient information on the computer resources (type of compute workers, memory, time of execution) needed to reproduce the experiments? Answer: [No] Justification: The manuscript does not explicitly report computational resource requirements, as the lightweight architecture of the proposed model renders such specifications non-essential for reproducibility. Guidelines: The answer NA means that the paper does not include experiments. The paper should indicate the type of compute workers CPU or GPU, internal cluster, or cloud provider, including relevant memory and storage. The paper should provide the amount of compute required for each of the individual experimental runs as well as estimate the total compute. The paper should disclose whether the full research project required more compute than the experiments reported in the paper (e.g., preliminary or failed experiments that didn’t make it into the paper). 9. Code of ethics Question: Does the research conducted in the paper conform, in every respect, with the NeurIPS Code of Ethics https://neurips.cc/public/EthicsGuidelines? Answer: [Yes] Justification: The research fully complies with the NeurIPS Code of Ethics in all aspects by ensuring transparency, reproducibility, and fairness in reporting experimental results. Guidelines: The answer NA means that the authors have not reviewed the NeurIPS Code of Ethics. If the authors answer No, they should explain the special circumstances that require a deviation from the Code of Ethics. The authors should make sure to preserve anonymity (e.g., if there is a special consideration due to laws or regulations in their jurisdiction). 10. Broader impacts Question: Does the paper discuss both potential positive societal impacts and negative societal impacts of the work performed? Answer: [NA] Justification: There is no societal impact of the work performed. Guidelines: The answer NA means that there is no societal impact of the work performed. If the authors answer NA or No, they should explain why their work has no societal impact or why the paper does not address societal impact. Examples of negative societal impacts include potential malicious or unintended uses (e.g., disinformation, generating fake profiles, surveillance), fairness considerations (e.g., deployment of technologies that could make decisions that unfairly impact specific groups), privacy considerations, and security considerations. The conference expects that many papers will be foundational research and not tied to particular applications, let alone deployments. However, if there is a direct path to any negative applications, the authors should point it out. For example, it is legitimate to point out that an improvement in the quality of generative models could be used to generate deepfakes for disinformation. On the other hand, it is not needed to point out that a generic algorithm for optimizing neural networks could enable people to train models that generate Deepfakes faster. The authors should consider possible harms that could arise when the technology is being used as intended and functioning correctly, harms that could arise when the technology is being used as intended but gives incorrect results, and harms following from (intentional or unintentional) misuse of the technology. If there are negative societal impacts, the authors could also discuss possible mitigation strategies (e.g., gated release of models, providing defenses in addition to attacks, mechanisms for monitoring misuse, mechanisms to monitor how a system learns from feedback over time, improving the efficiency and accessibility of ML). 11. Safeguards Question: Does the paper describe safeguards that have been put in place for responsible release of data or models that have a high risk for misuse (e.g., pretrained language models, image generators, or scraped datasets)? Answer: [NA] Justification: The paper poses no such risks. Guidelines: The answer NA means that the paper poses no such risks. Released models that have a high risk for misuse or dual-use should be released with necessary safeguards to allow for controlled use of the model, for example by requiring that users adhere to usage guidelines or restrictions to access the model or implementing safety filters. Datasets that have been scraped from the Internet could pose safety risks. The authors should describe how they avoided releasing unsafe images. We recognize that providing effective safeguards is challenging, and many papers do not require this, but we encourage authors to take this into account and make a best faith effort. 12. Licenses for existing assets Question: Are the creators or original owners of assets (e.g., code, data, models), used in the paper, properly credited and are the license and terms of use explicitly mentioned and properly respected? Answer: [Yes] Justification: We appropriately acknowledge all third-party code and data sources through proper citations of original works and the code base is also linked in SI. Guidelines: The answer NA means that the paper does not use existing assets. The authors should cite the original paper that produced the code package or dataset. The authors should state which version of the asset is used and, if possible, include a URL. The name of the license (e.g., CC-BY 4.0) should be included for each asset. For scraped data from a particular source (e.g., website), the copyright and terms of service of that source should be provided. If assets are released, the license, copyright information, and terms of use in the package should be provided. For popular datasets, paperswithcode.com/datasets has curated licenses for some datasets. Their licensing guide can help determine the license of a dataset. For existing datasets that are re-packaged, both the original license and the license of the derived asset (if it has changed) should be provided. If this information is not available online, the authors are encouraged to reach out to the asset’s creators. 13. New assets Question: Are new assets introduced in the paper well documented and is the documentation provided alongside the assets? Answer: [Yes] Justification: The completeness of documentation for newly introduced assets will be verified upon release of the data and code on GitHub, ensuring all reproducibility requirements are met. Guidelines: The answer NA means that the paper does not release new assets. Researchers should communicate the details of the dataset/code/model as part of their submissions via structured templates. This includes details about training, license, limitations, etc. The paper should discuss whether and how consent was obtained from people whose asset is used. At submission time, remember to anonymize your assets (if applicable). You can either create an anonymized URL or include an anonymized zip file. 14. Crowdsourcing and research with human subjects Question: For crowdsourcing experiments and research with human subjects, does the paper include the full text of instructions given to participants and screenshots, if applicable, as well as details about compensation (if any)? Answer: [NA] Justification: The paper does not involve crowdsourcing nor research with human subjects. Guidelines: The answer NA means that the paper does not involve crowdsourcing nor research with human subjects. Including this information in the supplemental material is fine, but if the main contribution of the paper involves human subjects, then as much detail as possible should be included in the main paper. According to the NeurIPS Code of Ethics, workers involved in data collection, curation, or other labor should be paid at least the minimum wage in the country of the data collector. 15. Institutional review board (IRB) approvals or equivalent for research with human subjects Question: Does the paper describe potential risks incurred by study participants, whether such risks were disclosed to the subjects, and whether Institutional Review Board (IRB) approvals (or an equivalent approval/review based on the requirements of your country or institution) were obtained? Answer: [NA] Justification: The paper does not involve crowdsourcing nor research with human subjects. Guidelines: The answer NA means that the paper does not involve crowdsourcing nor research with human subjects. Depending on the country in which research is conducted, IRB approval (or equivalent) may be required for any human subjects research. If you obtained IRB approval, you should clearly state this in the paper. We recognize that the procedures for this may vary significantly between institutions and locations, and we expect authors to adhere to the NeurIPS Code of Ethics and the guidelines for their institution. For initial submissions, do not include any information that would break anonymity (if applicable), such as the institution conducting the review. 16. Declaration of LLM usage Question: Does the paper describe the usage of LLMs if it is an important, original, or non-standard component of the core methods in this research? Note that if the LLM is used only for writing, editing, or formatting purposes and does not impact the core methodology, scientific rigorousness, or originality of the research, declaration is not required. Answer: [NA] Justification: The core method development in this research does not involve LLMs as any important, original, or non-standard components. Guidelines: The answer NA means that the core method development in this research does not involve LLMs as any important, original, or non-standard components. Please refer to our LLM policy ( https://neurips.cc/Conferences/2025/LLM ) for what should or should not be described. Acknowledgments and Disclosure of Funding This work was supported by the National Natural Science Foundation of China (no. T2421004 to S.W.), the National Key Research and Development Program of China (2024YFF1206500), the Science and Technology Innovation 2030-Brain Science and Brain-inspired Intelligence Project (no. 2021ZD0200204, S.W.), and the Wellcome Principal Research Fellowship (222457/Z/21/Z, N.B.). Funder Information Declared the National Natural Science Foundation of China , T2421004 the National Key Research and Development Program of China , 2024YFF1206500 the Science and Technology Innovation 2030-Brain Science and Brain-inspired Intelligence Project , 2021ZD0200204 the Wellcome Principal Research Fellowship , 222457/Z/21/Z Footnotes Figure 4g revised: phase updated; References updated. https://github.com/yuling-wu/hierarchy_band_grid References [1]. ↵ Bruce L McNaughton , Francesco P Battaglia , Ole Jensen , Edvard I Moser , and May-Britt Moser . Path integration and the neural basis of the’cognitive map’ . Nature Reviews Neuroscience , 7 ( 8 ): 663 – 678 , 2006 . OpenUrl CrossRef PubMed Web of Science [2]. ↵ Hugh Durrant-Whyte and Tim Bailey . Simultaneous localization and mapping: part i . IEEE robotics & automation magazine , 13 ( 2 ): 99 – 110 , 2006 . OpenUrl Web of Science [3]. ↵ Mariana Gil , Mihai Ancau , Magdalene I Schlesiger , Angela Neitz , Kevin Allen , Rodrigo J De Marco , and Hannah Monyer . Impaired path integration in mice with disrupted grid cell firing . Nature neuroscience , 21 ( 1 ): 81 – 91 , 2018 . OpenUrl CrossRef PubMed [4]. ↵ Torkel Hafting , Marianne Fyhn , Sturla Molden , May-Britt Moser , and Edvard I Moser . Mi-crostructure of a spatial map in the entorhinal cortex . Nature , 436 ( 7052 ): 801 – 806 , 2005 . OpenUrl CrossRef PubMed Web of Science [5]. ↵ Johnson Ying , Alexandra T Keinath , Raphael Lavoie , Erika Vigneault , Salah El Mestikawy , and Mark P Brandon . Disruption of the grid cell network in a mouse model of early alzheimer’s disease . Nature Communications , 13 ( 1 ): 886 , 2022 . OpenUrl PubMed [6]. ↵ Emilio Kropff , James E Carmichael , May-Britt Moser , and Edvard I Moser . Speed cells in the medial entorhinal cortex . Nature , 523 ( 7561 ): 419 – 424 , 2015 . OpenUrl CrossRef PubMed [7]. ↵ Francesca Sargolini , Marianne Fyhn , Torkel Hafting , Bruce L McNaughton , Menno P Witter , May-Britt Moser , and Edvard I Moser . Conjunctive representation of position, direction, and velocity in entorhinal cortex . Science , 312 ( 5774 ): 758 – 762 , 2006 . OpenUrl Abstract / FREE Full Text [8]. ↵ øyvind Arne Høydal , Emilie Ranheim Skytøen , Sebastian Ola Andersson , May-Britt Moser , and Edvard I Moser . Object-vector coding in the medial entorhinal cortex . Nature , 568 ( 7752 ): 400 – 404 , 2019 . OpenUrl CrossRef PubMed [9]. ↵ Julija Krupic , Neil Burgess , and John O’Keefe. Neural representations of location composed of spatially periodic bands . Science , 337 ( 6096 ): 853 – 857 , 2012 . OpenUrl Abstract / FREE Full Text [10]. ↵ Neil Burgess , Caswell Barry , and John O’keefe . An oscillatory interference model of grid cell firing . Hippocampus , 17 ( 9 ): 801 – 812 , 2007 . OpenUrl CrossRef PubMed Web of Science [11]. ↵ Yoram Burak and Ila R Fiete . Accurate path integration in continuous attractor network models of grid cells . PLoS computational biology , 5 ( 2 ): e1000291 , 2009 . OpenUrl [12]. ↵ Mark C Fuhs and David S Touretzky . A spin glass model of path integration in rat medial entorhinal cortex . Journal of Neuroscience , 26 ( 16 ): 4266 – 4276 , 2006 . OpenUrl Abstract / FREE Full Text [13]. ↵ Alexis Guanella , Daniel Kiper , and Paul Verschure . A model of grid cells based on a twisted torus topology . International journal of neural systems , 17 ( 04 ): 231 – 240 , 2007 . OpenUrl CrossRef PubMed Web of Science [14]. ↵ Rylan Schaeffer , Mikail Khona , Tzuhsuan Ma , Cristobal Eyzaguirre , Sanmi Koyejo , and Ila Fiete . Self-supervised learning of representations for space generates multi-modular grid cells . Advances in Neural Information Processing Systems , 36 : 23140 – 23157 , 2023 . OpenUrl [15]. ↵ Christopher P Burgess and Neil Burgess . Controlling phase noise in oscillatory interference models of grid cell firing . Journal of Neuroscience , 34 ( 18 ): 6224 – 6232 , 2014 . OpenUrl Abstract / FREE Full Text [16]. ↵ Daniel Bush and Neil Burgess . A hybrid oscillatory interference/continuous attractor network model of grid cell firing . Journal of Neuroscience , 34 ( 14 ): 5065 – 5079 , 2014 . OpenUrl Abstract / FREE Full Text [17]. ↵ Andrea Banino , Caswell Barry , Benigno Uria , Charles Blundell , Timothy Lillicrap , Piotr Mirowski , Alexander Pritzel , Martin J Chadwick , Thomas Degris , Joseph Modayil , et al. Vector-based navigation using grid-like representations in artificial agents . Nature , 557 ( 7705 ): 429 – 433 , 2018 . OpenUrl CrossRef PubMed [18]. ↵ Christopher J Cueva and Xue-Xin Wei . Emergence of grid-like representations by training recurrent neural networks to perform spatial localization . arXiv preprint arxiv: 1803.07770 , 2018 . [19]. ↵ Dehong Xu , Ruiqi Gao , Wen-Hao Zhang , Xue-Xin Wei , and Ying Nian Wu . Conformal isometry of lie group representation in recurrent network of grid cells . arXiv preprint arxiv: 2210.02684 , 2022 . [20]. ↵ William Dorrell , Peter E Latham , Timothy EJ Behrens , and James CR Whittington . Actionable neural representations: Grid cells from minimal constraints . arXiv preprint arxiv: 2209.15563 , 2022 . [21]. ↵ Yedidyah Dordek , Daniel Soudry , Ron Meir , and Dori Derdikman . Extracting grid cell characteristics from place cell inputs using non-negative principal component analysis . Elife , 5 : e10094 , 2016 . OpenUrl CrossRef PubMed [22]. ↵ Ben Sorscher , Gabriel C Mel , Samuel A Ocko , Lisa M Giocomo , and Surya Ganguli . A unified theory for the computational and mechanistic origins of grid cells . Neuron , 111 ( 1 ): 121 – 137 , 2023 . OpenUrl CrossRef PubMed [23]. ↵ Vemund Schøyen , Markus Borud Pettersen , Konstantin Holzhausen , Marianne Fyhn , Anders Malthe-Sørenssen , and Mikkel Elle Lepperød . Coherently remapping toroidal cells but not grid cells are responsible for path integration in virtual agents . Iscience , 26 ( 11 ), 2023 . [24]. ↵ Markus Pettersen , Vemund Sigmundson Schøyen , Mattis Dalsætra østby , Anders Malthe-Sørenssen , and Mikkel Elle Lepperød . Self-supervised grid cells without path integration . bioRxiv , pages 2024 – 05 , 2024 . [25]. ↵ William Redman , Francisco Acosta , Santiago Acosta-Mendoza , and Nina Miolane . Not so griddy: Internal representations of rnns path integrating more than one agent . Advances in Neural Information Processing Systems , 37 : 22657 – 22689 , 2024 . OpenUrl [26]. ↵ Changmin Yu , Timothy EJ Behrens , and Neil Burgess . Prediction and generalisation over directed actions by grid cells . arXiv preprint arxiv: 2006.03355 , 2020 . [27]. ↵ Tianhao Chu , Zilong Ji , Junfeng Zuo , Yuanyuan Mi , Wen-hao Zhang , Tiejun Huang , Daniel Bush , Neil Burgess , and Si Wu . Firing rate adaptation affords place cell theta sweeps, phase precession, and procession . Elife , 12 : RP87055 , 2024 . OpenUrl CrossRef PubMed [28]. ↵ Zilong Ji , Tianhao Chu , Si Wu , and Neil Burgess . A systems model of alternating theta sweeps via firing rate adaptation . Current Biology , 35 ( 4 ): 709 – 722 , 2025 . OpenUrl CrossRef PubMed [29]. ↵ Zilong Ji , Tianhao Chu , Xingsi Dong , Changmin Yu , Daniel Bush , Neil Burgess , and Si Wu . Dynamical modulation of hippocampal replay sequences through firing rate adaptation . BioRxiv , pages 2024 – 09 , 2024 . [30]. ↵ Si Wu , Kosuke Hamaguchi , and Shun-ichi Amari . Dynamics and computation of continuous attractors . Neural computation , 20 ( 4 ): 994 – 1025 , 2008 . OpenUrl CrossRef PubMed Web of Science [31]. ↵ Wenhao Zhang , Ying Nian Wu , and Si Wu . Translation-equivariant representation in recurrent networks with a continuous manifold of attractors . Advances in Neural Information Processing Systems , 35 : 15770 – 15783 , 2022 . OpenUrl [32]. ↵ Junfeng Zuo , Ying N Wu , Si Wu , and Wen-Hao Zhang . The motion planning neural circuit in goal-directed navigation as lie group operator search . Advances in Neural Information Processing Systems , 37 : 110369 – 110387 , 2024 . OpenUrl [33]. ↵ Hanne Stensola , Tor Stensola , Trygve Solstad , Kristian Frøland , May-Britt Moser , and Edvard I Moser . The entorhinal grid map is discretized . Nature , 492 ( 7427 ): 72 – 78 , 2012 . OpenUrl CrossRef PubMed Web of Science [34]. ↵ Jeffrey S Taube . The head direction signal: origins and sensory-motor integration . Annu. Rev. Neurosci ., 30 ( 1 ): 181 – 207 , 2007 . OpenUrl CrossRef PubMed Web of Science [35]. ↵ Coco Newton , Marianna Pope , Catarina Rua , Richard Henson , Zilong Ji , Neil Burgess , Christopher T Rodgers , Matthias Stangl , Maria-Eleni Dounavi , Andrea Castegnaro , et al. Entorhinal-based path integration selectively predicts midlife risk of alzheimer’s disease . Alzheimer’s & Dementia , 20 ( 4 ): 2779 – 2793 , 2024 . OpenUrl [36]. ↵ Jeffrey S Taube , Robert U Muller , and James B Ranck . Head-direction cells recorded from the postsubiculum in freely moving rats. i. description and quantitative analysis . Journal of Neuroscience , 10 ( 2 ): 420 – 435 , 1990 . OpenUrl Abstract / FREE Full Text [37]. ↵ Colin Lever , Stephen Burton , Ali Jeewajee , John O’Keefe , and Neil Burgess . Boundary vector cells in the subiculum of the hippocampal formation . Journal of Neuroscience , 29 ( 31 ): 9771 – 9777 , 2009 . OpenUrl Abstract / FREE Full Text [38]. ↵ James CR Whittington , Timothy H Muller , Shirley Mark , Guifen Chen , Caswell Barry , Neil Burgess , and Timothy EJ Behrens . The tolman-eichenbaum machine: unifying space and relational memory through generalization in the hippocampal formation . Cell , 183 ( 5 ): 1249 – 1263 , 2020 . OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted November 29, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Unfolding the Black Box of Recurrent Neural Networks for Path Integration Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Unfolding the Black Box of Recurrent Neural Networks for Path Integration Tianhao Chu , Yuling Wu , Neil Burgess , Zilong Ji , Si Wu bioRxiv 2025.10.25.684492; doi: https://doi.org/10.1101/2025.10.25.684492 Share This Article: Copy Citation Tools Unfolding the Black Box of Recurrent Neural Networks for Path Integration Tianhao Chu , Yuling Wu , Neil Burgess , Zilong Ji , Si Wu bioRxiv 2025.10.25.684492; doi: https://doi.org/10.1101/2025.10.25.684492 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Neuroscience Subject Areas All Articles Animal Behavior and Cognition (7621) Biochemistry (17645) Bioengineering (13867) Bioinformatics (41873) Biophysics (21420) Cancer Biology (18550) Cell Biology (25443) Clinical Trials (138) Developmental Biology (13360) Ecology (19866) Epidemiology (2067) Evolutionary Biology (24289) Genetics (15587) Genomics (22472) Immunology (17707) Microbiology (40318) Molecular Biology (17142) Neuroscience (88457) Paleontology (666) Pathology (2826) Pharmacology and Toxicology (4815) Physiology (7634) Plant Biology (15111) Scientific Communication and Education (2042) Synthetic Biology (4285) Systems Biology (9813) Zoology (2268)
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.