Brain Network Differences in Second Language Learning Depend on Individual Competencies

doi:10.1101/2025.09.28.679014

Brain Network Differences in Second Language Learning Depend on Individual Competencies

2025 · doi:10.1101/2025.09.28.679014

preprint OA: closed

📄 Open PDF Full text JSON View at publisher

Full text 91,894 characters · extracted from preprint-html · click to expand

Brain Network Differences in Second Language Learning Depend on Individual Competencies | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var 
i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Brain Network Differences in Second Language Learning Depend on Individual Competencies View ORCID Profile Nicole H. Skieresz , View ORCID Profile Sandy C. Marca , View ORCID Profile Micah M. Murray , View ORCID Profile Thomas P. Reber , View ORCID Profile Nicolas Rothen doi: https://doi.org/10.1101/2025.09.28.679014 Nicole H. 
Skieresz 1 Faculty of Psychology, UniDistance Suisse , Brigue, Switzerland 2 The LINE (Laboratory for Integrative Neurosciences), Radiology Department, Lausanne University Hospital and University of Lausanne , Lausanne, Switzerland 3 The Sense Innovation and Research Center, Lausanne and Sion , Switzerland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Nicole H. Skieresz For correspondence: skieresznicole{at}gmail.com Sandy C. Marca 1 Faculty of Psychology, UniDistance Suisse , Brigue, Switzerland 4 Faculty of Psychology, University of Geneva , Geneva, Switzerland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Sandy C. Marca Micah M. Murray 2 The LINE (Laboratory for Integrative Neurosciences), Radiology Department, Lausanne University Hospital and University of Lausanne , Lausanne, Switzerland 3 The Sense Innovation and Research Center, Lausanne and Sion , Switzerland 5 Department of Hearing and Speech Sciences, Vanderbilt University , Nashville, TN, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Micah M. Murray Thomas P. Reber 1 Faculty of Psychology, UniDistance Suisse , Brigue, Switzerland 6 Department of Epileptology, University of Bonn Medical Center , Bonn 53127, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Thomas P. Reber Nicolas Rothen 1 Faculty of Psychology, UniDistance Suisse , Brigue, Switzerland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Nicolas Rothen Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract Integrating new words into an existing semantic network is a core challenge of second language (L2) acquisition. 
We investigated how evidence-based learning strategies and individual performance shape the neurocognitive dynamics of vocabulary learning. Eighty-three adults with German or French as their native language (L1) learned 48 Finnish (L2) nouns over 14 days using a mobile app that systematically varied retrieval practice, corrective feedback, multisensory learning, and distributed learning. Before and after training, EEG was recorded during a translation recognition task designed to elicit the N400, an index of semantic integration. Vocabulary accuracy increased from 0.41% pre-learning to 75.5% post-learning (d_z = 3.96), and the N400 incongruity effect increased significantly, F (1, 75) = 99.52, p < .001, η²_g = .32, reflecting successful integration of new L2 words into the mental lexicon. High performers showed larger N400 responses and distinct ERP template-map preponderance (i.e., the proportion of epoch time points assigned to a given template map), indicating more efficient and specialized neural processing. Despite systematic manipulation of learning strategies, no single approach yielded consistent behavioral or neural advantages, suggesting that overall exposure and cumulative practice—rather than any specific strategy—were the key drivers of robust learning. ERP template-map analyses further revealed that learning not only amplified neural responses but also shifted the preponderance of maps in the N400 window, signaling a qualitative reorganization of semantic processing. These findings bridge cognitive neuroscience and language education, suggesting that the depth and success of vocabulary learning may depend more on the degree of integration achieved than on the specific instructional strategy employed. 1 Introduction Language comprehension depends on the rapid integration of novel lexical items into an existing semantic network. 
The N400 component—an event-related potential (ERP) that typically peaks around 400 ms post-stimulus—is widely recognized for its sensitivity to semantic congruency. Words incongruent with the preceding context elicit larger (more negative) N400 amplitudes. This phenomenon, known as the N400 incongruity effect, is interpreted as reflecting increased semantic processing demands ( Kutas & Hillyard, 1980 ). The scalp distribution of the N400 is dynamic, varying with stimulus type and learning stage. In standard visual-word paradigms, the N400 emerges as a monophasic negativity between 200 and 600 ms, with maximal amplitude over centro-parietal electrodes and a slight right-hemisphere bias ( Kutas & Federmeier, 2011 ). For isolated written words, the N400 typically peaks at centro-parietal sites, while more frontal distributions are observed during early learning or in highly contextual scenarios ( Van Petten & Luka, 2012 ). In a recent ERP study of novel-word learning, Armstrong et al. (2024) traced picture-word associative learning from initial encoding to multi-day retention and observed this topographic shift: early learning elicited a predominantly fronto-central N400, which later shifted toward the canonical centro-parietal maximum as representations consolidated. Crucially, the N400 effect also emerges in translation paradigms, where participants view word pairs in two languages: correctly matched (“congruent”) translation pairs elicit smaller N400 amplitudes than mismatched (“incongruent”) pairs ( Midgley et al., 2009 ; Pu et al., 2016 ; Yum et al., 2014 ), reflecting sensitivity to semantic mismatch. This property has established the N400 as a key neural marker in second language (L2) vocabulary acquisition research. Pu et al. 
(2016) demonstrated that learners initially display no reliable N400 incongruity effect between congruent and incongruent L2–L1 translation pairs, but following vocabulary training, a robust N400 incongruity effect emerges, indicating successful integration of new L2 words into semantic memory. Similarly, Yum et al. (2014) found that rapid learners exhibited increased N400 amplitudes to incorrect translations early in training. Recent studies in adult learners further underscore the N400’s sensitivity to lexical-semantic learning. McLaughlin et al. (2004) demonstrated that an N400 incongruity effect can emerge after only minimal L2 exposure, indicating rapid semantic integration. Elgort et al. (2014) further showed that L2 proficiency influences both behavioral performance and N400 topography: high-proficiency learners exhibited stronger semantic-relatedness effects with a canonical centro-parietal distribution, whereas low-proficiency learners displayed attenuated amplitudes and delayed peaks. Qi et al. (2017) reported that pre-training N400 amplitudes to native language stimuli predicted subsequent vocabulary and grammar learning in an artificial language. García-Gámez and Macizo (2022) demonstrated that semantic training involving word-picture pairs and categorization tasks elicited stronger N400 incongruity effects than lexical training with L1–L2 word associations, suggesting deeper semantic encoding. Together, these findings support the N400 as a neural marker of individual learning potential, highlighting that proficiency not only predicts learning outcomes but also modulates the component’s amplitude, timing, and scalp distribution. Beyond semantic congruency, N400 amplitude also reflects lexical-access fluency ( Van Petten & Luka, 2012 ) and, within predictive-coding frameworks, indexes prediction error ( Lau et al., 2008 ; Kuperberg & Jaeger, 2016 ). 
Reduced N400 amplitudes for contextually expected stimuli are thought to reflect minimized discrepancies between predicted and encountered semantic information. Importantly, N400 modulations extend to multisensory stimuli ( Kutas & Federmeier, 2011 ) and have even been observed in non-human species such as dogs ( Boros et al., 2024 ; Murray et al., 2024 ), highlighting its evolutionary robustness as a marker of semantic processing. Despite a growing body of ERP research in L2 acquisition, few studies have directly examined how specific learning strategies affect neural indices of vocabulary acquisition (e.g., García-Gámez & Macizo, 2022 ; Li et al., 2023 ; Soskey et al., 2016 ). The present study addresses this gap by combining the ERP translation recognition paradigm from Pu et al. (2016) with a learning intervention incorporating four evidence-based strategies. These strategies were selected based on empirically supported principles outlined by Reber and Rothen (2018), which have been identified as particularly effective for promoting retention in digital vocabulary learning: retrieval practice, corrective feedback, multisensory encoding, and distributed learning. Retrieval practice involves actively recalling learned items rather than passively re-exposing learners to them. This strategy has been shown to enhance long-term retention by reinforcing memory traces through active recall ( Roediger & Karpicke, 2006 ). In the context of vocabulary learning, retrieval is associated with more stable lexical associations and improved recall accuracy ( Barcroft, 2007 ; Kang et al., 2013 ). It is hypothesized that retrieval practice sharpens lexical access and supports more robust semantic integration, which may be reflected in larger N400 incongruity effects after learning—that is, a greater neural differentiation between congruent and incongruent word pairs. 
However, some studies report reduced N400 amplitudes following successful retrieval, potentially reflecting more automatic or efficient semantic access ( Li et al., 2023 ). These findings suggest that N400 modulation may vary with learning stage, task demands, or the strength of lexical-semantic associations. While behavioral benefits of retrieval practice are well established, neurophysiological evidence remains limited, and further research is needed to clarify how such strategies modulate ERP components during vocabulary acquisition. Corrective feedback during learning is provided by immediately presenting the correct information after a failed or erroneous retrieval attempt. This approach supports the formation of accurate internal representations of word meanings by directly addressing incorrect associations ( Nicol & Macfarlane-Dick, 2006 ; Pashler et al., 2005 ). It is hypothesized that this process supports the development of more distinct lexical-semantic mappings, which may lead to greater neural differentiation between congruent and incongruent word pairs. However, while its pedagogical benefits are well established, ERP-based research specifically investigating the neural correlates of feedback in vocabulary learning remains sparse. Multisensory learning refers to instructional conditions in which information is presented through more than one sensory modality, such as visual, auditory, or kinesthetic channels. Multisensory inputs have been shown to improve recall and support deeper semantic encoding ( Shams & Seitz, 2008 ; Thelen & Murray, 2013 ). Empirical studies demonstrate that multisensory, compared to unisensory, inputs lead to more robust and differentiated neural representations, including stronger and earlier ERP components ( Murray et al., 2004 ) as well as enhanced free recall performance following audiovisual compared to auditory-only encoding ( Atkin et al., 2023 ; Soto-Faraco & Spence, 2025 ). 
Distributed learning refers to study conditions in which study sessions are spaced over time rather than amassed within a single block. This spacing enables memory traces to consolidate between sessions and has been shown to enhance long-term retention and semantic stability ( Cepeda et al., 2006 ; Edmonds et al., 2021 ). Neuroimaging research indicates that spaced learning strengthens lexical-semantic representations by increasing neural pattern similarity across repetitions, suggesting more consistent and consolidated memory traces ( Feng et al., 2019 ). It is hypothesized that this consolidation-driven strengthening supports the formation of more stable semantic expectations, potentially resulting in more robust N400 incongruity effects, although this link remains to be clarified. To test the impact of these four evidence-based learning strategies—retrieval practice, corrective feedback, multisensory encoding, and distributed learning—on neural markers of vocabulary learning, we employed a translation recognition ERP paradigm and analyzed the data using both canonical ERP methods and an electrical neuroimaging framework based on global measures of the electric field at the scalp ( Murray et al., 2008 ) to characterize the spatiotemporal dynamics of the N400. We further explored how individual learning success (high vs. low performers) modulates these strategy effects. Guided by prior ERP research on L2 vocabulary acquisition (e.g., Pu et al., 2016 ; García-Gámez & Macizo, 2022 ) and learning theory from cognitive psychology (e.g., Roediger & Karpicke, 2006 ; Cepeda et al., 2006 ), we formulated four hypotheses: Hypothesis 1 (Replication): Successful L2 vocabulary learning will elicit a robust N400 incongruity effect from pre- to post-test, replicating prior findings of semantic integration. 
Hypothesis 2 (Neural Effects of Strategy): Learning strategies that promote lexical-semantic integration—namely retrieval practice, corrective feedback, multisensory encoding, and distributed learning—will enhance the N400 incongruity effect after training. Hypothesis 3 (Behavioral Impact): Items learned under these strategies will show superior learning outcomes compared to items trained without them. Hypothesis 4 (Individual Differences): High-performing learners will show larger N400 incongruity effects than low performers, indicating more efficient and robust lexical-semantic integration. Together, these hypotheses aim to clarify how evidence-based learning strategies modulate both the neural and behavioral outcomes of L2 vocabulary learning. 2 Methods 2.1 Participants Eighty-three healthy adults (M age = 28.59 years; range = 18–40; 54 females) with normal or corrected-to-normal vision participated as part of a larger project. Participants were either native German or French speakers or had advanced proficiency in one of these languages (N German = 50; N French = 33). Recruitment was conducted via the UniDistance Suisse online participant database. All participants provided written informed consent and completed a comprehensive cognitive test battery. Six individuals were excluded from EEG analysis due to incomplete neurophysiological assessment or poor data quality. Participants received either compensation for up to eleven experimental hours or a payment of 200 CHF upon study completion. The ethics committee of UniDistance Suisse approved all procedures (Nr. 2019-12-00002). 2.2 Design The study employed a mixed factorial design incorporating both within-subject factors—Session (pre vs. post); Congruency (congruent vs. incongruent); Retrieval Practice (high vs. low); Corrective Feedback (corrective vs. non-corrective); Multisensory Learning at Encoding (multisensory vs. unisensory); Multisensory Learning at Retrieval (multisensory vs. 
unisensory)—and two between-subject factors—Performance Group (high vs. low performers) and Distributed Learning (distributed vs. massed), implemented across three sequential phases: pre-learning assessment, vocabulary learning intervention, and post-learning reassessment. Dependent variables included vocabulary-test accuracy (percent correct) and translation recognition task response-bias measures (d′, c, ln β). Neurophysiological measures comprised mean N400 amplitude (300–500 ms, six channels), preponderance of ERP template maps (topographic clustering), Global Field Power (GFP), and Global Map Dissimilarity (GMD). 2.3 Materials 2.3.1 Stimuli Forty-eight Finnish nouns (L2) were each paired with a German or French translation (L1) and consistently presented across phases. Language direction (L1–L2 vs. L2–L1) was varied across the vocabulary test, the translation recognition task, and the mobile-app intervention, but was held constant within each participant across phases. Across the sample, items were intended to appear approximately equally often in L1–L2 and L2–L1 (50:50). Due to a small number of stimulus exclusions (see below and Supplementary Table S1 ), the final analyzed dataset deviates slightly from the intended balance. All stimuli were presented in three modalities during the intervention: auditory, visual, and pictorial. Auditory stimuli were sourced from Universal-Soundbank.com, freesound.org, or generated via Google Translate (a female voice). Visual stimuli (written form) were presented in dark blue on a white background, with associated images, adhering to a 4:3 aspect ratio, sourced mainly from Wikimedia Commons or created using Microsoft Paint 3D. Stimulus characteristics are detailed in Table 1 , with the complete list provided in Supplementary Table S1 . View this table: View inline View popup Download powerpoint Table 1 Description of the Stimuli by Language Four items contained typographical errors. 
Three of these affected all French-speaking participants and were excluded from all analyses. In a fourth case, the Finnish word huili (instead of huilu , “flute”) was presented during the intervention phase for four German-speaking participants, while huilu was used in the test phases. Due to this inconsistency, data for this specific word were excluded for these participants. Items with typographical errors are marked with an asterisk (*) in Supplementary Table S1 . Additionally, nine Finnish words used in the experiment did not correspond exactly to the intended German source words due to translation errors during stimulus preparation (marked with a dagger [†] in the Supplement). These translation discrepancies are detailed in the Supplementary Table and Table Note. All translation errors were present in the stimuli as presented to participants. Since none of the participants had prior knowledge of Finnish, these errors are not expected to have affected task performance or interpretation of results. 2.3.2 Vocabulary Test and Scoring The vocabulary test was administered as part of a cognitive test battery, involving cued recall tasks where participants translated between L1 and L2. Stimuli appeared centrally (black on grey background) via a standard 14-inch Hewlett-Packard laptop. For each participant and test session, accuracy was calculated as the proportion of correctly translated items. Responses were scored using a semi-automated algorithm based on orthographic similarity (optimal string alignment; see van der Loo, 2014 , for stringdist package), allowing for minor spelling errors and variations. A response was classified as correct if it matched the target translation exactly or differed by only a single character (“perfect” or “close” responses). All other responses were scored as incorrect. In cases where a response was equally close to more than one possible target word (“tie”), the item was excluded from scoring to ensure unambiguous classification. 
Additional cognitive tests included: Adapted French l’EVIP (Dunn & Thériault-Whalen, 1993) to assess L1 vocabulary size, Test of Variables of Attention (TOVA; Leark et al., 2008 ) for sustained attention, Standard Progressive Matrices (Raven et al., 1958) measuring fluid intelligence, a serial order reconstruction task ( Leclercq & Majerus, 2010 ; Gorin & Majerus, 2019 ; Majerus et al., 2006 ) for short-term order memory, a non-word short-term recognition task ( Leclercq & Majerus, 2010 ; Gorin & Majerus, 2019 ; Majerus et al., 2006 ) assessing item-specific short-term memory, and a tapping continuation task (Dalla Bella et al., 2017 ; Gorin & Majerus, 2019 ) for rhythmic processing. Tests were programmed and conducted using Lab.js (version 20.2.4; Henninger et al., 2020 ). 2.3.3 Translation Recognition Task A translation recognition task, adapted from Pu et al. (2016) , was used to assess the N400 incongruity effect. The task was conducted in Octave (version 4.0.3) with PsychToolbox extensions (3.0.14) on a Debian system. In each trial, two words were presented in black color sequentially at the center of a 24-inch LCD color monitor (HP LA2405x) with a light grey background. Each word appeared for 800 ms, with no interstimulus interval. The intertrial interval was fixed at 1,000 ms and included a jitter of 300–600 ms. Participants used the left or right arrow key to indicate whether they believed the second word was a correct translation of the first word. Immediately afterward, they responded to a second prompt by again using the arrow keys to indicate whether their decision was based on knowledge or guessing. Task duration ranged from approximately 30 to 50 minutes with optional breaks between blocks. Each of the 48 stimuli appeared once in a correct (congruent) and once in an incorrect (incongruent) translation per block, yielding 96 trials per block. 
Across four blocks—with alternating translation directions—participants completed either two blocks of L2–L1 followed by two blocks of L1–L2, or vice versa (two blocks L1–L2 followed by two blocks L2–L1). The order of these four blocks was counterbalanced across participants. Each block comprised 96 trials, with each of the 48 stimuli appearing once in a congruent and once in an incongruent pairing, yielding a total of 384 experimental trials per session. Incongruent pairs were generated by randomly combining words from the same stimulus set, ensuring semantic mismatch. In the first version of the task (N = 16), incongruent combinations were newly generated for each block, such that each incongruent pairing appeared at least once per session. This design introduced a potential learning artifact, as participants could begin to infer incongruent pairs through repetition. To address this, a second version (N = 67) fixed all incongruent combinations across blocks and sessions. In both versions, congruent pairs remained constant. Response key assignments were randomized and counterbalanced in the first version but fixed in the second version for consistency across sessions. 2.4 Procedure All sessions were conducted at the same UniDistance Suisse site for each participant—either one of the German-speaking locations (Naters or Brig) or the French-speaking site (Sierre). The study comprised a pre-learning phase (Sessions 1 and 2), a 14-day intervention phase, and a post-learning phase (Session 3). Figure 1 shows a schematic overview of the procedure. Download figure Open in new tab Figure 1 Overview of the Experimental Procedure and Implementation of Learning Strategies Note. (A) Experimental phases: pre-learning (Session 1: baseline vocabulary testing; Session 2: EEG assessment and initiation of the 14-day mobile-app intervention; blue = learning days; white = rest days); and post-learning (Session 3: vocabulary testing and EEG reassessment). 
Participants were randomized to distributed or massed schedules. (B) Example of word presentation in the mobile app during intervention. Interface elements (e.g., buttons and labels) are shown in English for illustration; the actual app was presented in German or French (L1) and Finnish (L2). Stimuli were allocated by retrieval proportion (70% retrieval practice; 30% restudy), modality (50% multisensory; 50% unisensory), and feedback type (50% corrective; 50% non-corrective). The intervention phase comprised 48 initial encoding trials, 12 daily sessions of 48 trials each, and a final retrieval session of 20 trials (total = 644 trials per participant). Session 1 (approximately 2.5 hours) involved cognitive and vocabulary testing and was conducted individually or in small groups (51 individually, 22 pairs, 10 groups of three). Session 2 (approximately 2 hours) consisted of a demographic questionnaire, visual acuity testing using Landolt rings (optikschweiz.ch), and EEG setup. Participants were seated approximately 60 cm from the computer screen, and a chin rest was used to minimize head movements and maintain constant viewing distance. The neurophysiological assessment began with a 3-minute resting-state EEG recording (eyes open), followed by two EEG tasks—a translation recognition and a fast periodic visual stimulation (FPVS) oddball paradigm—administered in random order. Only the translation recognition task is reported in the present manuscript. The EEG session concluded with detailed instructions for the mobile app-based vocabulary training. Session 3 (approximately 2 hours) comprised a repeated vocabulary test and EEG assessments. Six participants completed the EEG tasks before the vocabulary test to minimize order effects. The order of the two EEG tasks was kept consistent with Session 2. 
2.5 Electrophysiological Recording and Pre-processing EEG was recorded with a 64-channel sponge-based electrode system (RNet; Brain Products GmbH), arranged according to the extended international 10–20 system (ground: FPz, reference: Cz), with impedances kept below 30 kΩ. Signals were digitized at 1,000 Hz using a BrainAmp amplifier (Brain Products GmbH) and recorded on a Lenovo laptop (Windows 10 Home, 8 GB RAM). Pre-processing was performed using EEGLAB (version 2024.1; Delorme & Makeig, 2004 ; The MathWorks, Inc., 2022 ) and ERPLAB (version 12.00; Lopez-Calderon & Luck, 2014 ) and comprised downsampling to 250 Hz; band-pass filtering between 0.1 and 35 Hz; continuous artifact rejection; interpolation of broken or artifact-contaminated channels; re-referencing to the common average; peri-stimulus epoching (−200–800 ms); pre-stimulus baseline correction (−200–0 ms); artifact rejection on epochs (±150 µV); and removal of eye-blink artifacts. Following pre-processing, an average of 302 ± 68 epochs per participant pre-learning and 305 ± 64 epochs post-learning were retained. 2.6 Data Analysis 2.6.1 Statistical Analyses & Variables T-tests and mixed ANOVAs were conducted in RStudio (version 2024.12.0) with α = .05 as the threshold for statistical significance. Behavioral dependent variables included vocabulary test accuracy (percent correct) and response bias indices from the translation recognition task (sensitivity (d′), criterion location (c), likelihood ratio (ln β)). Response-bias indices were calculated as per Macmillan & Creelman (2005) , with hit and false alarm rates corrected using Snodgrass & Corwin’s (1988) formula (adding 0.5 and dividing by 𝑁 + 1, where 𝑁 is the number of congruent or incongruent trials). The specific computations were: $$d' = z_{H} - z_{FA} \quad (1)$$ The criterion location was computed as $$c = -\tfrac{1}{2}\left(z_{H} + z_{FA}\right) \quad (2)$$ The likelihood ratio was computed as $$\ln\beta = \tfrac{1}{2}\left(z_{FA}^{2} - z_{H}^{2}\right) = c \cdot d' \quad (3)$$ where $z_{H}$ and $z_{FA}$ denote the z-transformed hit rate and false alarm rate, respectively. 
For further group-level analyses, a median split was performed on vocabulary gain (i.e., post-test minus pre-test accuracy) across all participants; those with gains equal to or above the sample median were classified as “high performers,” and those below as “low performers.” Electrophysiological dependent variables encompassed mean N400 amplitudes measured at six centro-parietal electrodes (C3, Cz, C4, P3, Pz, P4), reflecting the canonical centro-parietal distribution of the mature N400 ( Kutas & Federmeier, 2011 ; Van Petten & Luka, 2012 ). We quantified mean amplitudes in the 300–500 ms window post-stimulus onset ( Šoškić et al., 2021 ). To capture global spatiotemporal dynamics, we performed topographic clustering and derived template-map preponderance (proportion of time frames assigned to each map within predefined epochs; time frames = TF) and used RAGU to compute Global Field Power (GFP) and Global Map Dissimilarity (GMD). Effects in GFP/GMD were assessed with the permutation-based global pAUC statistic (5,000 permutations). In the Results, we report the permutation p values associated with the global pAUC tests (formatted as “global pAUC, p = …”). 2.6.2 Topographic Clustering, Global Field Power, and Global Map Dissimilarity Analyses of neural activation were conducted using the freeware Cartool (version 5.02; Brunet et al., 2011 ) for topographic clustering and freeware RAGU (compiled 24 November 2020; Koenig et al., 2011 ) for GFP and GMD. Topographic clustering decomposed continuous ERPs into transient but stable ERP template maps that reflect discrete functional brain states. Grand-averaged ERPs per condition (pre-congruent, pre-incongruent, post-congruent, post-incongruent) were imported into Cartool and spatially filtered to enhance signal quality. Segmentation was performed using the Topographic Atomize and Agglomerate Hierarchical Clustering (T-AAHC) algorithm with a minimum segment length of 10 time frames (TF). 
The resulting group-level ERP template maps were then backfitted to individual ERPs via spatial correlation to derive map labels and preponderance. GFP analysis assessed differences in the strength of neural responses across conditions. GFP reflects the overall amplitude of electric brain activity, independent of topographic configuration. At each time frame 𝑡, GFP was computed as the root mean square across the 𝑁 electrodes ( Equation 4 ): $\mathrm{GFP}(t) = \sqrt{\frac{1}{N}\sum_{i=1}^{N}\left(u_i(t) - \bar{u}(t)\right)^{2}}$, where $u_i(t)$ is the potential at electrode $i$ and $\bar{u}(t)$ is the mean potential across all electrodes at time $t$. Significance for GFP was evaluated within RAGU’s global pAUC framework using nonparametric permutation tests (5,000 permutations). GMD analysis evaluated condition-related differences in scalp topographies for each pair of the four experimental conditions (pre-congruent, pre-incongruent, post-congruent, post-incongruent) across the full post-stimulus period (0–796 ms). In contrast to topographic clustering, which identifies recurring ERP template maps within predefined epochs, GMD provides a time-resolved measure of topographic dissimilarity between two conditions. For any two conditions 𝛼 and 𝛽, GMD at time 𝑡 was computed as ( Equation 5 ): $\mathrm{GMD}_{\alpha,\beta}(t) = \sqrt{\frac{1}{N}\sum_{i=1}^{N}\left(\hat{u}_{\alpha,i}(t) - \hat{u}_{\beta,i}(t)\right)^{2}}$, where $\hat{u}_{\alpha,i}(t)$ and $\hat{u}_{\beta,i}(t)$ are the GFP-normalized potentials at electrode 𝑖 for conditions 𝛼 and 𝛽, respectively, and 𝑁 is the number of electrodes. Statistical significance for GMD was likewise assessed via nonparametric permutation testing (5,000 permutations) within the global pAUC framework; in the Results we report the associated permutation p values. 3 Results 3.1 Vocabulary Test Vocabulary test accuracy increased substantially from pre- to post-learning (see Figure 2 ). On average, participants scored M = 0.41% ( SD = 1.19%; range 0–6.82%) before learning and M = 75.5% ( SD = 19.1%; range 16.7–100%) after learning. A paired-samples t-test confirmed this change was highly significant, t (82) = 36.07, p < .001, d z = 3.96, 95% CI [3.32, 4.59], indicating a large learning effect. Download figure Open in new tab Figure 2 Vocabulary Test Accuracy Before and After Learning Note. 
Boxplots show participants’ test accuracy (%) before and after learning. Gray circles are individual accuracy; colored lines connect paired measurements (low performers in red, high performers in blue). Green diamonds indicate group means, and asterisks denote significant within-group gains ( p < … [text between the “<” and “>” signs was lost in extraction: the end of the figure note and the start of the following paragraph] … p > 0.116; see Supplementary Table S2 ). There was a small but significant main effect of Feedback Type, F (1, 80) = 10.95, p = 0.001, η² g = 0.03. However, follow-up analyses showed that this effect was driven by low performers: The improvement in accuracy (post–pre) was higher for items learned with corrective feedback ( M = 61.8, SD = 22.6) than with non-corrective feedback ( M = 52.8, SD = 17.1), t (41) = 2.96, p = .005, d z = 0.46, 95% CI [0.14, 0.77]. In contrast, among high performers, there was no significant difference in improvement in accuracy between corrective ( M = 88.9, SD = 11.0) and non-corrective feedback ( M = 85.7, SD = 13.7), t (39) = 1.58, p = .121, d z = 0.25, 95% CI [−0.07, 0.56]. 3.2 Response-Bias Indices Sensitivity ( d′ ), criterion ( c ), and likelihood ratio (ln β ) were computed as described in the Methods. Sensitivity in the translation recognition task improved markedly from pre- to post-learning. The mean d′ score increased from M = 0.59 ( SD = 0.34) to M = 4.15 ( SD = 1.01), indicating a substantial gain in participants’ ability to distinguish correct from incorrect translations. A repeated-measures ANOVA revealed significant main effects of Session, F (1, 75) = 1603.27, p < .001, η² g = .89, and Performance Group, F (1, 75) = 30.16, p < … [text between the “<” and “>” signs was lost in extraction] … p > .05; see Supplementary Table S3). The criterion c value decreased from M = 0.28 ( SD = 0.45) pre-learning to M = 0.12 ( SD = 0.26) post-learning, indicating a shift toward less conservative responding. ANOVA results revealed significant main effects of Performance Group, F (1, 75) = 5.92, p = .017, η² g = .04 and Session, F (1, 75) = 9.49, p = .003, η² g = .05. 
The Session × Performance Group interaction was not significant, F (1, 75) = 0.75, p = .390, η² g = .00. No learning-strategy factors reached significance (all p > .26, η² g ≤ .01; see Supplementary Table S4 ), except for small group-specific interactions for Multisensory Learning at Retrieval (Performance Group × RM: F (1, 75) = 4.67, p = .034, η² g = .01) and Distributed Learning (Performance Group × DL: F (1, 73) = 5.40, p = .023, η² g = .07). The mean ln β value increased from M = 0.15 ( SD = 0.28) pre-learning to M = 0.43 ( SD = 0.97) post-learning, indicating a tendency toward more conservative decisions post-learning—participants were less likely to identify a translation pair as correct without sufficient certainty. A significant main effect of Session was found, F (1, 75) = 6.75, p = .011, η² g = .04. No significant main effect of Performance Group, F (1, 75) = 3.63, p = .061, η² g = .03, and no significant Session × Performance Group interaction, F (1, 75) = 0.62, p = .432, η² g = .00, were observed. No learning strategy effects were significant (all p > .05). 3.3 N400 Incongruity Effect To evaluate changes in semantic processing, we quantified the N400 incongruity effect as the amplitude difference between incongruent and congruent trials. A repeated-measures ANOVA revealed a significant main effect of Session, F (1, 75) = 99.52, p < .001, η² g = 0.32, indicating a larger incongruity effect post-learning. There was also a main effect of Performance Group, F (1, 75) = 14.44, p = .001, η² g = .11, with high performers showing greater N400 incongruity effects overall. Importantly, the Session × Performance Group interaction was significant, F (1, 75) = 6.79, p = .011, η² g = .03, reflecting that high performers exhibited a larger pre-to-post increase than low performers (see Figure 3A ). Download figure Open in new tab Figure 3 N400 Amplitude Change, Scalp Topographies, and ERP Waveforms Note. 
Panel A displays individual N400 incongruity effects (incongruent−congruent) before and after learning for low and high performers. Gray lines connect repeated measurements within participants; green diamonds represent group means; asterisks indicate significant within-group differences ( p < .001). Panel B depicts post–pre scalp topographies of the N400 incongruity effect (300–500 ms), with low performers on the left and high performers on the right; electrode Pz is marked by a white dot (color scale in µV at right). Panel C shows the grand-average post–pre ERP difference wave for the N400 incongruity effect at electrode Pz, with shaded bands representing standard error of the mean. Separate ANOVAs on post-learning N400 incongruity effects—examining each learning strategy by Performance Group—showed no modulation by strategy (all p > .588; see Supplementary Table S5 ). However, small but consistent main effects of Performance Group persisted across strategies (all p < .01, η² g < .13), confirming that high performers maintained larger incongruity effects after learning. Figure 3B illustrates the scalp distribution of the learning-related change in the N400 incongruity effect, calculated as shown in Equation 6 : $\Delta\mathrm{N400} = \left(\mathrm{Incongruent}_{\mathrm{post}} - \mathrm{Congruent}_{\mathrm{post}}\right) - \left(\mathrm{Incongruent}_{\mathrm{pre}} - \mathrm{Congruent}_{\mathrm{pre}}\right)$, averaged over the 300–500 ms window for low (left) and high (right) performers. Figure 3C presents the grand-average post–pre ERP difference wave at Pz (incongruent−congruent), confirming more pronounced parietal negativity in high performers. 3.4 Analyses of Global Features of the Electric Field at the Scalp 3.4.1 Topographic Clustering & GFP To investigate condition-related changes in the strength and topography of the scalp-recorded electric field, we first examined global features using topographic clustering and Global Field Power (GFP). Topographic clustering revealed six distinct ERP template maps over the 0–796 ms period ( Figure 4A ). 
Across conditions, Global Field Power ( Figure 4B ) consistently peaked during Map 2 (∼ 148–296 ms), indicating heightened early processing preceding the N400 window. Within the N400 window (300–500 ms), Maps 3 and 4 predominated. Map 3, characterized by broad left-hemispheric negativity, was present in pre-learning congruent and incongruent conditions as well as in the post-learning incongruent condition, but absent in the post-learning congruent condition, which was characterized by Map 4 and uniquely by Map 5. Map 4 displayed right-posterior positivity with opposing left-frontal negativity, while Map 5 featured left-posterior negativity coupled with pronounced right-central positivity. Download figure Open in new tab Figure 4 ERP Template Maps, GFP Time Courses by Condition with Segmentation, and Mean GFP by Session Note. Panel A shows the six ERP template maps (µV; color bar at right). Panel B displays GFP time courses for the four experimental conditions, with shaded colored bands indicating the temporal extent of each corresponding map from A. Panel C presents mean GFP amplitudes pre- and post-learning (± SEM ); paired-samples t-test, t (76) = −4.42, p < .001. This pattern suggests a learning-related reorganization of semantic processing. The disappearance of Map 3 post-learning for congruent items likely reflects a reduced need for effortful semantic processing, whereas Map 5’s unique presence suggests a more efficient or specialized processing state. In line with this interpretation, permutation testing on GFP using the global pAUC statistic revealed a significant main effect of Session (global pAUC, p = .0002; Figure 4C ), indicating stronger overall brain responses post-learning. No other main effects or interactions were significant (all global pAUC tests, ps > .129). 
3.4.2 Template-Map Preponderance by Epoch To investigate how template-map dynamics varied with learning, congruency, and performance, we analyzed the preponderance of each template map within three predefined temporal epochs. Preponderance was defined as the number of time frames (TF) in a participant’s ERP that showed the highest spatial correlation with a given template map, as identified during topographic clustering. Repeated-measures ANOVAs were conducted for each epoch with the factors Map, Session, Congruency, and Performance Group. Epoch 1 (0–73 TF; 0–292 ms) was dominated by Maps 1 and 2. A main effect of Map, F (1, 75) = 10.30, p = .002, η² g = .09, indicated that Map 2 exhibited a higher preponderance than Map 1, independent of Session, Congruency, or Performance Group. Epoch 2 (74–162 TF; 292–648 ms), which corresponds to the N400 window, was characterized by Maps 3 and 4 ( Figure 5 A ). A Session × Congruency × Map interaction, F (1, 75) = 5.43, p = .022, indicated condition-specific shifts in semantic processing dynamics. Follow-up analyses showed that, in post-learning congruent trials, Map 4 showed higher preponderance than Map 3, F (1, 75) = 22.03, p < .001, η² g = .23, with this effect stronger in high performers (Map × Performance Group: F (1, 75) = 6.42, p = .013, η² g = .08). Download figure Open in new tab Figure 5 Preponderance of Map 3, 4 and Map 5, 6 by Condition and Performance group Note. Preponderance of Map 3 and 4 (A), and Map 5 and 6 (B) expressed as proportion of total time frames per condition and performance group. Bars represent mean proportions. Error bars indicate the standard error of the mean. In post-learning incongruent trials, a similar Map × Performance Group trend emerged ( F (1, 75) = 4.07, p = .048, η² g = .05), although the main effect of Map did not reach significance ( p = .092). No Map- or Performance-related effects occurred in the pre-learning conditions. 
Across all conditions, a robust Congruency × Map interaction, F (1, 75) = 18.85, p < .001, η² g = .01, showed higher Map 3 preponderance during incongruent trials and higher Map 4 preponderance during congruent trials. A Session × Map interaction, F (1, 75) = 8.97, p = .004, η² g = .02, reflected increased Map 4 preponderance after learning. Epoch 3 (163–199 TF; 648–796 ms) involved Maps 5 and 6 (see Figure 5 B ). A Session × Congruency × Map interaction, F (1, 75) = 19.46, p < .001, η² g = .03, prompted follow-up ANOVAs. In all pre-learning conditions and in the post-learning incongruent condition, Map 6 preponderance exceeded that of Map 5 (all F ≥ 16.95, p ≤ .001). The post-learning congruent condition showed no significant Map difference ( p = .058). A Map × Performance Group interaction in the post-learning incongruent condition, F (1, 75) = 4.66, p = .034, η² g = .06, indicated greater Map 6 preponderance among high performers. No other Performance Group interactions were observed ( Fs ≤ 2.17, ps ≥ .145). These results suggest that learning effects on late-stage topographic map dynamics were strongest for incongruent items, particularly in high-performing individuals. ANOVA results are provided in Supplementary Table S6 . 3.4.3 Global Map Dissimilarity To complement the insights from topographic clustering and GFP, we employed Global Map Dissimilarity (GMD) to quantify, at each time point (0–796 ms), the degree to which the entire scalp topography differed between conditions. Whereas clustering reduces the data to a finite set of recurring ERP template maps and GFP indexes overall field strength, GMD provides a continuous, data-driven metric of spatial configuration differences—even when template-map identity or amplitude remains constant. 
Permutation testing using the global pAUC statistic revealed significant main effects of Session (global pAUC, p < .001), Congruency (global pAUC, p < .001), and Performance Group (global pAUC, p = .008), as well as significant Session × Congruency (global pAUC, p = .010) and Session × Performance Group (global pAUC, p = .009) interactions. The TANOVA time windows for the factor Session (the entire period 0–796 ms), for Congruency (from 232 ms onward), and for the Session × Congruency interaction (260–476 ms and 508–796 ms; see Supplementary Figure S1 ) mirror our clustering and GFP findings. Notably, the Session × Performance Group interaction was most pronounced between 276 and 428 ms ( Supplementary Figure S1E ), coinciding with the N400 window. This timing aligns with the analysis of topographic map preponderance in Epoch 2, where a Map × Performance Group interaction ( F (1, 75) = 6.42, p = .013, η² g = .08) showed that high performers exhibited higher Map 4 preponderance than low performers. Thus, the GMD confirms that individual competency not only modulates the strength (GFP) and topographic shifts (clustering) of the N400, but also the continuous scalp-map reconfigurations captured by GMD. Neither the Congruency × Performance Group interaction nor the three-way (Session × Congruency × Performance Group) interaction was significant (all ps > .26). 4 Discussion The present study demonstrated robust vocabulary learning gains accompanied by clear neural changes. Following two weeks of L2 vocabulary training, participants exhibited significant improvements in vocabulary test scores and enhanced discrimination sensitivity ( d′ ) for congruent versus incongruent word pairs. Critically, the N400 incongruity effect, minimal prior to training, emerged prominently after learning, reflecting successful integration of new L2 words into participants’ semantic networks. 
High-performing learners (those with above-median vocabulary gains) consistently showed larger N400 differences than low performers, indicating more efficient neural processing and deeper semantic encoding. Contrary to our hypotheses, however, there was little evidence that specific learning strategies (retrieval practice, corrective feedback, multisensory learning, or distributed learning) differentially modulated the N400 or behavioral outcomes, except for a modest benefit of corrective feedback on vocabulary test performance. These findings are discussed in the context of the established functional role of the N400 and prior ERP research on L2 vocabulary acquisition, with a particular focus on insights from the ERP template-map analyses. 4.1 Neural Sensitivity of the N400 The N400 is a well-established index of semantic integration, lexical access ease, and prediction error ( Kuperberg & Jaeger, 2016 ; Kutas & Federmeier, 2011 ; Lau et al., 2008 ; Murray et al., 2024 ). In line with Hypothesis 1, the pronounced N400 incongruity effect observed after learning confirms that the newly acquired words were efficiently integrated into the semantic network, enabling learners to form stronger lexical-semantic predictions. Consequently, encountering incongruent word pairs elicited greater semantic processing difficulty due to violated predictions, as indicated by increased N400 amplitudes ( Kuperberg & Jaeger, 2016 ; Lau et al., 2008 ). Previous ERP studies of L2 vocabulary acquisition typically employed shorter training intervals—often limited to 3–4 hours—and nonetheless reported detectable, albeit smaller, N400 incongruity effects (e.g., McLaughlin et al., 2004 ; Pu et al., 2016 ). Pu et al. (2016) showed that learners exhibited no reliable N400 incongruity effect prior to training but developed a significant, though comparatively moderate, effect after only three hours of instruction, with a clear frontal distribution. 
Importantly, their study exclusively employed L2–L1 translations, whereas our study tested translation recognition in both L2–L1 and L1–L2 directions, providing a more comprehensive assessment of lexical-semantic integration. By including both translation directions, our design may not only have promoted more robust and balanced semantic mapping by engaging both forward (L1–L2) and backward (L2–L1) translation processes (see Figure 3 for illustration), but also offered a more ecologically valid model of real-world L2 use. In everyday language contexts, L2 learners frequently encounter and produce words in both directions, and thus this bidirectional paradigm more closely mirrors the challenges and demands of authentic second language communication. According to the Revised Hierarchical Model ( Kroll & Stewart, 1994 ), these directions rely on partly distinct mechanisms—semantic mediation for L1–L2 and more direct lexical links for L2–L1—suggesting that activating both may strengthen cross-linguistic integration. High performers, in particular, may have benefited from this dual-route activation, leading to stronger N400 incongruity effects. Similar early frontal N400 patterns have been reported by Yum et al. (2014) , who observed enhanced frontal negativity in fast learners after short-term training. Likewise, McLaughlin et al. (2004) demonstrated rapid onset of N400 incongruity effects following very brief passive L2 exposure, suggesting initial stages of lexical acquisition. In contrast, our extended two-week intervention resulted in substantially stronger behavioral improvements and a more mature neural signature of semantic integration, characterized by clearer centro-parietal distributions and enhanced N400 differentiation between congruent and incongruent word pairs. These results align with findings from Armstrong et al. 
(2024) , who observed a similar maturational shift in N400 topography, moving from fronto-central dominance during early learning toward the canonical centro-parietal distribution following multi-day consolidation. Additionally, Elgort et al. (2014) reported comparable centro-parietal distributions among proficient L2 learners, further supporting the notion that increased lexical proficiency shifts the N400 topography toward canonical patterns. Moreover, the magnitude of the N400 incongruity effect in the present study varied systematically with participants’ vocabulary gains, supporting Hypothesis 4. This suggests that depth of lexical-semantic knowledge, rather than the specific learning strategies employed, primarily drives neural efficiency — that is, the brain’s ability to rapidly and effectively integrate new lexical-semantic information, resulting in more streamlined and differentiated neural responses during language processing — and ease of semantic integration. This interpretation is consistent with previous studies emphasizing the relationship between proficiency or learning depth and N400 amplitude modulation (e.g., Elgort et al., 2014 ; Yum et al., 2014 ). Qi et al. (2017) further demonstrated that initial N400 amplitudes to native language stimuli predicted subsequent vocabulary and grammar learning in an artificial language, underscoring the role that individual differences in semantic processing efficiency (a term used interchangeably here with "neural efficiency") play in learning outcomes. 4.2 Impact of Learning Strategies on Behavioral and Neural Outcomes One objective was to examine whether established learning strategies would produce measurable differences. Across all participants, a combination of retrieval practice, feedback, multisensory input, and distributed learning resulted in substantial learning gains—an increase of approximately 75 percentage points in vocabulary scores and improved translation recognition accuracy. 
However, when analyzing the effects of individual learning strategies, differences were modest, and no strategy reliably modulated the N400 amplitude or behavioral outcomes in isolation. In line with Hypothesis 2, we expected that retrieval practice would enhance long- term retention and sharpen semantic representations, potentially manifesting as a stronger post-learning N400 incongruity effect or superior behavioral performance. While the overall intervention clearly benefited learning, we did not observe a significant advantage for items practiced with higher retrieval proportion. This stands in contrast to previous findings demonstrating that retrieval practice enhances recall accuracy during vocabulary acquisition—a phenomenon known as the testing effect. Behavioral studies have consistently shown that actively retrieving word associations leads to superior long-term retention compared to passive restudy ( Barcroft, 2007 ; Fritz et al., 2007 ; Kang et al., 2013 ; Roediger & Karpicke, 2006 ). At the neural level, Liu et al. (2018) reported distinct ERP correlates of retrieval-based learning, and Li et al. (2023) found that actively retrieved L3 words elicited a reduced N400 amplitude compared to restudied items, interpreted as reflecting more efficient semantic access. In our study, however, no such effect emerged. This may be due to ceiling effects or overlapping exposure: items were learned repeatedly across conditions, and the high overall success rate may have masked potential condition-specific differences. A related issue concerns how ERP measures such as the N400 can be meaningfully linked to cognitive processes like encoding richness or memory consolidation. While reduced N400 incongruity is often interpreted as reflecting more fluent lexical-semantic access, these reductions do not necessarily indicate deeper or more stable memory representations. 
As such, the expected benefits of multisensory input and distributed learning on encoding and retention (Hypotheses 2 and 3) were not reflected in post-learning N400 incongruity or behavioral outcomes. Prior studies have shown that multimodal presentation (e.g., visual and auditory) deepens semantic encoding ( Shams & Seitz, 2008 ), and that spaced repetition enhances memory stability ( Cepeda et al., 2006 ). However, our design did not implement pure “present vs. absent” contrasts for any individual learning strategy. Even "unisensory" items could involve both visual and auditory input, shown in distinct screen regions (e.g., one in the upper and one in the lower part of the display). All participants engaged in repeated practice over a two-week period, which may have diminished the contrasts between conditions. Unlike studies that implemented sharper contrasts—such as multimodal versus unimodal input (e.g., Thelen & Murray, 2013 ) or massed versus widely spaced repetition at the item level (e.g., Atkin et al., 2023 ; Feng et al., 2019 )—our manipulation may not have been sufficiently strong to yield distinct neural or behavioral effects. Additionally, most of the aforementioned studies used between-subjects designs, which may have amplified contrast effects between learning conditions. Together, these differences in experimental design, contrast strength, and spacing duration may explain why the expected benefits of learning strategies were not observable in our ERP and behavioral outcomes. Subdividing the sample by learning strategy and performance group may have reduced statistical power to detect small or interaction effects. We did observe a very small behavioral benefit of corrective feedback: across participants, items for which the correct answer was presented immediately after a mistake showed slightly larger accuracy gains than items learned without corrective feedback. 
This aligns with educational theories that timely feedback strengthens memory traces by explicitly correcting the erroneous associations ( Nicol & Macfarlane-Dick, 2006 ). Yet, the effect size was limited ( η² g ≈ .03), and no corresponding effects emerged at the neural level, such as in the N400 amplitude. In summary, although the intervention led to substantial gains in vocabulary knowledge and neural differentiation, our results did not provide clear evidence that any individual learning strategy—retrieval practice, corrective feedback, multisensory learning, or distributed learning—consistently enhanced outcomes beyond the general effects of exposure. The small behavioral benefit observed for corrective feedback was specific to low performers—those who showed smaller accuracy gains—suggesting that immediate presentation of the correct answer after errors may be especially helpful for individuals with less improvement in vocabulary retention, even though no corresponding neural effects were found. Given the high overall learning success across conditions, it remains possible that the cumulative exposure across multiple strategies, rather than any specific one, supported lexical-semantic integration. However, since the design did not include a no-strategy control condition, conclusions about additive or synergistic effects of strategy combinations remain speculative. Future studies should more systematically isolate and contrast strategy effects to clarify their unique and interactive contributions to vocabulary learning. 4.3 High vs. Low Performers: Neural Efficiency and Strategy Use High performers showed more pronounced N400 incongruity effects and subtle topographic differences compared to low performers. 
Our study adds to the literature by showing that even when group-level learning gains are large, ERP measures such as the N400 and ERP template-map analyses reveal persistent qualitative differences between high and low performers—reflecting differences in neural efficiency (as previously defined, i.e., the brain’s ability to rapidly and effectively integrate new lexical-semantic information). In other words, high-performing learners exhibit more efficient neural processing of new vocabulary, as indicated by larger and more consistent N400 incongruity effects and more specialized ERP template-map configurations, which signal deeper semantic integration and more stable memory traces. In contrast, low performers may have remained uncertain about word meanings even post-learning, resulting in reduced or inconsistent N400 responses and less differentiated neural patterns. This pattern aligns with the idea that proficient learners process L2 semantics more similarly to native speakers ( McLaughlin et al., 2004 ). Our high-performing group’s neural activity can be viewed as more tuned to the semantics of the new words, whereas low performers might rely on more analytical or familiarity-based strategies (potentially engaging later positivity components for decision uncertainty). Although we did not find significant learning strategy-specific improvements for high versus low performers, minor interactions in response bias measures suggest that certain learning strategies (e.g., distributed learning) might subtly modulate response tendencies. Overall, these results highlight ERPs as a sensitive tool for revealing qualitative differences in how deeply L2 words are integrated, beyond simple recall accuracy. 
4.4 Neural Dynamics Revealed by ERP Template-Map Analyses, GFP, and GMD By extending traditional ERP analysis with ERP template-map analyses (topographic clustering), GFP, and GMD approaches, we provided a more detailed view of how the spatiotemporal patterns of brain activity are reorganized following vocabulary learning. This multimethod approach provided a more fine-grained view of when and how the brain’s functional states differ before versus after vocabulary acquisition. We identified six distinct ERP template maps that describe the dominant EEG topographies across the 800 ms epoch. Within the canonical N400 window (300–500 ms), we observed two different ERP template maps (Maps 3 and 4) whose preponderance varied by condition—a finding in line with Brandeis et al. (1995) , who reported separate preN400 and N400 scalp-maps during sentence processing. Notably, Map 3 (left-hemispheric negativity) was prominent before learning and in post-learning incongruent trials, while Map 4 and a unique Map 5 (right-central positivity/left-posterior negativity) characterized post-learning congruent trials, suggesting a shift towards more fluent or automatized processing. High performers exhibited higher Map 3 preponderance within the N400 window, consistent with their larger N400 amplitudes, indicating sustained semantic processing. This finding—that the post-learning congruent condition occupies a unique neural state—aligns with the emergence of Map 5 and underscores a qualitative change in how known correct translations are processed. Comparable shifts in scalp topographies driven by semantic predictability have also been reported in sentence processing (e.g., Perrin & Garcia- Larrea, 2003) and in category learning and semantic decision tasks ( Khateb et al., 2003 ), suggesting that semantic congruency can induce distinct neural configurations. 
Furthermore, findings from auditory learning ( Spierer et al., 2007 ) and perceptual classification ( Tzovara et al., 2012 ) provide theoretical and empirical support for the idea that learning systematically reorganizes not only response amplitude but also the spatial dynamics of brain activity across domains. Our GFP analysis revealed a general increase in global field strength post-learning— regardless of congruency—implying increased overall neural engagement. GMD confirmed robust congruency effects beginning at 232 ms, consistent with the onset of semantic processing reported in the literature ( Hauk et al., 2006 ; Kutas & Federmeier, 2011 ; Lau et al., 2008 ). The overall topographic pattern of the Session × Congruency interaction mirrors the learning- and congruency-related reorganization observed in the clustering and GFP results, reflecting conceptual convergence across analytic methods without offering additional temporal detail. In sum, these results demonstrate that vocabulary learning enhances both the strength and the spatiotemporal configuration of neural activity during semantic processing, as measured by multiple complementary EEG analysis techniques. 4.5 Comparison with Previous Studies and Implications Our findings contribute to a growing body of research at the intersection of L2 learning and neurocognition. They corroborate prior evidence that even initial stages of L2 word learning modulate the N400 ( Pu et al., 2016 ; Kutas & Federmeier, 2011 ) and extend this by linking the magnitude of the N400 incongruity effect to individual vocabulary gains ( Qi et al., 2017 ; Elgort et al., 2014 ). Although we tested four evidence-based digital learning strategies—retrieval practice, corrective feedback, multisensory encoding, and distributed learning—none showed clear advantages over the others in our design. 
This absence of differential strategy effects mirrors well-known boundary conditions: Roediger and Karpicke (2006) demonstrated that, once recall approaches ceiling levels, additional retrieval practice yields diminishing gains; and Kornell and Bjork (2007) showed that when retrieval is too easy (i.e., items are already well learned), testing produces smaller benefits than under more challenging conditions. Together, these studies indicate that when learning items are overlearned or tasks lack sufficient difficulty, the unique contributions of individual strategies are masked—exactly as we observed after our high-exposure, high-success learning intervention. Beyond educational implications, our analysis of topographic ERP mapping illuminates how vocabulary learning is accompanied by neural reorganization. The clear distinction between processing known versus unknown words supports models of synaptic and systems consolidation, whereby repeated activation refines synaptic weights and engages hippocampal–neocortical interactions to stabilize memory traces over time ( McGaugh, 2000 ; Frankland & Bontempi, 2005 ). This “representational sharpening” emerges as reduced trial- to-trial variability and the appearance of specialized EEG map configurations ( Paller & Wagner, 2002 ; Yassa & Stark, 2011 ). Consistent with the neural efficiency accounts—which posit that increasing proficiency yields more selective and topographically focal neural engagement ( Haier et al., 1992 ; Neubauer & Fink, 2009 )—our topographic ERP mapping findings show increasingly focal scalp topographies both after vocabulary acquisition and in high-performing learners ( Khateb et al., 2003 ; Spierer et al., 2007 ; Tzovara et al., 2012 ). 
Importantly, whereas Neubauer and Fink (2009) report reduced global field strength in experts, our high performers exhibited larger N400 incongruity effects alongside focal ERP template-map engagement, reflecting qualitative specialization rather than mere amplitude suppression. Together, these results provide empirical support for theories of brain plasticity showing that, as vocabulary knowledge consolidates, cortical networks reorganize into more stable, specialized patterns observable across perceptual, semantic, and associative learning domains. These findings underscore the potential of ERP and topographic clustering as sensitive tools for monitoring individual progress and for evaluating the impact of pedagogical interventions in L2 learning. Future research should investigate whether these learning-induced neural signatures—such as changes in N400 incongruity and ERP template-map dynamics—generalize to other populations and tasks, including productive language use. In particular, children typically show shorter and less stable EEG microstates in resting activity (Koenig et al., 2002) and a delayed/broader N400 (Holcomb et al., 1992; Friedrich & Friederici, 2004). 4.6 Limitations There are some limitations to consider. First, although we manipulated three strategies (retrieval practice, corrective feedback, multisensory learning) within participants and distributed learning between participants, the nested implementation may have attenuated contrasts. Moreover, the two-week intervention yielded very high overall success rates—vocabulary test performance increased from 0.41% to 75.5% ($d_z = 3.96$) and sensitivity ($d'$) in the translation recognition task increased from 0.59 to 4.15 ($\eta^2_G = .89$)—such that even suboptimal strategy assignments were sufficient to drive near-ceiling learning and obscured any strategy-specific benefits (all $\eta^2_G \leq .03$ for strategy factors). 
Second, although our EEG sample (N = 77) is large for the field, exclusions due to artifact rejection and the median split reduced power for interaction tests; effect sizes for strategy-related ERP interactions were small ($\eta^2_G \leq .02$). Third, our EEG paradigm focused exclusively on translation recognition—a receptive task in both L2–L1 and L1–L2 directions—and did not assess productive use (e.g., cued recall or sentence production). It remains to be tested whether similar ERP template-map reconfigurations and N400 dynamics arise under more generative demands, which would help establish the generality of these neural markers across task contexts. 4.7 Conclusion This study demonstrates that intensive L2 vocabulary learning rapidly strengthens semantic processing, as evidenced by larger N400 incongruity effects in successful learners, while remaining largely unaffected by the particular learning strategy employed. Our ERP template-map analyses further demonstrate that learning shifts which ERP template maps dominate the N400 window not only from pre- to post-learning but also differentially by congruency (congruent vs. incongruent), reflecting a qualitative reorganization of neural activity rather than a mere increase in amplitude. Together, these results bridge cognitive neuroscience and language education by demonstrating that effective vocabulary acquisition leaves stable, condition-specific neural signatures in semantic processing. Importantly, our findings underscore the practical value of ERP and topographic clustering for capturing individual learning-related changes in second language acquisition—even in the absence of clear differential effects of specific learning strategies. These neural measures may therefore provide sensitive biomarkers of L2 learning success, offering unique insights into individual differences in learning outcomes that are not always captured by behavioral measures alone. Author Contributions Nicole H. 
Skieresz: Conceptualization; Methodology; Investigation; Formal analysis; Data curation; Writing – original draft; Writing – review & editing. Sandy C. Marca: Investigation; Data curation; Methodology; Writing – review & editing. Micah M. Murray: Supervision; Conceptualization; Methodology; Formal analysis; Writing – review & editing. Thomas P. Reber: Supervision; Conceptualization; Methodology; Writing – review & editing; Funding acquisition. Nicolas Rothen: Supervision; Conceptualization; Methodology; Writing – review & editing; Funding acquisition. Note. Micah M. Murray, Thomas P. Reber and Nicolas Rothen contributed equally to this work (*). Data Availability Statement Data and analysis scripts are available to editors and reviewers via a private, view-only OSF link: https://osf.io/bj6pt/?view_only=ead3461634134e209cd8c234687e1d6e Upon acceptance, we will make the OSF project public. Preprocessed EEG data are archived on Zenodo (DOI: https://doi.org/10.5281/zenodo.16538184 ) and are currently accessible to reviewers via a private link described in the OSF README. The Zenodo record will be made public upon publication. Conflict of Interest Statement The authors declare no competing interests. Funding This research was conducted as part of the project “School of Tomorrow” at UniDistance Suisse, Brigue, Switzerland and was funded by the Canton du Valais, Department of Economic Affairs and Education, Office of Higher Education. Funder Information Declared Canton of Valais, Department of Economic Affairs and Education, Office of Higher Education Footnotes https://osf.io/bj6pt/?view_only=ead3461634134e209cd8c234687e1d6e https://zenodo.org/records/16538184?token=eyJhbGciOiJIUzUxMiJ9.eyJpZCI6ImVlYzU2YWUxLWZkNTgtNGMyYy05NGFiLTM2NTI2ZjNiZjk3ZSIsImRhdGEiOnt9LCJyYW5kb20iOiIxMThhYmJjMWQxODliZDEyZmVjNGUyYjJhMTdiYjQyMyJ9.3yDX2kR9JNBIku3fz9GY086CWgfBW_M0rNXd7xrPex3SaJWEa8Y8F7AOgWu_fNg3Vqdps3DdsZ8jSr-E1EMqFw References ↵ Armstrong , S. R. , Copland , D. A. , Escudero , P. 
, & Angwin , A. J . ( 2024 ). Tracking the acquisition and retention of novel word representations: An ERP study . Language, Cognition and Neuroscience , 39 ( 4 ), 401 – 422 . doi: 10.1080/23273798.2024.2310549 OpenUrl CrossRef ↵ Atkin , C. , Stacey , J. E. , Roberts , K. L. , Allen , H. A. , Henshaw , H. , & Badham , S. P . ( 2023 ). The effect of unisensory and multisensory information on lexical decision and free recall in young and older adults . Scientific Reports , 13 , 16575 . doi: 10.1038/s41598-023-41791-1 OpenUrl CrossRef PubMed ↵ Barcroft , J . ( 2007 ). Effects of Opportunities for Word Retrieval During Second Language Vocabulary Learning . Language Learning , 57 ( 1 ), 35 – 56 . doi: 10.1111/j.1467-9922.2007.00398.x OpenUrl CrossRef ↵ Boros , M. , Magyari , L. , Morvai , B. , Hernández-Pérez , R. , Dror , S. , & Andics , A . ( 2024 ). Neural evidence for referential understanding of object words in dogs . Current Biology , 34 ( 8 ), 1750 – 1754 .e4. doi: 10.1016/j.cub.2024.02.029 OpenUrl CrossRef PubMed ↵ Brandeis , D. , Lehmann , D. , Michel , C. M. , & Mingrone , W . ( 1995 ). Mapping event-related brain potential microstates to sentence endings . Brain Topography , 8 ( 2 ), 145 – 159 . doi: 10.1007/BF01199778 OpenUrl CrossRef PubMed ↵ Brunet , D. , Murray , M. M. , & Michel , C. M. ( 2011 ). Cartool: A software for the visualization and analysis of multichannel EEG data. Retrieved from https://cartool.cibm.ch ↵ Cepeda , N. J. , Pashler , H. , Vul , E. , Wixted , J. T. , & Rohrer , D . ( 2006 ). Distributed practice in verbal recall tasks: A review and quantitative synthesis . Psychological Bulletin , 132 ( 3 ), 354 – 380 . doi: 10.1037/0033-2909.132.3.354 OpenUrl CrossRef PubMed Web of Science ↵ Dalla Bella , S. , Farrugia , N. , Benoit , C. E. , Begel , V. , Verga , L. , Harding , E. , & Kotz , S. A. ( 2017 ). BAASTA: Battery for the Assessment of Auditory Sensorimotor and Timing Abilities . Behavior research methods , 49 ( 3 ), 1128 – 1145 . 
doi: 10.3758/s13428-016-0773-6 OpenUrl CrossRef ↵ Delorme , A. , & Makeig , S . ( 2004 ). EEGLAB: An open-source toolbox for analysis of single-trial EEG dynamics . Journal of Neuroscience Methods , 134 ( 1 ), 9 – 21 . doi: 10.1016/j.jneumeth.2003.10.009 OpenUrl CrossRef PubMed Web of Science Dunn , L. M. , & Thériault-Whalen , C. M . ( 1993 ). French adaptation of the Peabody Picture Vocabulary Test, revised: Manuals for forms A and B . Psycan . ↵ Edmonds , A. , Gerbier , E. , Palasis , K. , & Whyte , S . ( 2021 ). Understanding the distributed practice effect and its relevance for the teaching and learning of L2 vocabulary . Lexis , 18 . doi: 10.4000/lexis.5652 OpenUrl CrossRef ↵ Elgort , I. , Perfetti , C. A. , Rickles , B. , & Stafura , J. Z . ( 2014 ). Contextual learning of L2 word meanings: second language proficiency modulates behavioural and event-related brain potential (ERP) indicators of learning . Language, Cognition and Neuroscience , 30 ( 5 ), 506 – 528 . doi: 10.1080/23273798.2014.942673 OpenUrl CrossRef ↵ Feng , K. , Zhao , X. , Liu , J. , Cai , Y. , Ye , Z. , Chen , C. , & Xue , G . ( 2019 ). Spaced learning enhances episodic memory by increasing neural pattern similarity across repetitions . The Journal of Neuroscience , 39 ( 27 ), 5351 – 5360 . doi: 10.1523/JNEUROSCI.2741-18.2019 OpenUrl Abstract / FREE Full Text ↵ Frankland , P. W. , & Bontempi , B . ( 2005 ). The organization of recent and remote memories . Nature Reviews Neuroscience , 6 ( 2 ), 119 – 130 . doi: 10.1038/nrn1607 OpenUrl CrossRef PubMed Web of Science ↵ Friedrich , M. , & Friederici , A. D . ( 2004 ). N400-like Semantic Incongruity Effect in 19-Month-Olds: Processing Known Words in Picture Contexts . Journal of Cognitive Neuroscience , 16 ( 8 ), 1465 – 1477 . doi: 10.1162/0898929042304705 OpenUrl CrossRef PubMed Web of Science ↵ Fritz , C. O. , Morris , P. E. , Acton , M. , Voelkel , A. R. , & Etkind , R . ( 2007 ). 
Comparing and combining retrieval practice and the keyword mnemonic for foreign vocabulary learning . Applied Cognitive Psychology , 21 ( 5 ), 499 – 526 . doi: 10.1002/acp.1287 OpenUrl CrossRef ↵ García-Gámez , A. B. , & Macizo , P . ( 2022 ). Lexical and semantic training to acquire words in a foreign language: An electrophysiological study . Bilingualism: Language and Cognition , 25 ( 5 ), 768 – 785 . doi: 10.1017/S1366728921000456 OpenUrl CrossRef ↵ Gorin , S. & Majerus , S . ( 2019 ). Verbal and Musical Short-Term Memory: Evidence for Shared Serial Order Processes? . Psychologica Belgica , 59 ( 1 ), pp. 177 – 205 . doi: 10.5334/pb.426 OpenUrl CrossRef PubMed ↵ Hauk , O. , Davis , M. H. , Ford , M. , Pulvermüller , F. , & Marslen-Wilson , W. D . ( 2006 ). The time course of visual word recognition as revealed by linear regression analysis of ERP data . NeuroImage , 30 ( 4 ), 1383 – 1400 . doi: 10.1016/j.neuroimage.2005.11.048 OpenUrl CrossRef PubMed Web of Science ↵ Haier , R. J. , Siegel , B. V. , Jr. , Tang , C. , Abel , L. , & Buchsbaum , M. S . ( 1992 ). Intelligence and changes in cerebral glucose metabolic rate following learning . Intelligence , 16 ( 3– 4 ), 415 – 426 . doi: 10.1016/0160-2896(92)90018-M OpenUrl CrossRef Web of Science ↵ Henninger , F. , Shevchenko , Y. , Mertens , U. K. , Kieslich , P. J. , & Hilbig , B. E . ( 2020 ). lab.js: A free, open, online Study builder . doi: 10.5281/zenodo.597045 OpenUrl CrossRef ↵ Holcomb , P. J. , Coffey , S. A. , & Neville , H. J . ( 1992 ). Visual and auditory sentence processing: A developmental analysis using event-related brain potentials . Developmental Neuropsychology , 8 ( 2-3 ), 203 – 241 . doi: 10.1080/87565649209540525 OpenUrl CrossRef Web of Science ↵ Kang , S. H. K. , Gollan , T. H. , & Pashler , H . ( 2013 ). Don’t just repeat after me: Retrieval practice is better than imitation for foreign vocabulary learning . Psychonomic Bulletin & Review , 20 , 1259 – 1265 . 
doi: 10.3758/s13423-013-0450-z OpenUrl CrossRef PubMed ↵ Khateb , A. , Michel , C. M. , Pegna , A. J. , O’Dochartaigh , S. D. , Landis , T. , & Annoni , J. M . ( 2003 ). Processing of semantic categorical and associative relations: An ERP mapping study . International Journal of Psychophysiology , 49 ( 1 ) , 41 – 55 . doi: 10.1016/S0167-8760(03)00076-X OpenUrl CrossRef PubMed ↵ Koenig , T. , Kottlow , M. , Stein , M. , & Melie-García , L . ( 2011 ). RAGU: A free tool for the analysis of EEG/MEG data using randomisation statistics . Brain Topography , 24 ( 1 ), 3 – 12 . doi: 10.1007/s10548-010-0177-1 OpenUrl CrossRef ↵ Koenig , T. , Lehmann , D. , Michel , C. M. , & Brandeis , D . ( 2002 ). Millisecond by millisecond, year by year: Normative EEG microstates and developmental stages . NeuroImage , 16 ( 1 ), 41 – 48 . doi: 10.1006/nimg.2002.1070 OpenUrl CrossRef PubMed Web of Science Kornell , N. , & Bjork , R. A . ( 2007 ). The promise and perils of self-regulated study . Psychonomic Bulletin & Review , 14 ( 2 ), 219 – 224 . doi: 10.3758/BF03194055 OpenUrl CrossRef PubMed ↵ Kroll , J. F. , & Stewart , E . ( 1994 ). Category interference in translation and picture naming: Evidence for asymmetric connections between bilingual memory representations . Journal of Memory and Language , 33 ( 2 ), 149 – 174 . doi: 10.1006/jmla.1994.1008 OpenUrl CrossRef Web of Science ↵ Kuperberg , G. R. , & Jaeger , T. F . ( 2016 ). What do we mean by prediction in language comprehension? Language, Cognition and Neuroscience , 31 ( 1 ), 32 – 59 . doi: 10.1080/23273798.2015.1102299 OpenUrl CrossRef PubMed ↵ Kutas , M. , & Federmeier , K. D . ( 2011 ). Thirty years and counting: Finding meaning in the N400 component of the event-related brain potential (ERP) . Annual Review of Psychology , 62 , 621 – 647 . doi: 10.1146/annurev.psych.093008.131123 OpenUrl CrossRef PubMed Web of Science ↵ Kutas , M. , & Hillyard , S. A . ( 1980 ). 
Reading senseless sentences: Brain potentials reflect semantic incongruity . Science , 207 ( 4427 ), 203 – 205 . doi: 10.1126/science.7350657 OpenUrl Abstract / FREE Full Text ↵ Lau , E. , Phillips , C. , & Poeppel , D . ( 2008 ). A cortical network for semantics: (De)constructing the N400 . Nature Reviews Neuroscience , 9 ( 12 ), 920 – 933 . doi: 10.1038/nrn2532 OpenUrl CrossRef PubMed Web of Science ↵ Leark , R. A. , Greenberg , L. M. , Kindschi , C. L. , Dupuy , T. R. , & Hughes , S. J . ( 2008 ). TOVA professional manual . Los Alamitos, CA : TOVA Company . ↵ Leclercq , A.-L. , & Majerus , S . ( 2010 ). Serial-order short-term memory predicts vocabulary development: Evidence from a longitudinal study . Developmental Psychology , 46 ( 2 ), 417 – 427 . doi: 10.1037/a0018540 OpenUrl CrossRef PubMed ↵ Lopez-Calderon , J. , & Luck , S. J . ( 2014 ). ERPLAB: An open-source toolbox for the analysis of event-related potentials . Frontiers in Human Neuroscience , 8 , 213 . doi: 10.3389/fnhum.2014.00213 OpenUrl CrossRef PubMed ↵ Li , J. , Zhang , E. H. , Zhang , H. , He , X. , Li , D. , & Cao , H. W. ( 2023 ). Neural correlates of retrieval practice on the learning and memory retention of L3 French vocabulary . International Journal of Multilingualism , 21 ( 3 ), 1369 – 1385 . doi: 10.1080/14790718.2023.2166943 OpenUrl CrossRef ↵ Liu , X. L. , Tan , D. H. , & Reder , L. M . ( 2018 ). The two processes underlying the testing effect: Evidence from event-related potentials (ERPs) . Neuropsychologia , 112 , 77 – 85 . doi: 10.1016/j.neuropsychologia.2018.02.022 OpenUrl CrossRef PubMed ↵ Macmillan , N. A. , & Creelman , C. D . ( 2005 ). Detection theory: A user’s guide (2nd ed.) . Lawrence Erlbaum Associates Publishers . ↵ Majerus , S. , Poncelet , M. , Greffe , C. , & Van der Linden , M. ( 2006 ). Relations between vocabulary development and verbal short-term memory: The relative importance of short-term memory for serial order and item information . 
Journal of experimental child psychology , 93 ( 2 ), 95 – 119 . doi: 10.1016/j.jecp.2005.07.005 OpenUrl CrossRef PubMed Web of Science ↵ McGaugh , J. L . ( 2000 ). Memory – a century of consolidation . Science , 287 ( 5451 ), 248 – 251 . doi: 10.1126/science.287.5451.248 OpenUrl Abstract / FREE Full Text ↵ McLaughlin , J. , Osterhout , L. , & Kim , A . ( 2004 ). Neural correlates of second-language word learning: Minimal instruction produces rapid change . Nature Neuroscience , 7 ( 7 ), 703 – 704 . doi: 10.1038/nn1264 OpenUrl CrossRef PubMed Web of Science ↵ Midgley , K. J. , Holcomb , P. J. , & Grainger , J . ( 2009 ). Masked repetition and translation priming in second language learners: A window on the time-course of form and meaning activation using ERPs . Psychophysiology , 46 ( 3 ), 551 – 565 . doi: 10.1111/j.1469-8986.2009.00784.x OpenUrl CrossRef PubMed Web of Science ↵ Murray , M. M. , Brunet , D. , & Michel , C. M . ( 2008 ). Topographic ERP analyses: a step-by-step tutorial review . Brain topography , 20 ( 4 ), 249 – 264 . doi: 10.1007/s10548-008-0054-5 OpenUrl CrossRef PubMed Web of Science ↵ Murray , M. M. , Michel , C. M. , Grave de Peralta , R. , Ortigue , S. , Brunet , D. , González Andino , S. , & Schnider , A. ( 2004 ). Rapid discrimination of visual and multisensory memories revealed by electrical neuroimaging . NeuroImage , 21 ( 1 ), 125 – 135 . doi: 10.1016/j.neuroimage.2003.09.035 OpenUrl CrossRef PubMed Web of Science ↵ Murray , M. M. , Middelmann , N. K. , & Federmeier , K. D . ( 2024 ). Animal cognition: Dogs build semantic expectations between spoken words and objects . Current Biology , 34 ( 9 ), R348 – R351 . doi: 10.1016/j.cub.2024.03.045 OpenUrl CrossRef PubMed ↵ Neubauer , A. C. , & Fink , A . ( 2009 ). Intelligence and neural efficiency: Measures of brain activation versus brain connectivity . Neuroscience & Biobehavioral Reviews , 33 ( 7 ), 1004 – 1023 . 
doi: 10.1016/j.neubiorev.2009.04.001 OpenUrl CrossRef PubMed Web of Science ↵ Nicol , D. J. , & Macfarlane-Dick , D . ( 2006 ). Formative assessment and self-regulated learning: A model and seven principles of good feedback practice . Studies in Higher Education , 31 ( 2 ), 199 – 218 . doi: 10.1080/03075070600572090 OpenUrl CrossRef Web of Science ↵ Paller , K. A. , & Wagner , A. D . ( 2002 ). Observing the transformation of experience into memory . Trends in Cognitive Sciences , 6 ( 2 ), 93 – 102 . doi: 10.1016/S1364-6613(00)01845-3 OpenUrl CrossRef PubMed Web of Science ↵ Pashler , H. , Cepeda , N. J. , Wixted , J. T. , & Rohrer , D . ( 2005 ). When does feedback facilitate learning of words? Journal of experimental psychology. Learning, memory, and cognition , 31 ( 1 ), 3 – 8 . doi: 10.1037/0278-7393.31.1.3 OpenUrl CrossRef PubMed Web of Science Perrin , F. , & García-Larrea , L . ( 2003 ). Modulation of the N400 potential during auditory phonological/semantic interaction . Cognitive Brain Research , 17 ( 1 ), 36 – 47 . doi: 10.1016/s0926-6410(03)00078-8 OpenUrl CrossRef PubMed ↵ Pu , H. , Holcomb , P. J. , & Midgley , K. J . ( 2016 ). Neural changes underlying early stages of L2 vocabulary acquisition . Journal of Neurolinguistics , 40 , 55 – 65 . doi: 10.1016/j.jneuroling.2016.05.002 OpenUrl CrossRef PubMed ↵ Qi , Z. , Beach , S. D. , Finn , A. S. , & Gabrieli , J. D. E . ( 2017 ). Native-language N400 and P600 predict dissociable language-learning abilities in adults . Neuropsychologia , 98 , 111 – 122 . doi: 10.1016/j.neuropsychologia.2016.10.005 OpenUrl CrossRef PubMed R Core Team . ( 2024 ). R: A language and environment for statistical computing (Version 2024.12.0) [Computer software]. R Foundation for Statistical Computing . https://www.R-project.org/ Raven , J . ( 1958 ). Standard Progressive Matrices . London: H. K. Lewis . Reber , T. P. , & Rothen , N. ( 2018 ). 
Educational app-development needs to be informed by the cognitive neurosciences of learning & memory . npj Science of Learning , 3 ( 1 ), 22 . doi: 10.1038/s41539-018-0039-4 OpenUrl CrossRef PubMed ↵ Roediger , H. L. , & Karpicke , J. D . ( 2006 ). Test-enhanced learning: Taking memory tests improves long-term retention . Psychological Science , 17 ( 3 ), 249 – 255 . doi: 10.1111/j.1467-9280.2006.01693.x OpenUrl CrossRef PubMed Web of Science Roediger , H. L. , & Karpicke , J. D . ( 2006 ). The Power of Testing Memory: Basic Research and Implications for Educational Practice . Perspectives on Psychological Science , 1 ( 3 ), 181 – 210 . doi: 10.1111/j.1745-6916.2006.00012.x OpenUrl CrossRef PubMed Web of Science ↵ Shams , L. , & Seitz , A. R . ( 2008 ). Benefits of multisensory learning . Trends in Cognitive Sciences , 12 ( 11 ), 411 – 417 . doi: 10.1016/j.tics.2008.07.006 OpenUrl CrossRef PubMed Web of Science Snodgrass , J. G. , & Corwin , J . ( 1988 ). Pragmatics of measuring recognition memory: Applications to dementia and amnesia . Journal of Experimental Psychology: General , 117 ( 1 ), 34 – 50 . doi: 10.1037/0096-3445.117.1.34 OpenUrl CrossRef PubMed Web of Science ↵ Soto-Faraco , S. , & Spence , C . ( 2025 ). Crossmodal Semantics in Memory: Scoping Review and Meta-Analyses of Multisensory Effects in Short-Term and Episodic Memory Systems . Psychological Bulletin , 151 ( 7 ) , 861 – 891 . doi: 10.1037/bul0000483 OpenUrl CrossRef PubMed ↵ Soskey , L. , Holcomb , P. J. , & Midgley , K. J . ( 2016 ). Language effects in second-language learners: A longitudinal electrophysiological study of Spanish classroom learning . Brain Research , 1646 , 44 – 52 . doi: 10.1016/j.brainres.2016.05.028 OpenUrl CrossRef PubMed ↵ Šoškić , A. , Jovanović , V. , Styles , S. J. , Kappenman , E. S. , & Ković , V . ( 2021 ). How to do Better N400 Studies: Reproducibility, Consistency and Adherence to Research Standards in the Existing Literature . Neuropsychology Review . 
doi: 10.1007/s11065-021-09513-4 OpenUrl CrossRef Speer , R . ( 2022 ). rspeer/wordfreq: v3.0 [Software] . Zenodo . doi: 10.5281/zenodo.7199437 OpenUrl CrossRef ↵ Spierer , L. , Tardif , E. , Sperdin , H. , Murray , M. M. , & Clarke , S . ( 2007 ). Learning-induced plasticity in auditory spatial representations revealed by electrical neuroimaging . The Journal of Neuroscience , 27 ( 20 ), 5474 – 5483 . doi: 10.1523/JNEUROSCI.0764-07.2007 OpenUrl Abstract / FREE Full Text ↵ The MathWorks , Inc . ( 2022 ). MATLAB (Version R2022b) [Computer software] . https://www.mathworks.com/products/matlab.html ↵ Thelen , A. , & Murray , M. M . ( 2013 ). The efficacy of single-trial multisensory memories . Multisensory Research , 26 ( 5 ), 483 – 502 . doi: 10.1163/22134808-00002426 OpenUrl CrossRef PubMed Web of Science ↵ Tzovara , A. , Murray , M. M. , Michel , C. M. , & De Lucia , M. ( 2012 ). A Tutorial Review of Electrical Neuroimaging From Group-Average to Single-Trial Event-Related Potentials . Developmental Neuropsychology , 37 ( 6 ), 518 – 544 . doi: 10.1080/87565641.2011.636851 OpenUrl CrossRef PubMed ↵ van der Loo , M. P. J. ( 2014 ). The stringdist package for approximate string matching . The R Journal , 6 ( 1 ), 111 – 122 . doi: 10.32614/RJ-2014-011 OpenUrl CrossRef ↵ Van Petten , C. , & Luka , B. J. ( 2012 ). Prediction during language comprehension: Benefits, costs, and ERP components . International Journal of Psychophysiology , 83 ( 2 ), 176 – 190 . doi: 10.1016/j.ijpsycho.2011.09.015 OpenUrl CrossRef PubMed Web of Science ↵ Yassa , M. A. , & Stark , C. E. L . ( 2011 ). Pattern separation in the hippocampus . Trends in Neurosciences , 34 ( 10 ), 515 – 525 . doi: 10.1016/j.tins.2011.06.006 OpenUrl CrossRef PubMed Web of Science ↵ Yum , Y. N. , Midgley , K. J. , Holcomb , P. J. , & Grainger , J . ( 2014 ). An ERP study on initial second language vocabulary learning . Psychophysiology , 51 ( 4 ), 364 – 373 . 
doi: 10.1111/psyp.12183 OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted September 28, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Brain Network Differences in Second Language Learning Depend on Individual Competencies Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Brain Network Differences in Second Language Learning Depend on Individual Competencies Nicole H. Skieresz , Sandy C. Marca , Micah M. Murray , Thomas P. Reber , Nicolas Rothen bioRxiv 2025.09.28.679014; doi: https://doi.org/10.1101/2025.09.28.679014 Share This Article: Copy Citation Tools Brain Network Differences in Second Language Learning Depend on Individual Competencies Nicole H. Skieresz , Sandy C. Marca , Micah M. Murray , Thomas P. 
Reber , Nicolas Rothen bioRxiv 2025.09.28.679014; doi: https://doi.org/10.1101/2025.09.28.679014 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Neuroscience Subject Areas All Articles Animal Behavior and Cognition (7633) Biochemistry (17678) Bioengineering (13888) Bioinformatics (41927) Biophysics (21445) Cancer Biology (18585) Cell Biology (25491) Clinical Trials (138) Developmental Biology (13373) Ecology (19897) Epidemiology (2067) Evolutionary Biology (24308) Genetics (15606) Genomics (22494) Immunology (17736) Microbiology (40385) Molecular Biology (17175) Neuroscience (88581) Paleontology (666) Pathology (2830) Pharmacology and Toxicology (4822) Physiology (7641) Plant Biology (15139) Scientific Communication and Education (2045) Synthetic Biology (4293) Systems Biology (9822) Zoology (2271)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00