Linguistic Rules of Syntax and Sharing in the Complex Songs of a Tropical Passerine

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 76,299 characters · extracted from preprint-html · click to expand
Linguistic Rules of Syntax and Sharing in the Complex Songs of a Tropical Passerine | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Linguistic Rules of Syntax and Sharing in the Complex Songs of a Tropical Passerine View ORCID Profile Suyash Sawant , View ORCID Profile Chiti Arvind , View ORCID Profile Viral Joshi , View ORCID Profile Indranil Dutta , View ORCID Profile V. V. Robin doi: https://doi.org/10.1101/2025.07.31.666818 Suyash Sawant 1 Department of Biology, Indian Institute of Science Education and Research (IISER) Tirupati , Tirupati, AP 517619, India 2 Department of Wildlife Ecology and Conservation, University of Florida , Gainesville, FL 32603, USA 3 School of Natural Resources and Environment, University of Florida , Gainesville, FL 32603, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Suyash Sawant For correspondence: s.sawant{at}ufl.edu robin{at}labs.iisertirupati.ac.in Chiti Arvind 1 Department of Biology, Indian Institute of Science Education and Research (IISER) Tirupati , Tirupati, AP 517619, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Chiti Arvind Viral Joshi 1 Department of Biology, Indian Institute of Science Education and Research (IISER) Tirupati , Tirupati, AP 517619, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Viral Joshi Indranil Dutta 4 School of Languages and Linguistics, Jadavpur University , Kolkata, WB 700032, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Indranil Dutta V. V. Robin 1 Department of Biology, Indian Institute of Science Education and Research (IISER) Tirupati , Tirupati, AP 517619, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for V. V. Robin For correspondence: s.sawant{at}ufl.edu robin{at}labs.iisertirupati.ac.in Abstract Full Text Info/History Metrics Preview PDF Abstract 1. Birdsong offers a powerful model to study the evolution of complex communication systems. While most song syntax and sharing research focuses on temperate species with fixed repertoires, we know far less about tropical songbirds with large, open-ended vocal systems. 2. We examined song structure and cultural transmission in the White-bellied Sholakili Sholicola albiventris , a tropical passerine endemic to the Shola Sky Islands of southern India. We studied song complexity and spectro-temporal variation using over 6,000 songs from 17 color-banded males across five years. We analyzed the song syntax using sequence-based metrics, including Levenshtein Distances and N-gram models. 3. Our results reveal high syntactic variability across short and long timescales, with stable note-type cores and structured expansions of combinatorial sequences. Higher-order N-gram turnover was rapid and strongly individual-specific, while broadly sharing the population-level note pool. Song sharing was significantly higher among neighbors than non-neighbors. 4. Using Generalized Additive Models, we explain how social and ecological factors, including neighbor count, territory area, repertoire size, N-gram usage, and the spectro-temporal structure of N-grams, determine consistency across years and sharing across individuals. This study highlights parallels between human linguistics and syntactic organization in the complex songs of a tropical passerine. 1. Introduction Vocal communication is central to mediating social interactions, coordinating reproductive behaviors, and facilitating parental care across animal taxa ( Janik and Slater 2000 ; Mariette 2019 ; Riebel et al. 2019 ). Songbirds ( Passerines ) are particularly recognized for their structural and functional complexity in vocalizations, making them a good model system for investigating the evolution of vocal communication. Songs in these species function as a reproductive strategy, enabling individuals to attract mates, compete with rivals, and establish individual identity ( Kroodsma and Byers 1991 ; Brenowitz et al. 1997 ; Beecher 2017 ; Rose et al. 2022 ). These functions often rely on the recognition of song patterns, which allows individuals to assess one another and modulate their behavior through social interactions ( Catchpole 1987 ; Leitão et al. 2022 ). In many species, song sharing is typically a result of vocal learning and social affiliation ( Hughes et al. 1998 ; King and McGregor 2016 ; Sánchez and Mennill 2024 ), which implies knowledge of neighbours’ songs and contributes to maintaining territories. Song sharing, with group-level similarities and individual differences, creates a complex selective information landscape for vocal expression and cultural transmission ( Slater 1986 ; Dhondt and Lambrechts 1992 ; Podos and Warren 2007 ). Like human language, birdsong consists of sequences of discrete acoustic units: notes, syllables, or motifs arranged in non-random, often rule-based orders ( Kuhl 2003 ; Kershenbaum et al. 2014 ; Williams 2021 ). This syntactic organization enables birds to generate a large variety of vocal outputs from a limited set of elements, allowing for both repetition and recombination, much like the phonemic and grammatical structures in human speech ( Goldstein et al. 2003 ; Berwick et al. 2011 ; Samuels 2015 ; Kershenbaum et al. 2016 ). Although birdsong lacks semantic referentiality, it is often socially learned, context-dependent, and hierarchically organized, especially in species with complex social dynamics ( Doupe and Kuhl 1999 ; Fishbein et al. 2020 ). These parallels have led to an expanding literature comparing avian vocal systems and human language in terms of learning mechanisms, sequence structure, and cultural evolution ( Slater 1986 ; Griesser et al. 2018 ; Aamodt et al. 2020 ; Williams and Lachlan 2022 ). However, most of what we know about syntactic rules in birdsong again comes from temperate species with relatively simple, closed-ended repertoires ( Hughes et al. 1998 ) - birds that learn all their songs in a critical short window of development. It remains unclear whether similar structural rules apply to species with large, variable repertoires and open-ended learning, such as many tropical songbirds ( Price and Yuan 2011 ; Araya-Salas and Wright 2013 ). These open-ended learners can acquire new vocal elements throughout their lives, resulting in diverse and context-dependent song structures, and allowing for individual identity, repertoire turnovers, and rapid cultural evolution ( Cornez et al. 2017 ). This lifelong capacity for vocal modification parallels aspects of human language learning, where individuals can acquire new words, dialects, or even new languages well into adulthood ( Hughes et al. 1998 ; Bruno et al. 2021 ). These similarities suggest that open-ended vocal learning may be key in supporting flexible, socially responsive communication systems across species. The ability to learn new vocal elements throughout life challenges the assumption of fixed syntactic rules, raising critical questions about social and ecological factors that shape the evolution of information landscapes in more dynamic and interactive environments. In this study, we examine the structure and syntax of song sequences of a tropical passerine that is known to have highly variable songs - the White-bellied Sholakili Sholicola albiventris , endemic to the high-elevation Shola Sky Islands of the southern Western Ghats, India (Robin et al. 2017). This species is also thought to be an open-ended learner, making it a compelling system for studying variable vocal syntax and song sharing. We investigate how S. albiventris songs are constructed and modified over time, as well as their ecological significance. Specifically, we address (a) individual level variation within a year, including changes in consecutive songs, short- and long-term song plasticity; (b) individual level variation across years, focusing on annual repertoire turnover and long-term repertoire drift; and (c) across-individual patterns, including neighbor song sharing and individual vocal signatures. This framework allows us to evaluate vocal variation across multiple temporal and social scales. We apply a multi-scale analytical framework to capture the complexity of vocal syntax and its variation, representing songs as structured sequences of discrete acoustic units ( Kershenbaum et al. 2016 ). We fragment songs using individual note types and higher-order sequences to capture vocal organization at different levels, quantifying how birds construct, reuse, and recombine vocal elements across social and temporal scales. Our approach integrates methods developed initially in computational linguistics and information theory. We quantify the minimum number of insertions, deletions, or substitutions required to convert one sequence into another using Normalized Levenshtein Distance (NLD), a widely used metric in language processing ( Garland et al. 2012 ; Kershenbaum and Garland 2015 ). We also use N-gram models, adapted from text and speech analysis, allowing us to examine patterns of vocal sequence structure and track the emergence, persistence, or loss of syntactic fragments over time ( Somervuo and Harma 2004 ; Sidorov et al. 2014 ; Smith 2014 ). We integrated these tools with Generalized Additive Models (GAM) ( Hastie and Tibshirani 1990 ) to assess how ecological or social factors shape vocal consistency. 2. Methods 2.1 Study Species and Site This study examined songs of the White-bellied Sholakili ( Sholicola albiventris ), a monomorphic flycatcher endemic to the high-elevation Shola forests of the southern Western Ghats, India. We focused on S. albiventris males, who are highly vocal during the breeding season and are known for their complex and extensive repertoires used in territory defense and mate attraction ( Purushotham and Robin 2016 ; Sawant et al. 2022 ). Our focal population is in and around a forest patch in Kodaikanal, adjacent to the Kodaikanal Wildlife Sanctuary (Palani Hills, Tamil Nadu, India), at an elevation of ∼2100 m. Our study spanned over a partially disturbed montane forest landscape with a mix of native tropical montane cloud forest trees and Pinus and Eucalyptus plantations close to a human settlement ( Arasumani et al. 2019 ) ( Fig. S1 ). We conducted the fieldwork during the breeding seasons, March-June, spanning five years, with observations from four years, 2019 and 2021 to 2023, bearing the field logistic constraints due to the COVID-19 pandemic in 2020 ( Fig. S1 ). 2.2 Banding and Territory Mapping In order to track and record individuals ( Dunn and John Ralph 2004 ), we captured and color-banded adult birds using mist nets near known singing perches. Since the species exhibits no sexual dimorphism in plumage or size, we determined the sex of individuals using molecular techniques. Blood samples were collected via brachial venipuncture and stored in a Queen’s lysis buffer. We used established protocols ( Robin et al. 2021 ) for DNA extraction using DNeasy blood and Tissue Kit (DNeasy Blood & Tissue Handbook 2023), molecular sexing using P2/P8 primers ( Bantock et al. 2008 ), PCR amplification, and gel electrophoresis to distinguish male and female individuals, which allowed us to identify and focus analyses exclusively on males ( Table S1 ). We followed color-banded males throughout the breeding seasons to outline approximate individual territories. Using handheld GPS units and cellphones at each confirmed sighting, we aggregated locations to construct spatial outlines of breeding territories in QGIS v3.16.11 (QGIS Association). Later, we manually adjusted these boundaries based on more field observations, including natural boundaries and unoccupied gaps following ( Suarez Sharma et al. 2024 ). 2.3 Acoustic Data Collection and Processing We obtained high-quality recordings of focal individuals using either a Sennheiser ME66 shotgun microphone or a Wildtronics Pro-Mono parabolic microphone mounted to Zoom H6 or H4N digital recorders. We recorded S. albiventris songs from within 10 m of the focal individuals in the mornings, 5:00-12:00, and in the evenings, 15:00-19:00, under low wind and minimal anthropogenic noise conditions. We targeted approximately 150 songs per individual per year (described further below), resulting in a final dataset of >6000 songs from 17 males across the four years ( Table S2 ). All recordings were single-channel and stored as uncompressed files (WAV files, 44.1 kHz sampling rate, 16-bit resolution). All recordings were processed using Raven Pro v1.5 (K. Lisa Yang Center for Conservation Bioacoustics at the Cornell Lab of Ornithology), generating spectrograms with a 512-sample Hann window, 50% overlap, and a 512 DFT. Songs were manually segmented based on pauses greater than 2 seconds. Following established conventions in avian communication, SS annotated each vocal element (note) as a discrete acoustic unit separated by a visible temporal gap (supported by auditory confirmation), an approximate threshold of >0.02 seconds ( Kershenbaum et al. 2016 ). For each note, we marked the start-end times and frequency bounds using visual inspection of the spectrogram. 2.4 Sampling Effort and Statistical Power We determined the optimal number of songs to record per individual based on an initial rarefaction analysis of note-type accumulation curves ( Fig. S2A ). Using a pilot dataset of over 300 songs each for 12 individuals in a year, we observed that the number of unique note types plateaued between 120 and 180 songs per individual. Based on this asymptotic pattern, we adopted a standardized target of ∼150 songs per male per breeding season to capture most of each individual’s vocal repertoire while minimizing redundancy. To ensure sufficient statistical power to detect biologically meaningful variation in song structure, we conducted sensitivity analyses using Analysis of Variance (ANOVA) in G*Power 3.1 ( Faul et al. 2009 ). For temporal comparisons across four years within the same individual (n = 600 songs) and social comparisons across 12 individuals within a year (n = 1800 songs), our sampling design achieved 90% power to detect small effect sizes ( f = 0.154 and f = 0.109, respectively). These results confirm that despite our species being an open-ended learner, with a high repertoire size, our dataset is sufficiently sensitive to detect fine-scale variation in vocal traits across both temporal and ecological dimensions ( Fig. S2B - S2C ). 2.5 Note Classification Pipeline We implemented a semi-supervised classification pipeline using Spectrogram Cross-Correlation (SPCC) (Charif et al. 2010) to assign vocal elements to discrete note types and estimate repertoire diversity with a manually curated reference set of 1,000 notes, which served as the initial training dataset. The notes were annotated in Raven Pro v1.5 and exported, processed, and frequency bandpass filtered them using the warbleR package in R (Araya-Salas and Smith-Vidaurre 2017) to compute pairwise SPCC, with Pearson’s correlation used to quantify spectrogram similarity ( Fig. S3 ). We conducted the classification iteratively: each unclassified note was compared to reference notes until a correlation >0.97 assigned it a matching type. If the algorithm found no match, it accepted the highest-scoring match >0.8; otherwise, it treated the note as a new type, assigned a novel label, and added it to the training set. We selected these cut-offs based on manual validation of classified types of ∼1000 notes, cross-validated by two independent researchers (SS and CA). The algorithm added up to five replicates per newly assigned type to the training set to capture within-type variability ( Fig. S3 ). The dataset was incrementally updated as new types emerged, followed by a manual review to ensure structural distinctiveness, collapse redundant classes, and assess classification accuracy through random spot-checks. In all, we manually assessed around 2% of the notes, and with ∼160 note types among 46,628 annotated notes, we felt this method of automation combined with manual verification was the only practical way to conduct this procedure in a scalable manner. 2.6 Quantifying Song Features 2.6.1 Song Structure & Complexity Metrics We used custom R scripts ( Sawant 2025 ) to summarize the song-level spectro-temporal structure from extracted spectro-temporal parameters for each annotated note, including low, mean, and high frequencies, frequency bandwidth, and duration. We used both note- and song-level parameters to examine acoustic parameters across individuals and years ( Fig. 1 ). We calculated a range of metrics capturing both within-song variation and across-song repertoire structure to quantify vocal complexity. Within each song, we measured note count (total number of notes), note pace (notes per second), note types (number of distinct note categories), note richness (proportion of note types), and note diversity using the Song Richness Index (SRI) ( Sawant et al. 2021 ). We assessed note order using first-order Markov Entropy Rates (MER) ( Kershenbaum 2014 ) to evaluate syntactic predictability and spectro-temporal variation using a Note Variability Index (NVI) ( Sawant et al. 2022 ) based on spectro-temporal dissimilarity among notes ( Fig. 1 ). To evaluate across-song repertoire structure, we estimated individual-level note repertoires using the Chao1 estimator in the vegan package ( Kindt 2020 ) in R, which accounts for undetected note types. We also generated rarefaction curves to assess note-type accumulation across increasing song samples, allowing us to evaluate repertoire saturation and compare vocal richness for an individual within a year. Download figure Open in new tab Figure 1: Comparison of song structure and syntax using two example song sequences. Spectrograms show two songs (Song 1 and Song 2) with labelled note identities and acoustic annotations at both the note and song levels. Key spectro-temporal parameters - duration, mean frequency, and frequency bandwidth are illustrated on the spectrograms. The summary metrics below each song quantify vocal complexity using specific complexity metrics. The Normalized Levenshtein Distance (NLD) measures syntactic dissimilarity between the sequences based on the number of edit operations required for alignment. The lower panel splits each song into its constituent N-grams:1 grams (individual notes), 2-grams (note pairs), and 3-grams (note triplets). Counts shown beneath each N-gram indicate their frequency within each song. 2.6.2 Song Syntax Metrics To quantify fine-scale structural differences between songs, we calculated Normalized Levenshtein Distance (NLD). This string-edit metric estimates the minimum number of insertions, deletions, or substitutions required to convert one sequence into another. We treated each song as a linear sequence of note-type names and computed pairwise NLD between songs produced by the same individual within a recording session, across sessions, and years ( Fig. 1 ). These distances allowed us to quantify the degree of song-to-song variation and assess temporal patterns of vocal plasticity within bouts and breeding seasons. We compared consecutive and non-consecutive (random) song pairs to test whether syntactic changes were gradual or abrupt and whether divergence changed with time. We extracted N-gram sequences from annotated notes to characterize higher-order syntactic structure, treating note types as discrete symbolic units. We focused on 1-gram (individual notes), 2-gram (adjacent note pairs), and 3-gram (adjacent note triplets) levels to capture increasingly complex patterns of syntax organization ( Fig. 1 ). We compiled repertoires of N-gram types for each individual per year and calculated their diversity, frequency of use, and overlap across years. To assess repertoire turnover, we computed the proportion of N-grams retained, dropped, or newly introduced from one year to the next, providing insights into how vocal syntax evolves within individuals. To evaluate patterns of N-gram sharing across individuals, we measured pairwise overlap in N-gram repertoires. We also constructed cumulative N-gram accumulation curves across individuals to assess how syntactic diversity scales at the population level. 2.7 Modeling Song Sharing: Statistical Methods To examine the ecological and acoustic drivers of syntactic structure in S. albiventris songs, we constructed two sets of Generalized Additive Models (GAMs) using the mgcv package in R. 2.7.1 N-gram Consistency Across Years The first model set focused on intra-individual consistency of N-gram usage across consecutive years. Each N-gram type was classified as either “consistent” (used in both years) or “not-consistent” (used in Year 1 - Y1 but not in Year 2 - Y2). We modeled the probability of each N-gram being classified as consistent or learned using the following predictors: (1) ΔTerritoryArea Y1→Y2, i : proportional change in territory area from Y1 to Y2 for i ; (2) NeighborCount Y1 ∪ Y2, i : cumulative number of neighbors across the two years for individual i ; (3) NgramOccurrence Y1, i : number of times N-gram g occurred in i’s songs in Y1; (4) NgramRichness Y1, i : total number of unique N-grams used by i in Y1; (5) NgramPosition g : mean position of N-gram g within songs; (6) NgramMeanFreq g : mean frequency (Hz) of N-gram g ; (7) NgramFreqBand g : frequency bandwidth (Hz) of N-gram g ; and (8) NgramDuration g : temporal duration (s) of N-gram g . 2.7.2 N-gram Sharing Between Individuals The second model set analyzed pairwise N-gram sharing within a year, where each N-gram was classified as “shared” (used by both individuals in a pair) or “not-shared” (used by only one of them). We modeled the probability of sharing between individuals i ₁ and i ₂ as a function of: (1) TerritoryDistance i₁↔i₂ : distance (in meters) between territory centroids of the pair; (2) Shared NeighborCount i₁ ∩ i₂ : number of shared neighbors between individuals i ₁ and i ₂; (3) max(NgramOccurrence g, i₁ , NgramOccurrence g, i₂ ): maximum usage count of N-gram g between the pair; (4) NgramRichness i₁ ∪ i₂ : total number of unique N-grams used by the pair; (5) NgramPosition g : mean position of N-gram g within songs; (6) NgramMeanFreq g : mean frequency (Hz) of N-gram g ; (7) NgramFreqBand g : frequency bandwidth (Hz) of N-gram g ; and (8) NgramDuration g : temporal duration (s) of N-gram g . We modeled all predictors using penalized thin plate regression splines s() , allowing for flexible estimation of non-linear relationships. We ran all models separately for 1-gram, 2-gram, and 3-gram levels, and retained all predictors across models regardless of statistical significance to enable effect comparisons. 3. Results This study analyzed over 6000 songs from 17 color-banded male S. albiventris , recorded over four breeding seasons (2019, 2021-2023). Using a combination of spectral, syntactic, and combinatorial metrics, we characterized vocal variation across three temporal scales within and across days, and across years. We examined spectro-temporal features such as mean and delta frequency and vocal complexity metrics such as note count, richness, and Markov Entropy Rate. In parallel, we quantified sequence-level consistency using Normalized Levenshtein Distances (NLDs) and tracked the growth of individual N-gram repertoires (unigrams, bigrams, trigrams) to assess structural plasticity over time. Finally, we evaluated social and spatial predictors of N-gram overlap among individuals to understand the extent and drivers of vocal sharing. These results offer a multi-layered perspective on the individual, social, and temporal dynamics shaping vocal communication in a montane songbird with highly variable songs. 3.1 Territorial Dynamics and Social Context Despite the high site fidelity of many individuals (e.g., individual YYXX), we observed variation in territory size, locations, and neighboring individual interactions across four years (e.g., individual YOXX). For example, several individuals had turnover of neighboring males between years, and some territories declined in area. In contrast, we observed some new individuals (e.g., individual RUGG) dispersing into new areas, claiming empty spaces and/or pushing previously territory-holding individuals to introduce their territories. The long-term monitoring and banding allowed us to track persistent and newly recorded individuals in subsequent years ( Fig. 2 ). Download figure Open in new tab Figure 2: Annual (breeding season) territory maps of individually banded male S. albiventris across four breeding seasons (2019, 2021-2023) in the montane habitats of Kodaikanal, southern India. Polygons represent mapped male territories, with colors indicating banding and song analysis status: light blue = banded individuals, dark blue = banded individuals with song data analyzed that year, and gray = approximate territories of unbanded individuals. Territory boundaries are based on repeated resighting, spatial mapping, detecting song perches, and individual interactions, during the breeding season of the year. 3.2 Song Structure: Spectro-Temporal Features and Complexity S. albiventris songs covered a broad frequency bandwidth of 3 to 9 kHz around a mean frequency between 4.5 and 5.5 kHz, with most individuals singing song-segments of 1.5 to 4 seconds duration. Despite this broad range, variation in these acoustic features was only partially structured by individual identity or year. Kruskal-Wallis tests revealed significant but moderate individual-level differences in mean frequency and bandwidth, suggesting that some males consistently favored higher or broader frequency ranges. Song duration also varied significantly across individuals, with some producing notably longer songs. Some individuals also showed significant differences in these spectro-temporal parameters across years ( Fig. S4 ). The first two principal components resulted from the PCA of all song-level acoustic parameters, explained 87% of the variance, but did not indicate any distinct clustering by individual or year ( Fig. S5 ). These results suggest spectro-temporal features alone do not encode individual identity or population dialect patterns. Next, we examined song complexity metrics to assess vocal richness, diversity, and syntactic organization variation. These included note count, pace, repertoire size (note types and richness), diversity (Song Richness Index), spectro-temporal variation (Note Variability Index), and note order (Markov Entropy Rate). Most individuals showed significant differences in metrics, particularly in note count, note types, and song richness index. Some males consistently produced longer or more diverse songs, while others exhibited more repetitive or shorter sequences. Inter-annual variation was also evident in a few individuals, though overall patterns were more strongly structured by individual identity than by year ( Fig. S6 ). A principal component analysis of all song complexity features revealed that the first two dimensions explained 82% of the variance, with PC1 capturing structural diversity, and PC2 reflecting note count and pace ( Fig. S7 ). However, consistent with the spectro-temporal analysis, the PCA scores showed broad overlap among individuals and years, and did not reveal strong clustering by identity or time. 3.3 Song Syntax: Sequential Organization and Temporal Consistency Despite a shared structural framework, S. albiventris songs exhibit striking internal diversity in their syntactic arrangements. Our analysis of normalized Levenshtein Distance (NLD) between song pairs sampled across three temporal scales within a day, across days within a season, and across years revealed consistently high values (typically NLD > 0.9; Fig. 3A ), reflecting substantial syntactic plasticity. NLD values increased subtly with longer inter-song intervals beyond 4-5 minutes, suggesting that songs become progressively more distinct as temporal separation increases. Even within a single singing bout (generally a few minutes long), males rarely repeated similar song syntax (NLD < 0.5), and song pairs separated by more than a few minutes typically showed substantial structural divergence. Download figure Open in new tab Figure 3: Song consistency and cumulative N-gram usage over time for four individuals. (A) Normalized Levenshtein Distance (NLD) between a random pair of songs as a function of temporal separation. Left: comparisons within the same day (log-scaled in seconds), middle: across days within the same year (log-scaled in days), right: across years (1-4 year gaps). Colored points indicate individual comparisons; black lines show smoothed GAM trends. (B) Repertoire accumulation curves for 1-gram, 2-gram, and 3-gram types in 2022. Each panel shows the number of unique N-grams accumulated as a function of the number of songs sampled. Curves represent individual birds, with ribbons indicating ±1 SD based on 100 random permutations. (C) Cumulative unique N-gram types across recording years. Solid lines connect consecutive years with available data; dashed lines represent gaps due to missing recordings in 2020. Each panel shows the cumulative number of distinct N-grams detected for each individual by year. However, this high variation does not equate to disorder. Song syntax retained an underlying structure, particularly at the level of note types (1-grams). As we sampled more songs per individual, the number of unique 1-grams, 2-grams, and 3-grams steadily increased, although the rate and asymptote varied by N-gram level ( Fig. 3B ). Unigram repertoires saturated around 150 songs, suggesting a relatively stable note inventory. In contrast, the accumulation of bigrams and trigrams continued at a near-linear rate with increasing song count, indicating that novel combinations of notes emerge even within a single season. By extending this analysis across years, we quantified the cumulative number of unique unigrams, bigrams, and trigrams produced over time ( Fig. 3C ). Unigram repertoires showed relatively shallow growth, with most note types reused across years and few novel notes added, indicating a relatively stable basic inventory. In contrast, the number of bigrams and trigrams increased rapidly each successive year, suggesting ongoing reorganization and innovation in how existing notes are combined. Even so, given the vast number of potential permutations, observed combinations represented only a small fraction of the possible syntactic space, implying that song syntax is not randomly assembled but constrained by individual-specific or culturally transmitted rules. 3.4 Song Sharing We observed a strong effect of social factors on N-gram repertoire structure and sharing. Across both years analyzed (2021 - 12 individuals and 2022 - 13 individuals), cumulative N-gram richness increased with the number of individuals, but at varying rates depending on N-gram size ( Fig. 4A ). One-gram richness showed signs of saturation (possibly around 15 individuals), whereas 2-grams and 3-grams exhibited a near-linear accumulation, indicating higher combinatorial diversity. Overall richness was consistently higher in 2021 compared to 2022 across all N-gram sizes, suggesting temporal drift in repertoire complexity. Download figure Open in new tab Figure 4: Social patterns of N-gram structure and sharing across individuals. (A) Cumulative N-gram richness as a function of the number of individuals, shown separately for 1-grams, 2-grams, and 3-grams. Lines represent mean richness across 100 random permutations, and shaded ribbons indicate standard deviation. (B) Distribution of N-grams by the number of individuals sharing them, shown as a percentage of total N-grams each year. Most 2- and 3-grams are individual-specific or rare. (C) Boxplots showing pairwise N-gram repertoire overlap between neighbors (territories ≤ 100 m apart) and non-neighbors, across N-gram sizes. Asterisks indicate Wilcoxon rank-sum test significance levels (* p < 0.05; ** p < 0.01; *** p < 0.001; n.s. = not significant). Year-specific comparisons are limited to 2021 and 2022, the two years with the most individuals recorded. Despite this richness, most N-grams were rare and individual-specific. In both years, over 90% of 3-grams and over 75% of 2-grams were used by only one or two individuals ( Fig. 4B ). In contrast, a significant proportion of 1-grams was more widely shared, with all individuals sharing a subset of 1-grams. These patterns reflect a high degree of vocal individuality at higher-order N-gram levels, suggesting that complex syntactic sequences are not commonly shared, even among individuals in close proximity. Consistent with this, N-gram repertoire overlap between neighboring individuals (territory centroids ≤ 200 m apart) was significantly higher than that between non-neighbors for 2-grams, indicating that shared short sequences may play a role in local social recognition or song matching ( Fig. 4C ). No significant difference was found for 1-grams and 3-grams, reinforcing that higher-order structures are more individualized and less influenced by spatial proximity. 3.5 Individual Signatures We identified a set of individual-specific N-grams uniquely produced by only one focal male in a given year, highlighting the presence of individualized vocal signatures. For each focal individual (eg, YYXX, YOXX, RUGG, YOGG), we extracted the most frequently occurring 1-gram, 2-gram, and 3-gram types that met this criterion ( Fig. 5 ). While all individuals exhibited distinct 2-gram and 3-gram signatures, 1-gram signatures were more limited, with some individuals (e.g., YYXX) lacking any consistent single-note signature in either year. The occurrence rates of these unique N-grams varied across individuals and years, but were relatively rare. The signature N-grams were structurally diverse, comprising short tonal elements and longer, frequency-modulated sequences. Many higher-order signatures included note combinations with distinct spectro-temporal features, suggesting that individual identity may be encoded not just in the presence of specific notes but also in the arrangement, duration, and acoustic structure of note sequences. Download figure Open in new tab Figure 5: Individual-specific N-gram signatures in S. albiventris songs. Rows correspond to 1-gram, 2-gram, and 3-gram units; columns represent four focal individuals (YYXX, YOXX, RUGG, YOGG). Each panel displays a spectrogram of the most frequently occurring N-gram that was uniquely produced by that individual in a given year. The total number of occurrences across ∼150 songs is indicated at the top-left of each panel. The year of signature occurrence is shown at the bottom-right. Purple boxes outline individual notes comprising each N-gram. 3.6 Impact of Social and Ecological Factors on Song Consistency and Sharing 3.6.1 Predictors of N-gram Consistency Across Years Generalized additive models revealed that the probability of an N-gram being retained across years within individuals was significantly influenced by N-gram occurrence and repertoire richness in Year 1, as well as by acoustic features such as frequency bandwidth and mean frequency ( Fig. 6A ). N-grams with higher occurrence frequency in Year 1 were more likely to be retained, suggesting that frequently used elements form the core of an individual’s vocal repertoire. Repertoire richness showed a nonlinear relationship: individuals with intermediate-sized N-gram repertoires had the highest probabilities of retention. In contrast, ecological factors such as proportional change in territory area and total number of neighbors across years had weak or nonsignificant effects. Download figure Open in new tab Figure 6: Results of generalized additive models (GAMs) examining ecological and acoustic predictors of N-gram usage in Sholicola albiventris . (A) Predicted probability of within-individual N-gram consistency across consecutive years. (B) Predicted probability of within-year N-gram sharing across individuals. Each column represents a different N-gram size (1-Gram, 2-Gram, 3-Gram), and each row shows the effect of a specific predictor on the probability of consistency or sharing. Rows 1-4 differ by model type: In (A) Consistency models, the predictors are: Proportional change in the territory area from Year 1 to Year 2, Total Number of neighboring individuals across two years, N-gram occurrence frequency in Year 1, and N-gram repertoire size in Year 1. In (B) Sharing models, the predictors are: Pairwise distance between territories, Number of shared neighboring individuals, Maximum N-gram occurrence between the pair, and Cumulative N-gram repertoire size across the pair. Rows 5-8 (shared across both model types) show effects of acoustic features: Mean position of the N-gram in the song, Mean frequency of the N-gram, Frequency bandwidth, and Duration of the N-gram. Lines show GAM-predicted probabilities, with shaded ribbons representing 95% confidence intervals. Line colors correspond to N-gram size: 1-Gram (purple), 2-Gram (pink), 3-Gram (orange). 3.6.2 Predictors of N-gram Sharing Within Years Within-year sharing of N-grams across individuals was primarily structured by spatial proximity and social connectivity ( Fig. 6B ). N-gram sharing decreased with increasing distance between territories, and the sharing of notes (1-grams) increased with the number of shared neighbors, indicating localized convergence driven by social exposure. Larger combined repertoire sizes were positively associated with sharing, suggesting that individuals with larger repertoires are more likely to have shared N-grams. 3.6.3 Syntactic and Structural Constraints Across Both Models The position of N-grams is critical in sharing, as N-grams occurring in the initial part of the song are likely to be shared by individuals. The spectro-temporal structure of N-grams influenced consistency and sharing patterns, with comparable trends across model sets. Frequency bandwidth was one of the strongest predictors: N-grams with narrower frequency ranges were more likely to be retained across years and shared across individuals, suggesting reduced complexity may favor stability and convergence. Mean frequency also showed moderate nonlinear effects, while duration had a weaker, inconsistent influence ( Fig. 6 ). 4. Discussion 4.1 Complexity beyond Spectro-Temporal Features Traditional acoustic features and complexity metrics quantify only partial aspects of song syntax diversity in S. albiventris . While spectro-temporal features like frequency bounds and song duration are helpful descriptors, they fail to capture the organizational intricacies that characterize the elaborate vocal repertoire of this species. Single-value indices such as note pace, note richness, Song Richness Index (SRI), Markov Entropy Rate (MER), and Note Variability Index (NVI) are informative for broad comparisons but are limited in scope. These metrics reduce complex vocal syntax into simplified summaries and overlook the internal structure and sequential transitions. In species with open-ended repertoires and high syntactic variation, such as S. albiventris , communicative complexity lies not just in how many elements exist, but in how they are combined and reused across time and social contexts ( Kershenbaum et al. 2014 ). This study emphasizes the need to move beyond traditional acoustic parameters and summary indices and adopt sequence-based, syntactic approaches to understand the intricacies of vocal communication in complex song systems. 4.2 Balancing Vocal Innovation and Identity S. albiventris displays a dynamic balance between vocal stability and innovation. Males reliably reused core note types across years, suggesting stable vocal “signatures,” yet higher-order N-gram structures showed ongoing turnover, reflecting active innovation within repertoires. This dual pattern suggests an evolutionary trade-off between the need for individual recognizability and the flexibility to diversify signals in response to shifting social or ecological pressures ( Briefer et al. 2008 ; Smith-Vidaurre et al. 2020 ). The inter-annual variation and syntactic plasticity observed here are typical of open-ended learners capable of modifying song beyond early development ( Cornez et al. 2017 ). This structured plasticity shows the potential for using birdsongs as a model to study how communication systems evolve under competing pressures for stability and novelty. 4.3 Social Context as a Driver of Vocal Learning Vocal learning is prominently shaped by intrinsic developmental programs and the social environment in which individuals acquire and use their songs. We found that males with more territorial neighbors tended to exhibit higher N-gram richness and greater syntactic flexibility, suggesting that vocal innovation is partially influenced by local social context. Territory overlap, proximity to other males, and opportunities for repeated vocal interactions may encourage learning and modifying vocal sequences. Our results suggest that S. albiventris males may navigate these demands by combining shared population-level syntax with personalized vocal signatures, such as those in European Wrens ( Catchpole and Rowell 1993 ), Skylarks ( Briefer et al. 2012 ), Great Tits ( Rivera-Gutierrez et al. 2010 ), and Splendid Sunbird ( Payne 1978 ) through repeated interaction with their acoustic neighborhood. This socially responsive vocal behavior is not unique, as social context plays a key role in shaping vocal learning trajectories, from dialect formation in temperate sparrows ( Hensel et al. 2022 ) to vocal convergence in parrots ( Wright and Dahlin 2017 ) and cetaceans ( Janik 2014 ). Rather than being fixed endpoints of early-life learning, repertoires may remain open to change throughout adulthood, especially in socially flexible, open-ended learner species ( Cornez et al. 2017 ). 4.4 Cultural Transmission and Formation of Vocal Dialects Patterns of N-gram sharing among S. albiventris males revealed a core set of syntactic elements widely used within a given year, indicating a shared cultural pool. These common N-grams, sustained through social learning and horizontal transmission among neighboring individuals, form the basis of a population-level dialect. Similar dynamics have been observed in the Yellow-naped Amazon ( Amazona auropalliata ), where consistent variation in contact calls coexists with the long-term stability of vocal dialects across populations ( Wright and Wilkinson 2001 ; Wright et al. 2008 ). At the same time, individual S. albiventris exhibited distinct N-gram patterns, creating a layered system of shared and individual-specific note sequences. In many passerines, such cultural variation is shaped by geographic and habitat barriers ( Laiolo and Tella 2005 ; Ortiz-Ramírez et al. 2016 ; Camacho-Alpízar et al. 2018 ), short dispersal distances ( Searcy et al. 2002 ; Graham et al. 2017 ), and constrained social networks ( Fernandez et al. 2017 ; Williams 2021 ), which can promote the emergence of localized dialects across fragmented landscapes. These findings highlight the potential of birdsong as a model for studying how geographic isolation, dispersal constraints, and habitat connectivity drive the evolution and divergence of cultural traits. 4.5 Parallels Between Birdsong and Human Language The syntactic structure of S. albiventris songs revealed striking similarities with the organization of human languages. In human speech, phonemes and words serve as symbolic units flexibly combined into larger sequences, and similarly, individual notes and N-grams in birdsong act as compositional building blocks ( Doupe and Kuhl 1999 ; Kershenbaum et al. 2016 ). Our analyses showed that these sequences are neither random nor rigid but exhibit structured transitions and recurrent patterns, reflecting principles akin to compositional syntax in language ( Berwick et al. 2011 ). S. albiventris syntax balances regularity and flexibility, suggesting a rule-governed but adaptable communication system similar to human languages. Vocal innovation, social learning, and inter-annual turnover in repertoires parallel key mechanisms of human cultural transmission that make it a valuable model for understanding the origins and dynamics of complex communication systems. 4.6 Analyzing Complex Song Syntax: Challenges and Opportunities Quantifying syntactic structure in birdsong introduces significant analytical challenges, particularly in species like S. albiventris that possess large, variable repertoires with flexible note ordering ( Kershenbaum et al. 2014 ; Sawant et al. 2022 ). Traditional methods often rely on fixed or stereotyped syntactic structures and may fail to capture the underlying organization in open-ended learners. While N-gram models are widely used to detect recurring syllables ( Sasahara et al. 2012 ; Smith 2014 ), they require careful implementation to distinguish meaningful syntactic patterns from chance co-occurrences, particularly in systems with high sequence variability. The huge combinatorial space of possible note arrangements can also lead to data sparsity, especially at higher N-gram levels. Moreover, classification accuracy in note labeling can compound this challenge: for example, with 80% precision at the single-note level, the accuracy of a 2-gram drops to ∼64%, and declines exponentially for longer sequences. These factors underscore the need for analytical tools that are both sensitive to latent structure and robust to observational noise. Despite these difficulties, our study shows we can detect robust patterns of N-gram reuse and structured innovation even in open-ended learners with high variability. 4.7 Long-term Monitoring of Tropical Birds and Future Directions Long-term monitoring is essential in tropical systems, where extended breeding seasons ( Renthlei et al. 2022 ), high adult survival ( Karr et al. 1990 ), and complex social dynamics ( Buskirk 1976 ) place unique pressures on vocal communication. Our multi-year study of S. albiventris demonstrates the value of sustained, individual-level acoustic monitoring for uncovering syntactic variation, vocal plasticity, and social learning. Crucially, such insights depend on the ability to track known individuals across years, highlighting the irreplaceable role of color-banding in studies of vocal communication and cultural transmission. We may fully understand the key processes, such as repertoire turnover, the maintenance of individual vocal signatures, and the development of population-level dialects, only through extended observations of individually marked birds. Unfortunately, recent policy changes have made obtaining permissions for color-banding endemic birds in India increasingly difficult, potentially undermining future efforts to study long-term vocal communication ( Shanker et al. 2023 ). As habitat fragmentation and degradation intensify across tropical montane forests ( Laurance et al. 2011 ), culturally transmitted traits essential for mate attraction, territoriality, and social cohesion may become increasingly fragile. Long-term, individual-based studies remain vital for understanding and conserving the cultural dimensions of avian biodiversity. Declaration of AI usage During the analytical process for the manuscript, we used ChatGPT-4o to simplify and clean our R scripts. We analyzed all the data in the R environment, and SS and CA thoroughly reviewed the scripts before finalizing the workflow. We used Grammarly to improve the readability and clarity, and Paperpile to manage citations, but we did not use Generative AI tools to write this manuscript. So we take full responsibility for the text presented here. Author Contribution Statement Suyash Sawant: Conceptualization, Data curation, Formal analysis, Investigation, Methodology, Software, Validation, Visualization, Writing - original draft, and Writing - review & editing. Chiti Arvind: Conceptualization, Data curation, Formal analysis, Investigation, Methodology, Software, Supervision, Validation, & Writing - review and editing. Viral Joshi: Conceptualization, Investigation, Methodology, Validation, & Writing - review and editing. Indranil Dutta: Methodology and Writing - review & editing. Robin V. V.: Conceptualization, Funding acquisition, Methodology, Project administration, Resources, Supervision, Writing - original draft, and Writing - review & editing. Funding Information This research was supported by the grants from the Government of India: Department of Science and Technology (DST) - Science and Engineering Research Board (SERB) (ECR/2016/001065), the Ministry of Environment, Forest and Climate Change (MoEFCC) (19-22/2018/RE), and intramural funds from Indian Institute of Science Education and Research (IISER) Tirupati. Supplementary Material Download figure Open in new tab Figure S1: (a) Location of Kodaikanal, Tamil Nadu (TN), in the southern Western Ghats of India. (b) Adult male Sholicola albiventris (White-bellied Sholakili), the focal species individual with Black-White (BWXX) color-band. (c) Satellite view of the primary study site, Bombay Shola, a mid-elevation montane evergreen forest fragment (∼40 ha) adjacent to Kodaikanal town. The yellow polygon marks the forest boundary used for sampling and territory mapping. Download figure Open in new tab Figure S2: (A) Rarefaction curves showing note-type accumulation across songs for 12 males, indicating saturation between 120-180 songs per individual. (B) Power analysis for detecting within-individual variation across four years (n = 600 songs). (C) Power analysis for detecting among-individual variation within a year (n = 1800 songs). Power analyses were conducted using one-way ANOVA in G*Power 3.1, showing ≥90% power to detect small effect sizes. Download figure Open in new tab Figure S3: Representative spectrograms (top) and hierarchical clustering dendrogram (bottom) illustrating the classification of note types into 13 distinct acoustic categories based on similarity in acoustic features. Clustering was performed using hierarchical clustering using spectrogram cross-correlation. Colors correspond to the final note clusters used in downstream analyses. Download figure Open in new tab Figure S4: Variation in spectro-temporal parameters across individuals and years. Boxplots show individual-level variation in five song-level acoustic features: (A) Frequency Bandwidth, (B) Mean Frequency, (C) Low Frequency, (D) High Frequency, and (E) Song Duration. Each boxplot represents an individual aggregated across all years (2019–2023), with overlaid colored error bars indicating inter-annual variation within each individual. Asterisks above boxes denote statistical significance of individual identity in linear mixed models (p < 0.05*, ** < 0.01**, *** < 0.001***; “ns” = not significant). Download figure Open in new tab Figure S5: Principal Component Analysis (PCA) of spectro-temporal song parameters. Top panels show PCA scores (PC1 vs. PC2) for all songs, colored by individual identity and faceted by year (2019–2023), illustrating population-wide overlap and inter-annual stability in acoustic space. Middle panels show within-individual PCA scores for four focal males, highlighting individual-specific clustering patterns colored by year. The bottom-left panel shows the variance explained by the top five principal components, with PC1 and PC2 accounting for 62% and 25% of the total variance, respectively. The bottom-right panel shows PCA loadings, indicating that PC1 primarily reflects frequency-based traits, while PC2 captures variation in frequency and temporal spread. Download figure Open in new tab Figure S6: Variation in song complexity metrics across individuals and years. Boxplots show individual-level variation in five song-level acoustic features: (A) Note Count, (B) Note Pace, (C) Note Types, (D) Note Richness, (E) Song Richness Index, and (F) Markov Entropy Rate. Each boxplot represents an individual aggregated across all years (2019–2023), with overlaid colored error bars indicating inter-annual variation within each individual. Asterisks above boxes denote statistical significance of individual identity in linear mixed models (p < 0.05*, ** < 0.01**, *** < 0.001***; “ns” = not significant). Download figure Open in new tab Figure S7: Principal Component Analysis (PCA) of song complexity metrics. Top panels show PCA scores (PC1 vs. PC2) for all songs, colored by individual identity and faceted by year (2019–2023), illustrating population-wide overlap and inter-annual stability in acoustic complexity. Middle panels show within-individual PCA scores for four focal males, highlighting individual-specific clustering patterns colored by year. The bottom-left panel shows the variance explained by the top five principal components, with PC1 and PC2 accounting for 49% and 33% of the total variance, respectively. The bottom-right panel shows PCA loadings, indicating that PC1 primarily reflects frequency-based traits, while PC2 captures variation in frequency and temporal spread. View this table: View inline View popup Table S1: A list of all individuals of S. albiventris banded during the study period. Band # represents the unique number on the aluminium ring (generally on the right leg), the color-band combination represents the color of rings from top to bottom (generally on the left leg) and the Individual ID represents a unique code used for individual monitoring. * represents the males that were monitored for territorial interactions and acoustic recordings. Individuals were aged based on morphology in the field and sex was determined through molecular sexing. Year of banding is the first time the individual was captured and banded. View this table: View inline View popup Download powerpoint Table S2: Per year sample size for each color-banded male recorded during the study period. Number of Songs and the total number of notes in the songs annotated per year for each individual. All the songs across individuals and years were used to examine spectro-temporal variation and song complexity. For song syntax analysis, we included individual data in a given year if we had >75 songs and the number of songs per individual per year was capped to 150. Acknowledgement We thank Harikrishnan C.P., Ashwin Warudkar, Vinay K.L., Amrutha Rajan, Archita Sharma, Naman Goyal, Anuja Kanase, and Susmit Bansode for their field and lab work assistance; Yogeshwari and Kamraj for assistance in the field. We are grateful to Ramana Athreya, Jobin Varughese, Nandini Rajamani, Michael Pitzrick, Russ Charif, Laurel Symes, Guha Dharmarajan, and Kathryn Sieving for valuable discussions and feedback on study design, analytical approaches, and broader conceptual framing. We also thank the members of the Bird Ecology Lab at the Indian Institute of Science Education and Research (IISER) Tirupati, for their thoughtful inputs. We sincerely appreciate the Tamil Nadu Forest Department and the Kodaikanal Forest Division for granting the permissions (permit no. WL5(A)/43781/2017) necessary to conduct fieldwork. We thank Kodaikanal International School (KIS) and the School’s Center for Environment and Humanity, particularly Corey Stixrud, Ashwin Fernandes, and Iti Maloney, for providing access to the KIS-IISER field station and additional logistical support. We also thank Ian Lockwood, Ramesh Daga, Billy and Arun Kolhatkar, and the Palani Hills Conservation Council for generously granting access to their lands during data collection. Funder Information Declared Government of India: Department of Science and Technology (DST) - Science and Engineering Research Board (SERB) , ECR/2016/001065 Government of India: Ministry of Environment, Forest and Climate Change (MoEFCC) , 19-22/2018/RE References ↵ Aamodt , C. M. , M. Farias-Virgens , and S. A. White . 2020 . Birdsong as a window into language origins and evolutionary neuroscience. Philosophical Transactions of the Royal Society B . ↵ Arasumani , M. , D. Khan , C. K. Vishnudas , M. Muthukumar , M. Bunyan , and V. V. Robin . 2019 . Invasion compounds an ecosystem-wide loss to afforestation in the tropical grasslands of the Shola Sky Islands . Biological Conservation 230 : 141 – 150 . OpenUrl CrossRef ↵ Araya-Salas , M. , and T. Wright . 2013 . Open-ended song learning in a hummingbird. Biology Letters . ↵ Bantock , T. M. , R. P. Prys-Jones , and P. L. M. Lee . 2008 . New and improved molecular sexing methods for museum bird specimens . Molecular ecology resources 8 : 519 – 528 . OpenUrl PubMed ↵ Beecher , M. D . 2017 . Birdsong learning as a social process . Animal Behaviour 124 : 233 – 246 . OpenUrl ↵ Berwick , R. C. , K. Okanoya , G. J. L. Beckers , and J. J. Bolhuis . 2011 . Songs to syntax: the linguistics of birdsong . Trends in cognitive sciences 15 : 113 – 121 . OpenUrl CrossRef PubMed Web of Science ↵ Brenowitz , E. A. , D. Margoliash , and K. W. Nordeen . 1997 . An introduction to birdsong and the avian song system . Journal of neurobiology 33 : 495 – 500 . OpenUrl CrossRef PubMed Web of Science ↵ Briefer , E. , T. Aubin , K. Lehongre , and F. Rybak . 2008 . How to identify dear enemies: the group signature in the complex song of the skylark Alauda arvensis . The journal of experimental biology 211 : 317 – 326 . OpenUrl Abstract / FREE Full Text ↵ Briefer , E. , F. Rybak , and T. Aubin . 2012 . MICRODIALECT AND GROUP SIGNATURE IN THE SONG OF THE SKYLARK ALAUDA ARVENSIS . Bioacoustics 219 – 233 . ↵ Bruno , J. H. , E. D. Jarvis , M. Liberman , and O. Tchernichovski . 2021 . Birdsong Learning and Culture: Analogies with Human Spoken Language . Annual Review of Linguistics 7 : 449 – 472 . OpenUrl ↵ Buskirk , W. H . 1976 . Social Systems in a Tropical Forest Avifauna . The American naturalist 110 : 293 – 310 . OpenUrl CrossRef Web of Science ↵ Camacho-Alpízar , A. , E. J. Fuchs , and G. Barrantes . 2018 . Effect of barriers and distance on song, genetic, and morphological divergence in the highland endemic Timberline Wren (Thryorchilus browni, Troglodytidae) . PloS one 13 : e0209508 . OpenUrl PubMed ↵ Catchpole , C. K . 1987 . Bird song, sexual selection and female choice . Trends in ecology & evolution 2 : 94 – 97 . OpenUrl PubMed ↵ Catchpole , C. K. , and A. Rowell . 1993 . Song Sharing and Local Dialects in a Population of the European Wren Troglodytes troglodytes . Behaviour 125 : 67 – 78 . OpenUrl CrossRef ↵ Cornez , G. , F. N. Madison , A. Van der Linden , C. Cornil , K. M. Yoder , G. F. Ball , and J. Balthazart . 2017 . Perineuronal nets and vocal plasticity in songbirds: A proposed mechanism to explain the difference between closed-ended and open-ended learning . Developmental Neurobiology 77 : 975 – 994 . OpenUrl PubMed ↵ Dhondt , A. , and M. M. Lambrechts . 1992 . Individual voice recognition in birds . Trends in ecology & evolution 7 : 178 – 179 . OpenUrl PubMed DNeasy Blood & Tissue Handbook . 2023 . ↵ Doupe , A. J. , and P. K. Kuhl . 1999 . Birdsong and human speech: common themes and mechanisms . Annual review of neuroscience 22 : 567 – 631 . OpenUrl CrossRef PubMed Web of Science ↵ Dunn , E. H. , and C. John Ralph . 2004 . The use of mist nets as a tool for bird population monitoring . Studies in Avian Biology 29 : 1 ?6. OpenUrl ↵ Faul , F. , E. Erdfelder , A. Buchner , and A.-G. Lang . 2009 . Statistical power analyses using G*Power 3.1: tests for correlation and regression analyses . Behavior research methods 41 : 1149 – 1160 . OpenUrl CrossRef PubMed Web of Science ↵ Fernandez , M. S. A. , C. Vignal , and H. A. Soula . 2017 . Impact of group size and social composition on group vocal activity and acoustic network in a social songbird . Animal behaviour 127 : 163 – 178 . OpenUrl ↵ Fishbein , A. R. , W. J. Idsardi , G. F. Ball , and R. J. Dooling . 2020 . Sound sequences in birdsong: how much do birds really care? Philosophical Transactions of the Royal Society B . ↵ Garland , E. C. , M. S. Lilley , A. W. Goldizen , M. L. Rekdahl , C. Garrigue , and M. J. Noad . 2012 . Improved versions of the Levenshtein distance method for comparing sequence information in animals’ vocalisations: tests using humpback whale song . Behaviour 149 : 1413 – 1441 . OpenUrl ↵ Goldstein , M. H. , A. P. King , and M. J. West . 2003 . Social interaction shapes babbling: Testing parallels between birdsong and speech . Proceedings of the National Academy of Sciences 100 : 8030 – 8035 . OpenUrl Abstract / FREE Full Text ↵ Graham , B. A. , D. D. Heath , and D. J. Mennill . 2017 . Dispersal influences genetic and acoustic spatial structure for both males and females in a tropical songbird . Ecology and evolution 7 : 10089 – 10102 . OpenUrl ↵ Griesser , M. , D. Wheatcroft , and T. N. Suzuki . 2018 . From bird calls to human language: exploring the evolutionary drivers of compositional syntax . Current Opinion in Behavioral Sciences 21 : 6 – 12 . OpenUrl ↵ Hastie , T. J. , and R. J. Tibshirani . 1990 . Generalized Additive Models. Chapman & Hall/CRC Monographs on Statistics and Applied Probability. Chapman & Hall/CRC, Philadelphia , PA . ↵ Hensel , A. L. J. , S. L. Dobney , S. M. Doucet , D. Ryan Norris , A. E. M. Newman , H. Williams , and D. J. Mennill . 2022 . Microgeographical variation in birdsong: Savannah sparrows exhibit microdialects in an island population . Animal behaviour 188 : 119 – 131 . OpenUrl ↵ Hughes , M. , S. Nowicki , W. A. Searcy , and S. Peters . 1998 . Song-type sharing in song sparrows: implications for repertoire function and song learning . Behavioral Ecology and Sociobiology 42 : 437 – 446 . OpenUrl CrossRef Web of Science ↵ Janik , V. M. 2014 . Cetacean vocal learning and communication . Current Opinion in Neurobiology 28 : 60 – 65 . OpenUrl CrossRef PubMed ↵ Janik , V. M. , and P. J. B. Slater . 2000 . The different roles of social learning in vocal communication . Animal Behaviour 60 : 1 – 11 . OpenUrl CrossRef PubMed Web of Science ↵ Karr , J. R. , J. D. Nichols , M. K. Klimkiewicz , and J. D. Brawn . 1990 . Survival rates of birds of tropical and temperate forests: Will the dogma survive? The American naturalist 136 : 277 – 291 . OpenUrl CrossRef Web of Science ↵ Kershenbaum , A . 2014 . Entropy rate as a measure of animal vocal complexity . Bioacoustics 23 : 195 – 208 . OpenUrl ↵ Kershenbaum , A. , D. T. Blumstein , M. A. Roch , Ç. Akçay , G. Backus , M. A. Bee , K. Bohn , et al. 2016 . Acoustic sequences in non-human animals: a tutorial review and prospectus . Biological reviews of the Cambridge Philosophical Society 91 : 13 – 52 . OpenUrl CrossRef ↵ Kershenbaum , A. , A. E. Bowles , T. M. Freeberg , D. Z. Jin , A. R. Lameira , and K. Bohn . 2014 . Animal vocal sequences: not the Markov chains we thought they were . Proceedings. Biological sciences / The Royal Society 281 . ↵ Kershenbaum , A. , and E. C. Garland . 2015 . Quantifying similarity in animal vocal sequences: which metric performs best? Methods in ecology and evolution / British Ecological Society 6 : 1452 – 1461 . OpenUrl ↵ Kindt , R. 2020 . Vegan: community ecology package. R package version 1.17-8. WORLD 11 . ↵ King , S. L. , and P. K. McGregor . 2016 . Vocal matching: the what, the why and the how . Biology Letters . K. Lisa Yang Center for Conservation Bioacoustics at the Cornell Lab of Ornithology. Raven Pro: Interactive Sound Analysis Software (Version 1.5). The Cornell Lab of Ornithology . ↵ Kroodsma , D. E. , and B. E. Byers . 1991 . The function (s) of bird song . American zoologist 31 : 318 – 328 . OpenUrl CrossRef ↵ Kuhl , P. K. 2003 . Human speech and birdsong: Communication and the social brain . Proceedings of the National Academy of Sciences 100 : 9645 – 9646 . OpenUrl FREE Full Text ↵ Laiolo , P. , and J. L. Tella . 2005 . Habitat fragmentation affects culture transmission: patterns of song matching in Dupont’s lark . Journal of Applied Ecology 42 : 1183 – 1193 . OpenUrl ↵ Laurance , W. F. , J. L. C. Camargo , R. C. C. Luizão , S. G. Laurance , S. L. Pimm , E. M. Bruna , P. C. Stouffer , et al. 2011 . The fate of Amazonian forest fragments: A 32-year investigation . Biological conservation 144 : 56 – 67 . OpenUrl CrossRef Web of Science ↵ Leitão , A. V. , R. A. Mulder , and M. L. Hall . 2022 . Song functions for joint territory defence and within-pair communication in female and male lovely fairy-wrens . Animal Behaviour 192 : 145 – 157 . OpenUrl ↵ Mariette , M. M. 2019 . Acoustic Cooperation: Acoustic Communication Regulates Conflict and Cooperation Within the Family . Frontiers in Ecology and Evolution 7 : 483074 . OpenUrl ↵ Ortiz-Ramírez , M. F. , M. J. Andersen , A. Zaldívar-Riverón , J. F. Ornelas , and A. G. Navarro-Sigüenza . 2016 . Geographic isolation drives divergence of uncorrelated genetic and song variation in the Ruddy-capped Nightingale-Thrush (Catharus frantzii; Aves: Turdidae) . Molecular phylogenetics and evolution 94 : 74 – 86 . OpenUrl PubMed ↵ Payne , R. B . 1978 . Microgeographic Variation in Songs of Splendid Sunbirds Nectarinia coccinigaster: Population Phenetics, Habitats, and Song Dialects . Behaviour 65 : 282 – 308 . OpenUrl ↵ Podos , J. , and P. S. Warren . 2007 . The Evolution of Geographic Variation in Birdsong . Pages 403 – 458 in Advances in the Study of Behavior (Vol. 37 ). Academic Press . OpenUrl ↵ Price , J. J. , and D. Yuan . 2011 . Song-type sharing and matching in a bird with very large song repertoires, the tropical mockingbird . Behaviour 148 : 673 – 689 . OpenUrl CrossRef ↵ Purushotham , C. B. , and V. V. Robin . 2016 . Sky island bird populations isolated by ancient genetic barriers are characterized by different song traits than those isolated by recent deforestation . Ecology and Evolution 6 : 7334 – 7343 . OpenUrl QGIS Association . Geographic Information System Developers Manual . QGIS.org . ↵ Renthlei , Z. , S. Yatung , R. Lalpekhlui , and A. K. Trivedi . 2022 . Seasonality in tropical birds. Journal of experimental zoology. Part A , Ecological and integrative physiology 337 : 952 – 966 . OpenUrl ↵ Riebel , K. , K. J. Odom , N. E. Langmore , and M. L. Hall . 2019 . New insights from female bird song: towards an integrated approach to studying male and female communication roles. Biology Letters . ↵ Rivera-Gutierrez , H. F. , E. Matthysen , F. Adriaensen , and H. Slabbekoorn . 2010 . Repertoire Sharing and Song Similarity between Great Tit Males Decline with Distance between Forest Fragments . Ethology 116 : 951 – 960 . OpenUrl CrossRef Web of Science ↵ Robin , V. V. , J. E. Hines , J. D. Nichols , M. Katti , and A. Sinha . 2021 . Demographic changes of a tropical understory bird in naturally patchy montane habitats in southern India . bioRxiv . ↵ Rose , E. M. , N. H. Prior , and G. F. Ball . 2022 . The singing question: re-conceptualizing birdsong . Biological Reviews 97 : 326 – 342 . OpenUrl CrossRef ↵ Samuels , B. D . 2015 . Can a bird brain do phonology? Frontiers in Psychology 6 : 156732 . OpenUrl ↵ Sánchez , N. V. , and D. J. Mennill . 2024 . Behavioural consequences of conspecific neighbours: a systematic literature review of the effects of local density on avian vocal communication . Journal of Ornithology 165 : 847 – 859 . OpenUrl ↵ Sasahara , K. , M. L. Cody , D. Cohen , and C. E. Taylor . 2012 . Structural design principles of complex bird songs: a network-based approach . PloS one 7 : e44436 . OpenUrl CrossRef PubMed ↵ Sawant , S. 2025 . birdsong-syntax. Github . ↵ Sawant , S. , C. Arvind , V. Joshi , and V. V. Robin . 2021 . Song Richness Index: A measure to understand the diversity and repetition of notes in a birdsong . bioRxiv . ↵ Sawant , S. , C. Arvind , V. Joshi , and V. V. Robin . 2022 . Spectrogram cross-correlation can be used to measure the complexity of bird vocalizations . Methods in Ecology and Evolution 13 : 459 – 472 . OpenUrl ↵ Searcy , W. A. , S. Nowicki , M. Hughes , and S. Peters . 2002 . Geographic song discrimination in relation to dispersal distances in song sparrows . The American naturalist 159 : 221 – 230 . OpenUrl CrossRef PubMed Web of Science ↵ Shanker , K. , V. V. Robin , U. Srinivasan , R. Athreya , N. Rajamani , F. Ishtiaq , U. Kodandaramiah , et al. 2023 . Why Amendments to the Wild Life Act Are Scheduled To Fail . ↵ Sidorov , G. , F. Velasquez , E. Stamatatos , A. Gelbukh , and L. Chanona-Hernández . 2014 . Syntactic N-grams as machine learning features for natural language processing . Expert Systems with Applications 41 : 853 – 860 . OpenUrl ↵ Slater , P. J. B . 1986 . The cultural transmission of bird song . Trends in Ecology & Evolution 1 : 94 – 97 . OpenUrl PubMed ↵ Smith , R. 2014 . Complexity in Animal Communication: Estimating the Size of N-Gram Structures . Entropy 16 : 526 – 542 . OpenUrl ↵ Smith-Vidaurre , G. , M. Araya-Salas , and T. F. Wright . 2020 . Individual signatures outweigh social group identity in contact calls of a communally nesting parrot . Behavioral ecology: official journal of the International Society for Behavioral Ecology 31 : 448 – 458 . OpenUrl ↵ Somervuo , P. , and A. Harma . 2004 . Bird song recognition based on syllable pair histograms. Bird song recognition based on syllable pair histograms. Presented at the 2004 IEEE International Conference on Acoustics, Speech, and Signal Processing, IEEE . ↵ Suarez Sharma , S. P. , S . L. Dobney , D. R. Norris , S. M. Doucet , A. E. M. Newman , J. B. Burant , I. G. Moran , et al. 2024 . Effects of age, breeding strategy, population density, and number of neighbors on territory size and shape in Passerculus sandwichensis (Savannah Sparrow) . Ornithology 141 :ukae025. ↵ Williams , H. 2021 . Mechanisms of Cultural Evolution in the Songs of Wild Bird Populations . Frontiers in Psychology 12 : 643343 . OpenUrl PubMed ↵ Williams , H. , and R. F. Lachlan . 2022 . Evidence for cumulative cultural evolution in bird song . Philosophical Transactions of the Royal Society B . ↵ Wright , T. F. , and C. R. Dahlin . 2017 . Vocal dialects in parrots: patterns and processes of cultural evolution . Emu - Austral Ornithology 50 – 66 . ↵ Wright , T. F. , C. R. Dahlin , and A. Salinas-Melgoza . 2008 . Stability and change in vocal dialects of the yellow-naped amazon . Animal behaviour 76 : 1017 – 1027 . OpenUrl CrossRef PubMed Web of Science ↵ Wright , T. F. , and G. S. Wilkinson . 2001 . Population genetic structure and vocal dialects in an amazon parrot. Proceedings . Biological sciences 268 : 609 – 616 . OpenUrl CrossRef PubMed Web of Science View the discussion thread. Back to top Previous Next Posted August 01, 2025. Download PDF Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Linguistic Rules of Syntax and Sharing in the Complex Songs of a Tropical Passerine Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Linguistic Rules of Syntax and Sharing in the Complex Songs of a Tropical Passerine Suyash Sawant , Chiti Arvind , Viral Joshi , Indranil Dutta , V. V. Robin bioRxiv 2025.07.31.666818; doi: https://doi.org/10.1101/2025.07.31.666818 Share This Article: Copy Citation Tools Linguistic Rules of Syntax and Sharing in the Complex Songs of a Tropical Passerine Suyash Sawant , Chiti Arvind , Viral Joshi , Indranil Dutta , V. V. Robin bioRxiv 2025.07.31.666818; doi: https://doi.org/10.1101/2025.07.31.666818 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Animal Behavior and Cognition Subject Areas All Articles Animal Behavior and Cognition (7629) Biochemistry (17660) Bioengineering (13881) Bioinformatics (41910) Biophysics (21436) Cancer Biology (18576) Cell Biology (25480) Clinical Trials (138) Developmental Biology (13368) Ecology (19887) Epidemiology (2067) Evolutionary Biology (24302) Genetics (15598) Genomics (22482) Immunology (17726) Microbiology (40360) Molecular Biology (17163) Neuroscience (88534) Paleontology (666) Pathology (2830) Pharmacology and Toxicology (4821) Physiology (7637) Plant Biology (15129) Scientific Communication and Education (2045) Synthetic Biology (4290) Systems Biology (9817) Zoology (2269)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00