Accelerando and crescendo in African penguin display songs

preprint OA: gold CC-BY-NC-ND-4.0
📄 Open PDF Full text JSON View at publisher
Full text 44,295 characters · extracted from preprint-html · click to expand
Accelerando and crescendo in African penguin display songs | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Accelerando and crescendo in African penguin display songs View ORCID Profile Taylor A. Hersh , View ORCID Profile Yannick Jadoul , View ORCID Profile Marco Gamba , View ORCID Profile Andrea Ravignani , View ORCID Profile Livio Favaro doi: https://doi.org/10.1101/2025.04.04.647185 Taylor A. Hersh 1 Comparative Bioacoustics Group, Max Planck Institute for Psycholinguistics , Nijmegen, Netherlands 2 Marine Mammal Institute, Oregon State University , Newport, Oregon, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Taylor A. Hersh For correspondence: taylor.a.hersh{at}gmail.com yannick.jadoul{at}uniroma1.it Yannick Jadoul 1 Comparative Bioacoustics Group, Max Planck Institute for Psycholinguistics , Nijmegen, Netherlands 3 Artificial Intelligence Lab, Vrije Universiteit Brussel , Brussels, Belgium 4 Department of Human Neurosciences, Sapienza University of Rome , Rome, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Yannick Jadoul For correspondence: taylor.a.hersh{at}gmail.com yannick.jadoul{at}uniroma1.it Marco Gamba 5 Department of Life Sciences and Systems Biology, University of Turin , Turin, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Marco Gamba Andrea Ravignani 1 Comparative Bioacoustics Group, Max Planck Institute for Psycholinguistics , Nijmegen, Netherlands 4 Department of Human Neurosciences, Sapienza University of Rome , Rome, Italy 6 Center for Music in the Brain, Department of Clinical Medicine, Aarhus University , Aarhus, Denmark 7 Research Center of Neuroscience “CRiN-Daniel Bovet”, Sapienza University of Rome , Rome, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Andrea Ravignani Livio Favaro 5 Department of Life Sciences and Systems Biology, University of Turin , Turin, Italy Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Livio Favaro Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract Many species produce rhythmic sound sequences. Some purportedly speed up their vocalizations throughout a display, reminiscent of—but not necessarily equivalent to— “accelerando” in human music. This phenomenon has been frequently reported but rarely quantified, which limits our ability to understand its mechanism, function, and evolution. Here, we use a suite of rhythm analyses to quantify temporal and acoustic features in the display songs of male African penguins ( Spheniscus demersus ). We show that songs get faster (i.e., accelerando) and louder (i.e., crescendo) as they progress. The accelerando occurs because the inter-syllable silences, not the syllables themselves, predictably shorten over time. This rhythmicity is maintained even when individuals take audible breaths. Individuals also show plasticity: when they start with a slow tempo, they speed up more strongly than when they start with a fast tempo. We hypothesize that this well-timed accelerando may stem from arousal-based mechanisms, biomechanical constraints, or more complex rhythmic control; future work should test the mechanisms behind this intra-individual rhythmic variation, since non-passerine birds are thought to have limited vocal plasticity. By integrating a rich empirical dataset with cutting-edge rhythm analyses, we establish the necessary foundation to determine how such features evolved and their role(s) across communication systems. 1. Introduction Theoretically, animals can time their vocalizations in an unlimited number of ways. In practice, isochrony—where the inter-onset intervals (IOIs) of vocalizations exhibit roughly equal durations—dominates across taxa. 1 – 5 Temporal variation around isochrony can be achieved by progressively lengthening (ritardando) or shortening (accelerando) IOIs in a sequence. In particular, vocal accelerando has been reported in passerine birds and mammals, and examples are often linked to agonistic interactions and high arousal situations ( Table 1 ). Rufous horneros ( Furnarius rufus ) produce “accelerated trills” when singing solos and duets, with song playing a role in territory defense and mate guarding. 6 Male thrush nightingales ( Luscinia luscinia ) may use accelerando in mating songs to evoke anticipation in listeners. 7 Both Columbian and California ground squirrels ( Urocitellus columbianus and Otospermophilus beecheyi , respectively) accelerate call production in the presence of a moving predator or intruder. 8 , 9 Yellow-bellied marmots ( Marmota flaviventris ) produce “accelerando whistles” when disturbing objects approach them; these acoustic displays often culminate in a physical attack. 10 Similarly, when flying male hammer-headed bats ( Hypsignathus monstrosus ) are approached by other males, they accelerate their call rate, orient towards the intruder, and attack if the intruder is not deterred. 11 View this table: View inline View popup Download powerpoint Table 1. Examples of mammalian (top) and avian (bottom) species with accelerando in vocal displays. Note that most reports of accelerando are anecdotal and descriptive rather than quantitative. More broadly, there is evidence that loud, accelerating calls are an ancestral call morphotype for phylogenetically new and ancient primates. 12 , 13 Accelerando is also common in human music, where it is used as a stylistic device to increase arousal, manipulate tension, and prevent habituation in listeners. 14 – 16 Coupling accelerando with other musical phenomena, such as crescendo (i.e., increasing loudness/intensity), can enhance a composition’s expressiveness. These and other descriptions of accelerating animal acoustic displays suggest that accelerando plays an important role in diverse communication systems, although that role may not necessarily be equivalent across systems. However, questions relating to the evolution, mechanism, and function of accelerando will remain intractable unless one can explicitly and systematically quantify accelerando across diverse study systems. 17 Here, we use a suite of rhythm analyses and statistical models to measure various temporal and acoustic features, including accelerando, in vocalizations produced by a non-passerine bird, the critically endangered African penguin ( Spheniscus demersus ). Compared to oscine songbirds, vocal communication is understudied in other avian taxa, especially in those assumed to have limited vocal plasticity. 18 African penguins are territorial, monogamous seabirds. They live in dense colonies where they compete for nesting space. During breeding periods, individuals produce multisyllabic “ecstatic display songs” (hereafter songs ; Figure 1 ). 19 , 20 Primarily made by males, these songs seem to play a role in nest territory defense, mate recognition, and mate attraction, but how they bolster or facilitate such displays is unknown. 19 – 22 Songs are typically composed of a sequence of short-duration “A” syllables leading up to one or more long-duration “B” syllables. 20 Both A and B syllables are egressive (i.e., produced with an outward flow of air). A third syllable type, the ingressive “C” syllable, occurs when penguins audibly inhale. C syllables can be interspersed throughout a song but do not occur in all songs. Given the differences in how and when they are produced, whether C syllables contribute to the structure and function of songs in the same way as A and B syllables is unknown. Download figure Open in new tab Figure 1. Example of accelerando and crescendo in an African penguin ecstatic display song. (A) Typical penguin stance while singing, with feet apart, beak up, and wings extended. (B) The annotated spectrogram shows the portion of a song leading up to the first B syllable (Audio S1). The accelerating sine wave (blue) captures the acceleration of the A syllables. As this song progresses, (C) successive IOIs shorten (accelerando) and (D) successive syllables get louder (crescendo). Temporal features of vocalizations often have higher transmission fidelity than spectral features in noisy environments, such as dense colonies of highly vocal individuals. 23 This could evolutionarily favor information encoding in the time domain for species like penguins and motivated our analysis of the temporal structure of African penguin songs. While spectral plasticity in African penguin vocalizations is limited, temporal plasticity is virtually unexplored. 21 Understanding song structure is thus a critical first step towards eventually unravelling the exact function of this biologically important display. Using song recordings from ex-situ individuals, we first test whether C syllables contribute to the temporal structure of songs in the same way as A syllables. Then, we investigate whether qualitative impressions of song accelerando and crescendo are quantitatively validated. We interpret our results against the broader behavioral ecology of African penguins and conclude with topics for future research. 2. Materials and Methods (a) Song recordings We analyzed 551 passively recorded songs from 26 ex-situ male African penguins (Table S1) during the 2016/2017 breeding seasons (between October 2016 and May 2017) at three Italian zoological facilities. Each male contributed at least six songs. Recordings were made when the facilities were closed to visitors, thus minimizing activity and disturbance around the exhibits. Individuals were unequivocally identified using colored flipper bands. Our dataset is a subset of a previously collected one, excluding females; data collection methods are detailed in 22 and summarized in Method S1. (b) Song feature extraction Song spectrograms were visually inspected and manually annotated in Praat 24 version 6.0.43 by two trained analysts. Each syllable’s start and end were manually demarcated and syllables were assigned to a syllable type based on spectrotemporal features, as previously described in the literature. 19 , 20 , 25 Inter-observer agreement on syllable type assignments was high (Cohen’s κ coefficient = 0.99; see 22 for details). Start time and duration were automatically extracted from the annotations with a custom Python script for each of the n syllables up to and including the first B syllable in a song. Additionally, each syllable’s intensity was calculated with the Python package Parselmouth 26 version 0.4.1 (Praat version 6.1.38) as the energy-based average of the intensity curve using default parameters after filtering out low-frequency noise using a Hann band-stop filter below 100 Hz (bandwidth 10 Hz). We then calculated the n −1 IOIs and silent interval durations between successive syllables. For each song, we calculated acceleration ratios between successive IOIs as 4 (resulting in n −2 ratios, Figure 1 ) and average acceleration ratio (excluding □ □ □ 1 ) as: A ratio greater than 0.5 corresponds to an accelerating sequence (i.e., a sequence with shortening IOIs and thus an increasing tempo), a ratio equal to 0.5 corresponds to an isochronous sequence, and a ratio less than 0.5 corresponds to a decelerating sequence. To normalize the position of syllables (or IOIs, or acceleration ratios) over songs of different lengths, we calculated their relative position within a song such that it is scaled between 0% and 100% for the first and last syllable ( for syllable i , for IOI i , for a i ). Finally, for each penguin, we grouped the IOI durations into five equally spaced bins based on their relative position (see Method S2). We then calculated the mean, standard deviation, and coefficient of variation (CV, corrected for small sample size) 27 of the IOI durations of all songs within each bin. (c) C syllable analysis Our first goal was to determine whether A and C syllables contribute equally to the acceleration of a song. This analysis assessed whether we should include C syllable onsets in IOI calculations, acceleration ratio calculations, and subsequent analyses. To address this, we calculated acceleration ratios for all pairs of successive IOIs and generated three distributions for comparison. The baseline distribution includes only acceleration ratios in parts of songs without C syllables present (i.e., between successive A-A and A-B syllable IOIs). The two alternative distributions include acceleration ratios in parts of songs with C syllables present. For these two alternative distributions, the C syllable onsets were either omitted or included in the IOI and acceleration calculations. We call these the “C-omitted distribution” and the “C-included distribution”, respectively. We then compared the alternative distributions to the baseline distribution to see which one was more similar to the baseline distribution. To do so, we calculated a kernel density estimation of the acceleration ratios in the baseline distribution and used it to calculate the likelihood of all acceleration ratios in the C-omitted and C-included distributions. We then used a Wilcoxon signed-rank test to test the difference in the median likelihood of each penguin’s acceleration ratios, omitting vs. including C syllable onsets. These tests were only done for penguins with at least three C syllables in their songs ( n =13). The baseline distribution represents the empirical distribution of measured acceleration ratios in the absence of detectable C syllables; by comparing which alternative distribution matches the baseline distribution most closely, we can quantitatively assess which of the two approaches, omitting or including C syllable onsets, can explain the observed temporal patterns in the most parsimonious way. (d) Song accelerando and crescendo analyses To determine whether songs accelerate, we ran a linear mixed-effects model (LMEM) (response variable: log-transformed IOI duration; fixed effect: relative position of IOI within song; nested random intercept: song in penguin in colony). As a linear slope in log space corresponds to an exponential curvilinear relation in the non-transformed data, the coefficient fitted by the LMEM conceptually matches the acceleration ratio between successive IOIs. For this and other LMEMs, we tested the significance of the fixed effect using a chi-square likelihood ratio test, comparing model fits with vs. without the fixed effect. Having quantitatively shown accelerando, we next ran a LMEM to determine whether acceleration is constant throughout a song (response variable: acceleration ratio; fixed effect: relative position of acceleration ratio within song; nested random intercept: song in penguin in colony). We also wanted to know how the two components of an IOI—syllable and silence— contribute to the observed acceleration. Accordingly, we ran LMEMs analogous to the previous ones, checking whether the duration of syllables and silences changes throughout songs (response variable: log-transformed syllable/silence duration; fixed effect: relative IOI position; nested random intercept: song in penguin in colony). To determine whether IOI durations become more precise as songs progress, we fitted a LMEM to test the change in IOI duration CV across songs (response variable: CV of grouped IOI durations; fixed effect: relative position of IOI bin; nested random intercept: penguin in colony). CV values were calculated for 5 disjunct bins; this approach groups values to calculate the CV summary statistic but also quantifies its evolution across songs. We also tested the decrease in CV between IOI 1 (the first IOI) and IOI n-1 (the last IOI before the B syllable) for each individual penguin using the modified signed-likelihood ratio test (SLRT) for equality of CVs, implemented in the R package cvequality . 28 , 29 Next, we ran a LMEM to test whether IOI 1 predicts average acceleration in songs (response variable: average acceleration ratio, excluding IOI 1 ; fixed effect: IOI 1 duration; nested random intercept: penguin in colony). As our random effect explicitly controls for variation across individuals (i.e., between penguins), the tested fixed effect captures within-penguin variation. Finally, we wanted to know whether songs crescendo leading up to the first B syllable. Again, we tested this with a LMEM (response variable: A syllable intensity, normalized relative to the first B syllable intensity; fixed effect: relative syllable position in the song; nested random slope: song in penguin in colony). 3. Results When C syllable onsets are included in IOI calculations, the distribution of acceleration ratios between successive IOIs (C-included distribution) clearly differs from the observed acceleration in naturally occurring sequences of A/B syllables without any Cs (baseline distribution; Figure 2A ). When C syllable onsets are omitted (i.e., not factored into IOI and acceleration ratio calculations), the resulting acceleration ratios (C-omitted distribution) match the baseline distribution significantly better. More specifically, the likelihood of the C-omitted distribution data points being drawn from the baseline distribution is significantly higher than for the points from the C-included distribution (Wilcoxon signed-rank test, n =13 penguins, T =0.0, p <0.001; Figures 2A & S1). These results indicate that the underlying assumption of the C-omitted distribution—that C syllables do not fulfil the same role as A syllables in a song’s temporal structure—is the more parsimonious explanation for the observed accelerando. Accordingly, we omitted C syllables in subsequent analyses. Download figure Open in new tab Figure 2. Quantitative analyses of accelerando and crescendo in African penguin ecstatic display songs. (A) Omitting C syllable onsets results in a distribution of acceleration ratios (purple) closely matching the baseline distribution (brown curve) of acceleration ratios between two successiv egressive (A/B) syllable IOIs (top); including C syllable onsets (teal) does not (bottom). This suggests that C syllables do not contribute to the temporal structure of songs in the same way a A syllables. (B) Within a song, IOI duration is significantly predicted by its relative position. The background lines show the individual songs; the bold lines show the fitted LMEM’s effect for each penguin (excluding the nested random effect per song). (C) Across penguins, the coefficient of variation of IOI duration significantly decreases as songs progress. The vertical lines represent the boundaries between bins (see Method S2). (D) Controlling for individuals, a LMEM show that IOI 1 significantly predicts a song’s subsequent acceleration. (E) Songs also show crescendo: later syllables are louder than earlier syllables. Bold lines again show the LMEM fit for each penguin. In panels B–E, colors denote different penguins (see bottom left legend; alphanumeric codes from 22 ) and shades correspond to the three colonies. Next, our analyses show that African penguin songs exhibit robust accelerando. Across penguins, an IOI’s position in a song is significantly negatively correlated with its duration, such that later IOIs have shorter durations (chi-square test, n =2834 syllables, χ 2 (1)=2425.2, p <0.001; Figure 2B ). Per-penguin linear regressions confirm these results: IOIs shorten as songs progress for all 26 penguins (Figure S2). Song acceleration is above 0.5 but not constant, with smaller acceleration ratios at the end of songs compared to the start (chi-square test, n =2253 syllables, χ 2 (1)=65.861, p <0.001; Figure S3). In general, penguins do not sing one stereotyped song, instead showing within-individual plasticity in the number of A syllables, number of C syllables, and mean acceleration ratio per song (Figure S4). Our duration analyses show that shortening silences, not A syllables, cause the observed acceleration. IOI position is negatively correlated with silence duration, with IOIs becoming ∼25% shorter and inter-syllable silences decreasing by almost 45% as songs progress (chi-square test, n =2834 syllables, χ 2 (1)=3211.3, p <0.001; Figure S5). In contrast, IOI position is positively correlated with A syllable duration: A syllables that occur later in songs are ∼20% longer than A syllables that occur earlier in songs (chi-square test, n =2834 syllables, χ 2 (1)=632.55, p <0.001; Figure S5). Across songs, the IOI durations become significantly less variable throughout songs (chi-square test, n =130 CV measurements, χ 2 (1)=56.739, p <0.001; Figure 2C ). In other words, songs gradually get more precise towards the end than at the start. Per individual, 13/26 penguins show a significant decrease in CV when comparing IOI 1 to IOI n-1 (Figure S6). Moreover, the duration of IOI 1 predicts the average acceleration ratio leading up to the first B syllable: a longer IOI 1 is correlated with a larger acceleration ( Figure 2D ; chi-square test, n =465 songs, χ 2 (1) =47.102, p <0.001). Again, per-penguin linear regressions broadly confirm these results (Figure S7). Figure S8 illustrates this correlation for one penguin, showing the acceleration for ten songs that vary in the length of IOI 1 . Finally, the intensity of A syllables significantly increases with relative syllable position, showing that songs crescendo leading up to the first B syllable, which is typically the most intense syllable in a song (chi-square test, n =3357 A and B syllables, χ 2 (1) =7.571, p <0.01; Figure 2E ). Per-penguin linear regressions confirm this result, with significant positive slopes for all 26 penguins (Figure S9). 4. Discussion The animal communication literature contains many descriptions of accelerating vocal signals ( Table 1 ), but few studies explicitly quantify accelerando. Our analyses show that male African penguin songs get faster and louder as they progress. They are also more precise (regarding IOI duration) at the end compared to at the start. The accelerando occurs because males shorten the silences between A syllables as they sing and is made more impressive by the fact that the A syllables themselves become longer throughout a song. While the accelerando itself is not perfectly constant, songs consistently accelerate rather than become isochronous or slow down. The crescendo occurs because males produce increasingly intense A syllables, culminating in a very long and intense B syllable. Past work shows that C syllables differ from A syllables in how they are produced and how consistently they occur in song. 20 Our results extend that work, suggesting that C syllables do not contribute to song accelerando in the same way as A syllables. Whether these two syllable types are also functionally different is an open question; playback experiments that evaluate receiver response to songs where A and C syllables are added or removed are needed to conclusively test this. Regardless, our results suggest that C syllables should be omitted from African penguin song analyses specifically focused on temporal structure. The duration of the first IOI predicts subsequent acceleration in a song. In other words, natural variation in IOI 1 is accounted for by a correspondingly more or less strong acceleration ratio throughout a song. This is not explained by individual penguins filling specific acceleration “niches” (for example, one penguin always accelerates slowly while another penguin always accelerates quickly), as evidenced by penguins overlapping in their song parameter distributions. Coupled with the increasing precision of IOIs as the song progresses, these results suggest that individual penguins show some degree of vocal plasticity in the temporal domain. Which mechanisms can explain the predictable accelerando and crescendo we observe in African penguin songs? Arousal is one possibility, but the proximal mechanisms linking arousal to changes in call speed or intensity are often difficult to determine. 30 They can include: increased muscle tone that alters the resonant properties of the underlying vocal production anatomy; an increased neural duty signal through the vocal motor regions in the brain; or an increase in the rate of other linked physiological processes, such as heart rate. 31 – 33 From a biomechanical perspective, the patterns we observe match what we would expect if penguins are physically preparing to produce the intense, long B syllable when singing. For example, if a certain air pressure level or volume in the lungs must be reached before a B syllable can be produced, then penguins may incrementally work towards that threshold, gradually adding air to their lungs and increasing tension in their syrinx membranes leading up to producing the B syllable. This scenario could explain the patterns we see in C syllable production and A syllable crescendo. Alternatively, African penguins may aim for a rhythmic “target” when singing, e.g., a specific tempo, and compensate for any natural variation in IOI 1 by accelerating more or less strongly. Under this scenario, our finding that C syllables do not contribute to temporal song structure in the same way as A syllables could indicate that penguins time their breaths in such a way as not to delay the onset of the next A syllable and thus interrupt the rhythmicity/acceleration of their song. This could be analogous to human wind instrument musicians, who are taught to breathe during rests (i.e., non-note moments) in a musical performance. If penguins instead breathed randomly without compensating for the breath duration, some of their breaths would overlap with or A delay syllables, altering the temporal structure of the vocal display. To tease apart these alternative hypotheses, future work should collect physiological and anatomical data from singers in parallel with song measurements to look for correlations between singer body condition/quality and spectrotemporal song features. This would enable testing whether arousal is responsible for the observed accelerando and crescendo in African penguin songs. Playback experiments that manipulate different song features and measure conspecific responses will shed light on which features are salient and which individuals are the intended signal receiver(s). Coupling such experiments with real-time physiological monitoring (e.g., heart rate) 34 of nearby penguins will help determine whether song accelerando and crescendo influence arousal, tension, and/or habituation in listeners, as they do in human music. 14 , 16 Our work adds African penguins to a growing list of animal species that produce accelerating vocal displays and takes a step forward by explicitly quantifying, rather than describing, this acoustic phenomenon. Our approach can help researchers conduct similar quantitative analyses for other species’ vocal displays. By systematically quantifying accelerando—a fundamental feature of rhythmic communication—and crescendo in animal vocalizations, we can establish the necessary foundation to determine how such features evolved and understand their role(s) across communication systems. Ethics Under Italian law, no specific permissions were required for collecting non-invasive passive acoustic recordings of ex-situ penguins. Data accessibility The dataset supporting the conclusions of this manuscript is available in a dedicated Open Science Framework repository ( https://osf.io/4dfxz/?view_only=979c3a6ae90942beb74269856b9504de ). Authors’ contributions All authors were involved in conceptualization; TAH, YJ, and AR developed the methodology; YJ created the Python scripts for the acoustic and statistical analyses; TAH and YJ analyzed the data and prepared the visualizations; MG, AR, and LF supervised the research; LF provided project resources; AR and LF acquired funding; TAH and YJ wrote the original draft; all authors reviewed and edited the final draft. Competing interests We have no competing interests to declare. Funding TAH, YJ, and AR were supported by Max Planck Group Leader funding to AR. TAH was also supported by the Oregon Gray Whale License Plate Program at the Marine Mammal Institute and a L’Oréal USA For Women in Science Fellowship. The Center for Music in the Brain is funded by the Danish National Research Foundation (DNRF117). YJ and AR are funded by the European Union (ERC, TOHR, 101041885) and are also supported by the Human Frontier Science Program research grant RGP0019/2022 ( https://doi.org/10.52044/HFSP.RGP00192022.pc.gr.153618 ). Acknowledgements We thank Giardino Zoologico di Pistoia, Zoomarine Roma, and Zoom Torino for facilitating research and providing access to penguin colonies; Stephanie King, Elias Fernández Domingos, Christian Herbst, Scott McCain, and two reviewers for helpful feedback; Eleonora Cresta and Elena Fumagalli for annotating recordings; and Francesca Terranova for checking text grids. Footnotes ↵ # Joint senior authors https://osf.io/4dfxz/?view_only=979c3a6ae90942beb74269856b9504de References 1. ↵ Ravignani A. & G. Madison . 2017 . The paradox of isochrony in the evolution of human rhythm . Frontiers in Psychology 8 : 1820 . doi: 10.3389/fpsyg.2017.01820 OpenUrl CrossRef PubMed 2. Raimondi T. , G. Di Panfilo , M. Pasquali , et al. 2023 . Isochrony and rhythmic interaction in ape duetting . Proceedings of the Royal Society B 290 : 20222244 . doi: 10.1098/rspb.2022.2244 OpenUrl CrossRef PubMed 3. De Gregorio C. , D. Valente , T. Raimondi , et al. 2021 . Categorical rhythms in a singing primate . Current Biology 31 : R1379 – R1380 . doi: 10.1016/j.cub.2021.09.032 OpenUrl CrossRef PubMed 4. ↵ Roeske T.C. , O. Tchernichovski , D. Poeppel , et al. 2020 . Categorical rhythms are shared between songbirds and humans . Current Biology 30 : 3544 – 3555 . doi: 10.1016/j.cub.2020.06.072 OpenUrl CrossRef PubMed 5. ↵ Burchardt L.S. , P. Norton , O. Behr , et al. 2019 . General isochronous rhythm in echolocation calls and social vocalizations of the bat Saccopteryx bilineata . Royal Society Open Science 6 : 181076 . doi: 10.1098/rsos.181076 OpenUrl CrossRef PubMed 6. ↵ Diniz P. , E.F. da Silva , M.S. Webster , et al. 2018 . Duetting behavior in a Neotropical ovenbird: Sexual and seasonal variation and adaptive signaling functions . Journal of Avian Biology 49 : jav – 01637 . doi: 10.1111/jav.01637 OpenUrl CrossRef 7. ↵ Rothenberg D. , T.C. Roeske , H.U. Voss , et al. 2014 . Investigation of musicality in birdsong . Hearing Research 308 : 71 – 83 . doi: 10.1016/j.heares.2013.08.016 OpenUrl CrossRef PubMed 8. ↵ Harris M.A. , J.O. Murie & J.A. Duncan . 1983 . Responses of Columbian ground squirrels to playback of recorded calls . Zeitschrift für Tierpsychologie 63 : 318 – 330 . doi: 10.1111/j.1439-0310.1983.tb00747.x OpenUrl CrossRef 9. ↵ Owings D.H. & R.A. Virginia . 1978 . Alarm calls of California ground squirrels (Spermophilus beecheyi) . Zeitschrift für Tierpsychologie 46 : 58 – 70 . doi: 10.1111/j.1439-0310.1978.tb01438.x OpenUrl CrossRef 10. ↵ Waring G.H. 1966 . Sounds and communications of the yellow-bellied marmot (Marmota flaviventris) . Animal Behaviour 14 : 177 – 183 . doi: 10.1016/S0003-3472(66)80028-3 OpenUrl CrossRef PubMed Web of Science 11. ↵ Bradbury J.W. 1977 . Lek mating behavior in the hammer_Jheaded bat . Zeitschrift für Tierpsychologie 45 : 225 – 255 . doi: 10.1111/j.1439-0310.1977.tb02120.x OpenUrl CrossRef 12. ↵ Geissmann T. 1993 . Evolution of communication in gibbons (Hylobatidae) . . 13. ↵ Schruth D.M. , C.N. Templeton & D.J. Holman . 2021 . On reappearance and complexity in musical calling . PLoS One 16 : e0218006 . doi: 10.1371/journal.pone.0218006 OpenUrl CrossRef 14. ↵ Schulze H.-H. , A. Cordes & D. Vorberg . 2005 . Keeping synchrony while tempo changes: Accelerando and ritardando . Music Perception 22 : 461 – 477 . doi: 10.1525/mp.2005.22.3.461 OpenUrl Abstract / FREE Full Text 15. Weissman Y.A. , V. Demartsev , A. Ilany , et al. 2020 . A crescendo in the inner structure of snorts: A reflection of increasing arousal in rock hyrax songs? Animal Behaviour 166 : 163 – 170 . doi: 10.1016/j.anbehav.2020.06.010 OpenUrl CrossRef 16. ↵ Fitch W.T. 2013 . Rhythmic cognition in humans and animals: Distinguishing meter and pulse perception . Frontiers in Systems Neuroscience 7 : 1 – 16 . doi: 10.3389/fnsys.2013.00068 OpenUrl CrossRef 17. ↵ Hersh T.A. , A. Ravignani & L.S. Burchardt . 2023 . Robust rhythm reporting will advance ecological and evolutionary research . Methods in Ecology and Evolution 14 : 1398 – 1407 . doi: 10.1111/2041-210X.14118 OpenUrl CrossRef 18. ↵ Ten Cate C. 2021 . Re-evaluating vocal production learning in non-oscine birds . Philosophical Transactions of the Royal Society B 376 : 20200249 . doi: 10.1098/rstb.2020.0249 OpenUrl CrossRef PubMed 19. ↵ Calcari C. , C. Pilenga , L. Baciadonna , et al. 2021 . Long-term stability of vocal individuality cues in a territorial and monogamous seabird . Animal Cognition 24 : 1165 – 1169 . doi: 10.1007/s10071-021-01518-z OpenUrl CrossRef PubMed 20. ↵ Favaro L. , L. Ozella & D. Pessani . 2014 . The vocal repertoire of the African penguin (Spheniscus demersus): Structure and function of calls . PLoS One 9 : e103460 . doi: 10.1371/journal.pone.0103460 OpenUrl CrossRef PubMed 21. ↵ Baciadonna L. , C. Solvi , F. Del Vecchio , et al. 2022 . Vocal accommodation in penguins (Spheniscus demersus) as a result of social environment . Proceedings of the Royal Society B 289 : 20220626 . doi: 10.1098/rspb.2022.0626 OpenUrl CrossRef PubMed 22. ↵ Favaro L. , M. Gamba , E. Cresta , et al. 2020 . Do penguins’ vocal sequences conform to linguistic laws? Biology Letters 16 : 20190589 . doi: 10.1098/rsbl.2019.0589 OpenUrl CrossRef 23. ↵ Kershenbaum A. , D.T. Blumstein , M.A. Roch , et al. 2016 . Acoustic sequences in non-human animals: A tutorial review and prospectus . Biological Reviews 91 : 13 – 52 . doi: 10.1111/brv.12160 OpenUrl CrossRef 24. ↵ Boersma P. 2001 . Praat, a system for doing phonetics by computer . Glot International 5 : 341 – 345 . OpenUrl CrossRef 25. ↵ Jouventin P. 1982 . Visual and vocal signals in penguins, their evolution and adaptive characters . Fortschritte der Verhaltensforschung 24 :. 26. ↵ Jadoul Y. , B. Thompson & B. de Boer . 2017 . Introducing Parselmouth: A Python interface to Praat . Journal of Phonetics 71 : 1 – 15 . doi: 10.1016/j.wocn.2018.07.001 OpenUrl CrossRef 27. ↵ Plavcan J.M. & D.A. Cope . 2001 . Metric variation and species recognition in the fossil record . Evolutionary Anthropology 10 : 204 – 222 . doi: 10.1002/evan.20001 OpenUrl CrossRef 28. ↵ Marwick B. & K. Krishnamoorthy . 2019 . cvequality: Tests for the equality of coefficients of variation from multiple groups . R software package version 0.1.3 . . 29. ↵ Krishnamoorthy K. & M. Lee . 2014 . Improved tests for the equality of normal coefficients of variation . Computational Statistics 29 : 215 – 232 . doi: 10.1007/s00180-013-0445-2 OpenUrl CrossRef 30. ↵ Seyfarth R.M. & D.L. Cheney . 2003 . Signalers and receivers in animal communication . Annual Review of Psychology 54 : 145 – 173 . doi: 10.1146/annurev.psych.54.101601.145121 OpenUrl CrossRef PubMed Web of Science 31. ↵ Briefer E.F. 2012 . Vocal expression of emotions in mammals: Mechanisms of production and evidence . Journal of Zoology 288 : 1 – 20 . doi: 10.1111/j.1469-7998.2012.00920.x OpenUrl CrossRef Web of Science 32. Zhang Y.S. , J.L. Alvarez & A.A. Ghazanfar . 2022 . Arousal elevation drives the development of oscillatory vocal output . Journal of Neurophysiology 127 : 1519 – 1531 . doi: 10.1152/jn.00007.2022 OpenUrl CrossRef PubMed 33. ↵ Borjon J.I. , D.Y. Takahashi , D.C. Cervantes , et al. 2016 . Arousal dynamics drive vocal production in marmoset monkeys . Journal of Neurophysiology 116 : 753 – 764 . doi: 10.1152/jn.00136.2016 OpenUrl CrossRef PubMed 34. ↵ Schaefer R. & D. Colombelli_JNégrel . 2021 . Behavioural and heart rate responses to stressors in two populations of little penguins that differ in levels of human disturbance and predation risk . Ibis 163 : 858 – 874 . doi: 10.1111/ibi.12925 OpenUrl CrossRef 35. Crockford C. , I. Herbinger , L. Vigilant , et al. 2004 . Wild chimpanzees produce group-specific calls: A case for vocal learning? Ethology 110 : 221 – 243 . doi: 10.1111/j.1439-0310.2004.00968.x OpenUrl CrossRef Web of Science 36. Wallin N.L. , Merker B. , & Brown S. Geissmann T. 2000 . Gibbon songs and human music from an evolutionary perspective . In The Origins of Music Wallin N.L. , Merker B. , & Brown S. , Eds. 103 – 123 . Cambridge, Massachusetts : The MIT Press . 37. Marshall Jr J.T. & E.R. Marshall . 1976 . Gibbons and their territorial songs . Science 193 : 235 – 237 . doi: 10.1126/science.193.4249.235 OpenUrl Abstract / FREE Full Text 38. Mitani J.C. 1988 . Male gibbon (Hylobates agilis) singing behavior: Natural history, song variations and function . Ethology 79 : 177 – 194 . doi: 10.1111/j.1439-0310.1988.tb00710.x OpenUrl CrossRef 39. Perlman M. & R. Salmi . 2017 . Gorillas may use their laryngeal air sacs for whinny-type vocalizations and male display . Journal of Language Evolution 2 : 126 – 140 . doi: 10.1093/jole/lzx012 OpenUrl CrossRef 40. Kaplan G. 2009 . Animals and music: Between cultural definitions and sensory evidence . Sign Systems Studies 37 : 423 – 453 . OpenUrl CrossRef 41. Taylor H. & D. Lestel . 2011 . The Australian pied butcherbird and the natureculture continuum . Journal of Interdisciplinary Music Studies 5 : 57 – 83 . doi: 10.4407/jims.2011.07.004 OpenUrl CrossRef 42. Baptista L.F. & R.A. Keister . 2005 . Why birdsong is sometimes like music . Perspectives in Biology and Medicine 48 : 426 – 443 . doi: 10.1353/pbm.2005.0066 OpenUrl CrossRef PubMed Web of Science 43. Bilger H.T. , E. Vertosick , A. Vickers , et al. 2021 . Higher-order musical temporal structure in bird song . Frontiers in Psychology 12 : 1 – 11 . doi: 10.3389/fpsyg.2021.629456 OpenUrl CrossRef 44. Hartshorne C. 1973 . Born to sing: An interpretation and world survey of bird song . The Wilson Bulletin 85 : 517 – 519 . OpenUrl 45. Olds W.B. 1922 . Bird-music . The Musical Quarterly 8 : 242 – 255 . OpenUrl 46. Searcy W.A. , P. Marler & S.S. Peters . 1981 . Species song discrimination in adult female song and swamp sparrows . Animal Behaviour 29 : 997 – 1003 . doi: 10.1016/S0003-3472(81)80053-X OpenUrl CrossRef 47. Roeske T.C. , D. Kelty-Stephen & S. Wallot . 2018 . Multifractal analysis reveals music-like dynamic structure in songbird rhythms . Scientific Reports 8 : 1 – 15 . doi: 10.1038/s41598-018-22933-2 OpenUrl CrossRef PubMed 48. Treutler W.J. 1898 . Music in relation to man and animals . Proceedings of the Musical Association 25 : 71 – 91 . doi: 10.1093/jrma/25.1.71 OpenUrl CrossRef View the discussion thread. Back to top Previous Next Posted April 05, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Accelerando and crescendo in African penguin display songs Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Accelerando and crescendo in African penguin display songs Taylor A. Hersh , Yannick Jadoul , Marco Gamba , Andrea Ravignani , Livio Favaro bioRxiv 2025.04.04.647185; doi: https://doi.org/10.1101/2025.04.04.647185 Share This Article: Copy Citation Tools Accelerando and crescendo in African penguin display songs Taylor A. Hersh , Yannick Jadoul , Marco Gamba , Andrea Ravignani , Livio Favaro bioRxiv 2025.04.04.647185; doi: https://doi.org/10.1101/2025.04.04.647185 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Animal Behavior and Cognition Subject Areas All Articles Animal Behavior and Cognition (7622) Biochemistry (17648) Bioengineering (13868) Bioinformatics (41876) Biophysics (21422) Cancer Biology (18552) Cell Biology (25458) Clinical Trials (138) Developmental Biology (13364) Ecology (19866) Epidemiology (2067) Evolutionary Biology (24290) Genetics (15589) Genomics (22475) Immunology (17711) Microbiology (40325) Molecular Biology (17144) Neuroscience (88469) Paleontology (666) Pathology (2826) Pharmacology and Toxicology (4815) Physiology (7635) Plant Biology (15113) Scientific Communication and Education (2044) Synthetic Biology (4286) Systems Biology (9814) Zoology (2268)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall
last seen: 2026-05-21T05:10:58.409756+00:00
License: CC-BY-NC-ND-4.0