<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article
  PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD with MathML3 v1.2 20190208//EN" "JATS-journalpublishing1-mathml3.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" article-type="research-article" dtd-version="1.2" xml:lang="en">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">JBDGM</journal-id>
<journal-id journal-id-type="nlm-ta">Jahrb Musikpsychol</journal-id>
<journal-title-group>
<journal-title>Jahrbuch Musikpsychologie</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Jahrb. Musikpsychol.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2569-5665</issn>
<publisher><publisher-name>PsychOpen</publisher-name></publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">jbdgm.205</article-id>
<article-id pub-id-type="doi">10.5964/jbdgm.205</article-id>
<article-categories>
<subj-group subj-group-type="heading"><subject>Research Reports</subject></subj-group>

<subj-group subj-group-type="badge">
<subject>Data</subject>
<subject>Code</subject>
<subject>Materials</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>The Acquisition of Tonal Hierarchies in Western Music During School Years: A Re-Analysis of 40 Years of Research</article-title>
<trans-title-group xml:lang="de">
<trans-title>Der Erwerb tonaler Hierarchien in westlicher Musik während der Schulzeit: Eine Re-Analyse der Ergebnisse aus 40 Jahren Forschung</trans-title>
</trans-title-group>
<alt-title alt-title-type="right-running">Development of Tonal Hierarchy: 40 Years of Research</alt-title>
<alt-title specific-use="APA-reference-style" xml:lang="en">The acquisition of tonal hierarchies in western music during school years: A re-analysis of 40 years of research</alt-title>
</title-group>
<contrib-group>
	
<contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid" authenticated="false">https://orcid.org/0000-0003-2917-3362</contrib-id><name name-style="western"><surname>Mütze</surname><given-names>Hanna</given-names></name><xref ref-type="corresp" rid="cor1">*</xref><xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
	<role vocab="credit" vocab-identifier="http://credit.niso.org/"
		vocab-term="Conceptualization"
		vocab-term-identifier="http://credit.niso.org/contributor-roles/conceptualization/"
		>Conceptualization</role>
	<role vocab="credit" vocab-identifier="http://credit.niso.org/"
		vocab-term="Methodology"
		vocab-term-identifier="http://credit.niso.org/contributor-roles/methodology/"
		>Methodology</role>
	<role vocab="credit" vocab-identifier="http://credit.niso.org/"
		vocab-term="Investigation"
		vocab-term-identifier="http://credit.niso.org/contributor-roles/investigation/"
		>Investigation</role>
	<role vocab="credit" vocab-identifier="http://credit.niso.org/"
		vocab-term="Data curation"
		vocab-term-identifier="http://credit.niso.org/contributor-roles/data-curation/"
		>Data curation</role>
	<role
		vocab="credit"
		vocab-identifier="http://credit.niso.org/"
		vocab-term="Formal Analysis"
		vocab-term-identifier="http://credit.niso.org/contributor-roles/formal-analysis/"
		>Formal analysis</role>
	<role
		vocab="credit"
		vocab-identifier="http://credit.niso.org/"
		vocab-term="Visualization"
		vocab-term-identifier="http://credit.niso.org/contributor-roles/visualization/"
		>Visualization</role>
	<role
		vocab="credit"
		vocab-identifier="http://credit.niso.org/"
		vocab-term="Writing – original draft"
		vocab-term-identifier="http://credit.niso.org/contributor-roles/writing-original-draft/"
		>Writing – original draft</role>
</contrib>
	
	
	
<contrib contrib-type="author"><contrib-id contrib-id-type="orcid" authenticated="false">https://orcid.org/0000-0002-9758-9434</contrib-id><name name-style="western"><surname>Platz</surname><given-names>Friedrich</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
	<role vocab="credit" vocab-identifier="http://credit.niso.org/"
		vocab-term="Conceptualization"
		vocab-term-identifier="http://credit.niso.org/contributor-roles/conceptualization/"
		>Conceptualization</role>
	<role
		vocab="credit"
		vocab-identifier="http://credit.niso.org/"
		vocab-term="Supervision"
		vocab-term-identifier="http://credit.niso.org/contributor-roles/supervision/"
		>Supervision</role>
	<role
		vocab="credit"
		vocab-identifier="http://credit.niso.org/"
		vocab-term="Validation"
		vocab-term-identifier="http://credit.niso.org/contributor-roles/validation/"
		>Validation</role>
	<role
		vocab="credit"
		vocab-identifier="http://credit.niso.org/"
		vocab-term="Writing – review &amp; editing"
		vocab-term-identifier="http://credit.niso.org/contributor-roles/writing-review-editing/"
		>Writing – review &amp; editing</role>
</contrib>
	
	
	
<contrib contrib-type="author"><contrib-id contrib-id-type="orcid" authenticated="false">https://orcid.org/0000-0003-3520-4698</contrib-id><name name-style="western"><surname>Busch</surname><given-names>Veronika</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
	<role vocab="credit" vocab-identifier="http://credit.niso.org/"
		vocab-term="Conceptualization"
		vocab-term-identifier="http://credit.niso.org/contributor-roles/conceptualization/"
		>Conceptualization</role>
	<role
		vocab="credit"
		vocab-identifier="http://credit.niso.org/"
		vocab-term="Supervision"
		vocab-term-identifier="http://credit.niso.org/contributor-roles/supervision/"
		>Supervision</role>
	<role
		vocab="credit"
		vocab-identifier="http://credit.niso.org/"
		vocab-term="Validation"
		vocab-term-identifier="http://credit.niso.org/contributor-roles/validation/"
		>Validation</role>
	<role
		vocab="credit"
		vocab-identifier="http://credit.niso.org/"
		vocab-term="Writing – review &amp; editing"
		vocab-term-identifier="http://credit.niso.org/contributor-roles/writing-review-editing/"
		>Writing – review &amp; editing</role>
	<role
		vocab="credit"
		vocab-identifier="http://credit.niso.org/"
		vocab-term="Project administration"
		vocab-term-identifier="http://credit.niso.org/contributor-roles/project-administration/"
		>Project administration</role>
</contrib>
	


	<contrib contrib-type="reviewer"><name name-style="western"><surname>Kopiez</surname><given-names>Reinhard</given-names></name></contrib>
	
	<contrib contrib-type="reviewer"><name name-style="western"><surname>Frieler</surname><given-names>Klaus</given-names></name></contrib>
	
	<contrib contrib-type="reviewer"><name name-style="western"><surname>Schäfer</surname><given-names>Thomas</given-names></name></contrib>
	

<aff id="aff1"><label>1</label><institution content-type="dept">Department of Musicology and Music Education</institution>, <institution>University of Bremen</institution>, <addr-line><city>Bremen</city></addr-line>, <country country="DE">Germany</country></aff>
<aff id="aff2"><label>2</label><institution>Institut für Ästhetisch-Kulturelle Wissenschaft und Praxis, Europa-Universität Flensburg, Flensburg</institution>, <country country="DE">Germany</country></aff>
</contrib-group>
<author-notes>
<corresp id="cor1"><label>*</label>Department of Musicology and Music Education, University of Bremen, Bibliothekstraße 1, 28359 Bremen, Germany. <email xlink:href="muetzeh@uni-bremen.de">muetzeh@uni-bremen.de</email></corresp>
</author-notes>
<pub-date date-type="pub" publication-format="electronic"><day>12</day><month>11</month><year>2025</year></pub-date>
	<pub-date pub-type="collection" publication-format="electronic"><year>2025</year></pub-date>
<volume>33</volume><elocation-id>e205</elocation-id>
<history>
<date date-type="received">
<day>26</day>
<month>08</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>22</day>
<month>09</month>
<year>2025</year>
</date>
</history>
<permissions><copyright-year>2025</copyright-year><copyright-holder>Mütze, Platz, &amp; Busch</copyright-holder><license license-type="open-access" specific-use="CC BY 4.0" xlink:href="https://creativecommons.org/licenses/by/4.0/"><ali:license_ref>https://creativecommons.org/licenses/by/4.0/</ali:license_ref><license-p>This is an open-access article distributed under the terms of the Creative Commons Attribution (CC BY) 4.0 License, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p></license></permissions>
<abstract>
<p>Understanding the relationships between different pitches as a form of tonality is a key element of listening skills in Western tonal music. Tonal hierarchies (i.e., genre-dependent differing prominence of tones) are reflected in the internal representations of tonal hierarchies (IRTH) in long-term memory. Over the past 40 years, research on how individuals—primarily students aged 6 to 15, as well as adults—acquire IRTH has yielded varied and sometimes contradictory conclusions about the timeline and underlying mechanisms of this process. This review aims to synthesize the evidence and critically examine potential reasons for the heterogeneity in prior findings. To this end, two approaches were applied. First, a Bayesian three-level meta-analysis of 60 effect sizes from 16 studies, reported in 13 articles, revealed a medium difference in IRTH sensitivity between younger and older participants. Second, a model comparison analysis based on cross-sectional data from a single study revealed a non-linear growth dynamic, with a larger increase during adolescence as the best model solution to describe the relationship between sensitivity and age. We also examined the considerable heterogeneity observed within and between studies, particularly how task-specific features of the operationalizations might account for these differences. These findings contribute to the development of theoretical models of music-related skill acquisition and suggest directions for future research.</p>
</abstract><trans-abstract xml:lang="de">
<p>Das Verständnis der Beziehungen zwischen verschiedenen Tonhöhen als eine Form der Tonalität ist ein zentraler Bestandteil der Hörfähigkeit in westlich-tonaler Musik. Tonale Hierarchien (d. h. die genreabhängig unterschiedliche Prominenz von Tönen) spiegeln sich in internen Repräsentationen tonaler Hierarchien (IRTH) im Langzeitgedächtnis wider. In den vergangenen 40 Jahren hat die Forschung darüber, wie Teilnehmende – hauptsächlich Schulkinder im Alter von 6 bis 15 Jahren, aber auch Erwachsene – IRTH erwerben, unterschiedliche und mitunter widersprüchliche Schlussfolgerungen hinsichtlich des zeitlichen Ablaufs und der zugrunde liegenden Mechanismen hervorgebracht. In diesem Beitrag sollen die Erkenntnisse zusammengefasst und mögliche Gründe für die Heterogenität der Ergebnisse kritisch untersucht werden. Zu diesem Zweck wurden zwei Ansätze angewandt. Erstens ergab eine Bayesianische Meta-Analyse von 60 Effektgrößen aus 16 Studien, die in 13 Artikeln berichtet wurden, einen Medianunterschied der IRTH-Empfindlichkeit zwischen jüngeren und älteren Kindern im Umfang einer mittleren Effektgröße. Zweitens zeigte eine Modellvergleichsanalyse auf der Grundlage von Querschnittsdaten aus einer einzigen Studie eine nichtlineare Wachstumsdynamik mit einem größeren Anstieg während der Adoleszenz und nicht im Kindes-/Grundschulalter als beste Modelllösung zur Beschreibung der Beziehung zwischen Sensibilität und Alter. Eine Heterogenitätsanalyse zeigte abschließend, dass sich die Verteilung der Effektstärken früherer Studien maßgeblich auf aufgabenspezifische Merkmale im Zuge der Operationalisierungen der Repräsentation tonaler Hierarchien zurückführen und erklären lassen. Diese Ergebnisse tragen zur Entwicklung theoretischer Modelle über den Erwerb musikbezogener Fertigkeiten bei und eröffnen Perspektiven für zukünftige Forschungen.</p></trans-abstract>
<kwd-group kwd-group-type="author"><kwd>tonal development</kwd><kwd>probe tone</kwd><kwd>Bayesian meta-analysis</kwd><kwd>musical skill acquisition</kwd></kwd-group>
<kwd-group kwd-group-type="translator" xml:lang="de"><kwd>tonale Entwicklung</kwd><kwd>Prüftonverfahren</kwd><kwd>bayessche Metaanalyse</kwd><kwd>musikalischer Fertigkeitserwerb</kwd></kwd-group>
</article-meta>
</front>
<body>
	<sec sec-type="intro"><title/>
<p>Tonality is reflected by the variations in prominence given to tones on a scale (<xref ref-type="bibr" rid="r68">Piston, 1978</xref>; <xref ref-type="bibr" rid="r94">von Helmholtz, 1896</xref>) because of differences in their frequency of occurrence, metrical position, and duration (<xref ref-type="bibr" rid="r71">Prince &amp; Schmuckler, 2014</xref>; <xref ref-type="bibr" rid="r91">Verosky, 2021</xref>). Most Western music considers the concept of tonality as:</p>
<disp-quote>
<p>…one of the main conceptual categories of Western musical thought, [referring] to the orientation of melodies and harmonies towards a referential (or tonic) pitch class. In the broadest possible sense, however, it refers to systematic arrangements of pitch phenomena and relations between them. (<xref ref-type="bibr" rid="r36">Hyer, 2021</xref>, p. 1)</p></disp-quote>
<p>Several music psychology models suggest that tonality perception is linked to the varying stabilities perceived in individual tones (<xref ref-type="bibr" rid="r80">Schmuckler, 2016</xref>). <xref ref-type="bibr" rid="r47">Krumhansl and Shepard (1979)</xref> demonstrate that tonal hierarchy is reflected in individuals’ stability ratings of tones, depending on the hierarchical level in the preceding tonal context. This hierarchy in classical/romantic music includes four levels: tonic, tonic triad, other diatonic tones, and non-diatonic tones (<xref ref-type="bibr" rid="r46">Krumhansl &amp; Kessler, 1982</xref>). <xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref> conclude that tonal hierarchy is stored in long-term memory as internal representations of tonal hierarchies (IRTH). In this paper, the ability to perceive the different stabilities of tones is referred to as sensitivity to IRTH.</p>
<p>Based on the above, our analyses focus on the IRTH acquisition processes (i.e., how IRTH evolves with increasing age). The scientific debate about the timing and mechanisms of IRTH development is ongoing (<xref ref-type="bibr" rid="r66">Patel, 2021</xref>), with narrative summaries (e.g., <xref ref-type="bibr" rid="r10">Corrigall &amp; Schellenberg, 2016</xref>; <xref ref-type="bibr" rid="r21">Gembris, 2017a</xref>) and theoretical models offering varied and sometimes contradictory conclusions. Earlier theories, such as Brehmer's concept of “tonal giftedness” (German: “Begabung”), suggest that this ability is fully developed by age 7 (Kühn, n.d., cited in <xref ref-type="bibr" rid="r8">Brehmer, 1925</xref>, p. 172). <xref ref-type="bibr" rid="r24">Gordon (2012)</xref> argues that musical aptitude and audiation show significant development before stabilizing around age 9, with limited improvement thereafter. This extended developmental trajectory contrasts with Brehmer's earlier views.</p>
<p><xref ref-type="bibr" rid="r19">Gardner’s (1973)</xref> theory includes two stages of artistic development concluding around age 7, whereas <xref ref-type="bibr" rid="r85">Swanwick and Tillman (1986</xref>) propose four stages extending into adolescence. <xref ref-type="bibr" rid="r30">Hargreaves (1996)</xref> supports the latter view, emphasizing the importance of ages 8 to 15 for mastering musical rules. Conversely, <xref ref-type="bibr" rid="r82">Serafine (1988)</xref> suggests a more restricted sensitive period for tonal learning from ages 8 to 10. In stark contrast, recent research highlights statistical learning as a key factor in lifelong IRTH development (<xref ref-type="bibr" rid="r41">Jonaitis &amp; Saffran, 2009</xref>; <xref ref-type="bibr" rid="r95">Vuvan, 2013</xref>), with evidence showing that this process begins as early as infancy (<xref ref-type="bibr" rid="r77">Saffran et al., 1999</xref>). Thus, whether IRTH has already developed fully by one’s school years or continues to develop during that time remains an open question.</p>
<p>Regarding primary studies, <xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref> identify a clear age-related progression in IRTH: first- and second-graders prefer diatonic tones over non-diatonic tones, third- and fourth-graders prefer the tonic triad over other diatonic tones, and fifth-graders as well as adults prefer the tonic overall. <xref ref-type="bibr" rid="r54">Maier-Karius and Schwarzer (2011)</xref>, <xref ref-type="bibr" rid="r64">Paananen (2007</xref>, <xref ref-type="bibr" rid="r65">2009</xref>), and <xref ref-type="bibr" rid="r81">Schwarzer et al. (1993)</xref> replicate this trajectory; however, <xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref>, <xref ref-type="bibr" rid="r79">Schellenberg et al. (2005)</xref>, <xref ref-type="bibr" rid="r83">Speer and Meeks (1985)</xref>, and <xref ref-type="bibr" rid="r99">Wilson and Wales (1995)</xref> find either earlier or later IRTH acquisition.</p>
<p>The failure to replicate previous findings may be related to several factors, such as participant characteristics or methodological differences. One factor might be formal musical training, defined as systematic instruction in music theory or practice (<xref ref-type="bibr" rid="r28">Hanna-Pladdy &amp; MacKay, 2011</xref>). Although some studies suggest that formal training enhances IRTH acquisition (<xref ref-type="bibr" rid="r11">Corrigall et al., 2022</xref>; <xref ref-type="bibr" rid="r55">Mandikal Vasuki et al., 2016</xref>), others find no such effect, primarily attributing acquisition to implicit learning processes (<xref ref-type="bibr" rid="r15">Cui, 2019</xref>; <xref ref-type="bibr" rid="r61">Müllensiefen et al., 2014</xref>). Moreover, the influence of formal training may depend on factors such as age, ongoing training, and varying types of operationalization (<xref ref-type="bibr" rid="r2">Asztalos &amp; Csapo, 2017</xref>; <xref ref-type="bibr" rid="r60">Müllensiefen et al., 2022</xref>; <xref ref-type="bibr" rid="r101">Zhang et al., 2020</xref>). Cultural background (<xref ref-type="bibr" rid="r56">Matsunaga et al., 2020</xref>), gender (<xref ref-type="bibr" rid="r51">Lin, 2023</xref>), and socioeconomic status (<xref ref-type="bibr" rid="r57">Miles et al., 2016</xref>) may also modulate IRTH acquisition.</p>
<p>Studies may also suffer from a lack of statistical power, which increases the likelihood of failing to detect a true population effect (<xref ref-type="bibr" rid="r18">Ellis, 2010</xref>). Finally, the specific method used to measure IRTH may affect the results. In contrast to the predictions of earlier theories on the development of tonal hierarchies, which rely on explicit measures with (partially) time-independent response formats, several studies using implicit measures report detecting tonal knowledge even in early childhood, indicating an earlier onset of this ability than previously suggested (<xref ref-type="bibr" rid="r40">Jentschke et al., 2005</xref>; <xref ref-type="bibr" rid="r70">Politimou et al., 2021</xref>; <xref ref-type="bibr" rid="r87">Trehub et al., 1999</xref>). <xref ref-type="bibr" rid="r11">Corrigall et al. (2022)</xref> find that task characteristics influence IRTH acquisition in school-aged children, with significant differences only emerging in explicit tasks.</p>
<p>In summary, despite 40 years of vibrant research, we are faced with a highly heterogeneous body of literature, making it difficult to draw clear evidence on the shape of IRTH skill acquisition. This complexity pertains not only to identifying the general developmental trajectory but also to distinguishing between specific phases of skill acquisition, such as the phase of initial skill acquisition and the potential onset of a saturation effect—a plateau in skill improvement in relation to the conditions (e.g., formal instruction) under which differences in the shapes and effects of skill acquisition occur.</p>
<sec sec-type="other1"><title>Aims and Objectives</title>
<p>We conducted a critical review of four decades of research on the development of IRTH sensitivity. Despite a sizeable volume of studies, the findings remain heterogeneous and partially contradictory, particularly regarding developmental trajectories and the influence of musical training. Building on <xref ref-type="bibr" rid="r24">Gordon’s (2012)</xref> theory of music learning, which posits that core aspects of tonal sensitivity are largely developed by age 9, we formulated four exploratory research questions. By examining these questions, this study aimed to (1) assess the magnitude of age-related changes in IRTH sensitivity, (2) examine whether sensitivity increases significantly beyond age 9, (3) investigate the role of musical training, and (4) explore the effects of different operationalizations of IRTH measurement.</p></sec>
<sec sec-type="other2"><title>Research Questions</title>
<p><bold>Research Question 1 (RQ1).</bold> How substantial is the average age-related development of IRTH sensitivity?</p>
<p><?disable-indent?><bold>Research Question 2 (RQ2).</bold> Does IRTH sensitivity continue to increase beyond the age of 9, or does it level off, as predicted by Gordon’s learning theory?</p>
	<p><?disable-indent?><bold>Research Question 3 (RQ3).</bold> Is IRTH sensitivity significantly higher in musically trained individuals than in those without musical training?</p>
	<p><?disable-indent?><bold>Research Question 4 (RQ4).</bold> Does the implicit measurement of IRTH sensitivity via response time yield lower estimates than more explicit operationalizations?</p></sec></sec>
<sec sec-type="methods"><title>Method</title>
<sec><title>Procedure</title>
<p>We conducted a systematic and comprehensive literature search (<xref ref-type="bibr" rid="r97">What Works Clearinghouse, 2020</xref>) between January and April 2022 to identify eligible studies. The study selection followed a predefined process outlined in the review protocol (see Supplementary Material S1), which was not published before the review was conducted. In the final sample, we included only primary research studies of the preliminary literature corpus that used a hypothesis-testing approach, followed either a cross-sectional or longitudinal design, were published between 1982<xref ref-type="fn" rid="fn1"><sup>1</sup></xref><fn id="fn1"><label>1</label>
<p>We included only articles published after 1982 following <xref ref-type="bibr" rid="r46">Krumhansl and Kessler’s (1982)</xref> pioneering work in this field.</p></fn> and April 2022, investigated a sample of healthy elementary and secondary school students, and defined the measurement of IRTH sensitivity as a dependent variable based on either a listening task (probe tone paradigm, response time measures, and goodness-of-fit ratings in syntax-violation paradigms) or a creative production task (harmonization of a given melody, tonal composition, and improvisation to a given chord sequence). These operationalizations were further specified as described below.</p>
<p>First, the probe tone paradigm (<xref ref-type="bibr" rid="r47">Krumhansl &amp; Shepard, 1979</xref>) involves presenting one or two of the 12 chromatic tones (the "probe") after establishing the tonal context (e.g., an ascending major scale), followed by a brief silence. Participants rate how well the probe tones fit the tonal context. This process continues until all 12 chromatic tones are rated. The perceived stability of each tone is measured based on participants’ goodness-of-fit ratings. The correlation of these ratings with the prototypical tonal hierarchy (see above) defines participants’ sensitivity to IRTH. Although no standardized protocols or psychometric criteria<xref ref-type="fn" rid="fn2"><sup>2</sup></xref><fn id="fn2"><label>2</label>
<p>The lack of these psychometric criteria also applies to all of the measurement methods (exception: <xref ref-type="bibr" rid="r99">Wilson &amp; Wales, 1995</xref>).</p></fn> have been established, the probe tone paradigm has been consistently replicated across various contexts, demonstrating its robustness (<xref ref-type="bibr" rid="r58">Morgan et al., 2019</xref>; <xref ref-type="bibr" rid="r78">Sauvé et al., 2021</xref>).</p>
<p>Second, some studies use goodness-of-fit ratings in a syntax-violation paradigm (e.g., <xref ref-type="bibr" rid="r11">Corrigall et al., 2022</xref>). Participants judge how well the final tone of short melodies fits within the preceding harmonic context with varying degrees of tonal congruence (e.g., a tonic note such as "C" in C major versus a non-diatonic note such as "C#"). A greater difference in ratings between congruent and incongruent endings indicates IRTH acquisition, with higher ratings for congruent endings reflecting higher IRTH sensitivity.</p>
<p>Third, <xref ref-type="bibr" rid="r79">Schellenberg et al. (2005)</xref> and <xref ref-type="bibr" rid="r11">Corrigall et al. (2022)</xref> focus on response times (as introduced by <xref ref-type="bibr" rid="r39">Janata &amp; Reisberg, 1988</xref>). Rather than explicitly evaluating the tonal congruence of melody endings, participants rate other musical features, such as the timbre of the final tone, while hearing a priming sequence with either a tonally congruent (expected) or incongruent (unexpected) final tone. Faster and more accurate responses are expected when the target tone or chord is more tonally congruent with the preceding context, indicating stronger IRTH sensitivity.</p>
<p>Fourth, other methods involve creative production tasks, such as composing (<xref ref-type="bibr" rid="r99">Wilson &amp; Wales, 1995</xref>), improvising while listening to a pre-recorded tonal chord sequence (<xref ref-type="bibr" rid="r63">Paananen, 2003</xref>), or harmonizing a melody (<xref ref-type="bibr" rid="r65">Paananen, 2009</xref>). The outcome variables are defined by the degree of tonal fit and timing of the tones or chords used by the participants. <xref ref-type="bibr" rid="r99">Wilson and Wales (1995</xref>, p. 102) report a substantial to almost perfect inter-rater agreement (cf., <xref ref-type="bibr" rid="r50">Landis &amp; Koch, 1977</xref>) for expert assessments of compositions <inline-formula><mml:math id="m1"><mml:mfenced separators="|"><mml:mrow><mml:mo>.</mml:mo><mml:mn>69</mml:mn><mml:mi> </mml:mi><mml:mo>≤</mml:mo><mml:mi>κ</mml:mi><mml:mi> </mml:mi><mml:mo>≤</mml:mo><mml:mo>.</mml:mo><mml:mn>92</mml:mn></mml:mrow></mml:mfenced></mml:math></inline-formula>.</p>
	<p>In the next step, three independent and trained coders (including the first author) coded the included studies according to a previously developed protocol (see Supplemental Material S2). After calculating the initial inter-rater reliability, which showed almost perfect agreement <inline-formula><mml:math id="m2"><mml:mfenced separators="|"><mml:mrow><mml:mi>κ</mml:mi><mml:mo>=</mml:mo><mml:mi> </mml:mi><mml:mo>.</mml:mo><mml:mn>92</mml:mn></mml:mrow></mml:mfenced></mml:math></inline-formula>, coding discrepancies were resolved by consensus. The studies vary in whether and how they report participants' formal musical training; therefore, we calculated the percentage of those with training for each age group. Sufficient data are available in 11 studies, while other variables are coded as not applicable (“n/a”).</p></sec>
<sec><title>Data Analysis</title>
<p>Data were analyzed using two approaches. First, we conducted a Bayesian three-level meta-analysis to provide a quantitative summary of the systematic review, offer an overview, identify notable studies, and investigate differences in IRTH measurements. Second, we conducted a model comparison analysis of the cross-sectional data of a single study (<xref ref-type="bibr" rid="r45">Krumhansl &amp; Keil, 1982</xref>) investigating the growth trajectory of IRTH acquisition.</p>
<p>In the meta-analytical approach, effect sizes were estimated from primary studies using the metafor package (<xref ref-type="bibr" rid="r92">Viechtbauer, 2010</xref>) in R (<xref ref-type="bibr" rid="r74">R Core Team, 2022</xref>) and, if needed, transformed into Cohen’s <inline-formula><mml:math id="m3"><mml:mi>d</mml:mi></mml:math></inline-formula> following <xref ref-type="bibr" rid="r6">Borenstein and Hedges (2019</xref>, pp. 214–234). The procedure for effect size calculations, raw data, and a markdown script for the Bayesian three-level meta-analysis are shown in Supplemental Materials S3, S4, and S5.</p>
<p>In the subsequent analysis step, the effect sizes were aggregated and weighted using a Bayesian three-level meta-analysis with the R package brms (<xref ref-type="bibr" rid="r9">Bürkner, 2017</xref>), following the procedure of <xref ref-type="bibr" rid="r32">Harrer et al. (2021)</xref>. Unlike a one-level fixed effect model that only attributes variance to sampling error, the two-level random effects model separates variance into sampling errors<xref ref-type="fn" rid="fn3"><sup>3</sup></xref><fn id="fn3"><label>3</label>
<p>As a consequence of <xref ref-type="bibr" rid="r88">Turner and Higgins (2019</xref>, p. 302), Bayesian models do not estimate the sampling error, as it is assumed to be known based on the sample size.</p></fn> and between-study heterogeneity (<inline-formula><mml:math id="m4"><mml:msubsup><mml:mrow><mml:mi mathvariant="normal">τ</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msubsup></mml:math></inline-formula>). This model captures inherent differences between studies, such as measurement methods.</p>
<p>Our model further includes a third level of variance <inline-formula><mml:math id="m5"><mml:mfenced separators="|"><mml:mrow><mml:msubsup><mml:mrow><mml:mi mathvariant="normal">τ</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msubsup></mml:mrow></mml:mfenced><mml:mo>,</mml:mo><mml:mi mathvariant="normal"> </mml:mi></mml:math></inline-formula>reflecting the nested structure of effect sizes within studies and accounting for the variance within single studies, such as different age groups. This multilevel approach (for a formal model description, see Supplemental Material S6) better reflects the nested structure of our data and avoids the statistical issues of traditional univariate meta-analysis, which can misestimate heterogeneity and increase the risk of false positives (<xref ref-type="bibr" rid="r32">Harrer et al., 2021</xref>; <xref ref-type="bibr" rid="r35">Hedges, 2019</xref>). We compared models with differing levels of complexity by computing marginal likelihoods using the bridge sampling method implemented in the brms package.</p>
	<p>We chose Bayesian meta-analysis for two key reasons. First, it allows for the explicit modeling of heterogeneity uncertainty (<inline-formula><mml:math id="m6"><mml:msup><mml:mrow><mml:mi>τ</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msup></mml:math></inline-formula>), which can yield more stable estimates in small-sample contexts—especially when applying weakly or moderately informative priors (<xref ref-type="bibr" rid="r32">Harrer et al., 2021</xref>). Notably, although Bayesian methods are not inherently robust to small samples or poor study quality, they provide a principled framework for incorporating prior knowledge and quantifying uncertainty. Second, prior information can improve the posterior estimation of key parameters, such as <inline-formula><mml:math id="m7"><mml:mi mathvariant="normal">μ</mml:mi></mml:math></inline-formula> (intercept) and <inline-formula><mml:math id="m8"><mml:mi>τ</mml:mi></mml:math></inline-formula> (standard deviations; <xref ref-type="bibr" rid="r76">Röver, 2020</xref>).</p>
	<p>To address the context-dependence of choosing the prior parameter settings (<xref ref-type="bibr" rid="r20">Gelman et al., 2015</xref>), we initially used two separate and weakly informative zero-centered priors for <inline-formula><mml:math id="m9"><mml:mi mathvariant="normal">μ</mml:mi></mml:math></inline-formula> and<inline-formula><mml:math id="m10"><mml:mi mathvariant="normal"> </mml:mi><mml:mi mathvariant="normal">τ</mml:mi></mml:math></inline-formula>, as recommended by <xref ref-type="bibr" rid="r98">Williams et al. (2018)</xref> and <xref ref-type="bibr" rid="r32">Harrer et al. (2021</xref>, Setting Prior Distributions, para. 5):</p>
<list id="L1" list-type="bullet">
<list-item>
<p>Prior 1: <inline-formula><mml:math id="m11"><mml:mi mathvariant="normal">μ</mml:mi><mml:mi mathvariant="normal"> </mml:mi><mml:mo>∼</mml:mo><mml:mi mathvariant="normal"> </mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mi mathvariant="normal">o</mml:mi><mml:mi mathvariant="normal">r</mml:mi><mml:mi mathvariant="normal">m</mml:mi><mml:mi mathvariant="normal">a</mml:mi><mml:mi mathvariant="normal">l</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:mi mathvariant="normal"> </mml:mi><mml:mn>1</mml:mn></mml:mrow></mml:mfenced></mml:math></inline-formula></p></list-item>
<list-item>
	<p>Prior 2: <inline-formula><mml:math id="m12"><mml:mi mathvariant="normal">τ</mml:mi><mml:mi mathvariant="normal"> </mml:mi><mml:mo>∼</mml:mo><mml:mi mathvariant="normal"> </mml:mi><mml:mi mathvariant="normal">H</mml:mi><mml:mi mathvariant="normal">a</mml:mi><mml:mi mathvariant="normal">l</mml:mi><mml:mi mathvariant="normal">f</mml:mi><mml:mi mathvariant="normal">c</mml:mi><mml:mi mathvariant="normal">a</mml:mi><mml:mi mathvariant="normal">u</mml:mi><mml:mi mathvariant="normal">c</mml:mi><mml:mi mathvariant="normal">h</mml:mi><mml:mi mathvariant="normal">y</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:mi mathvariant="normal"> </mml:mi><mml:mn>0.5</mml:mn></mml:mrow></mml:mfenced></mml:math></inline-formula></p></list-item>
</list>
	<p>Subsequently, we performed sensitivity analyses to estimate the impact of prior parameter choices on the posterior density distributions of the parameter estimates. Therefore, following <xref ref-type="bibr" rid="r76">Röver (2020)</xref> and <xref ref-type="bibr" rid="r88">Turner and Higgins (2019)</xref>, we used two alternative weakly informative priors for both <inline-formula><mml:math id="m13"><mml:mi mathvariant="normal">μ</mml:mi></mml:math></inline-formula> and<inline-formula><mml:math id="m14"><mml:mi mathvariant="normal"> </mml:mi><mml:mi mathvariant="normal">τ</mml:mi></mml:math></inline-formula>, while τ was modeled as a standard deviation parameter constrained to be positive, implying half-distributions for the respective priors:</p>
<list id="L2" list-type="bullet">
<list-item>
<p>Prior 3: <inline-formula><mml:math id="m15"><mml:mi mathvariant="normal">μ</mml:mi><mml:mo>,</mml:mo><mml:mi mathvariant="normal"> </mml:mi><mml:mi mathvariant="normal">τ</mml:mi><mml:mi mathvariant="normal"> </mml:mi><mml:mo>∼</mml:mo><mml:mi mathvariant="normal"> </mml:mi><mml:mi mathvariant="normal">N</mml:mi><mml:mi mathvariant="normal">o</mml:mi><mml:mi mathvariant="normal">r</mml:mi><mml:mi mathvariant="normal">m</mml:mi><mml:mi mathvariant="normal">a</mml:mi><mml:mi mathvariant="normal">l</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:mi mathvariant="normal"> </mml:mi><mml:mn>0.5</mml:mn></mml:mrow></mml:mfenced></mml:math></inline-formula></p></list-item>
<list-item>
<p>Prior 4: <inline-formula><mml:math id="m16"><mml:mi mathvariant="normal">μ</mml:mi><mml:mo>,</mml:mo><mml:mi mathvariant="normal"> </mml:mi><mml:mi mathvariant="normal">τ</mml:mi><mml:mi mathvariant="normal"> </mml:mi><mml:mo>∼</mml:mo><mml:mi mathvariant="normal"> </mml:mi><mml:mi>t</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mn>3</mml:mn><mml:mo>,</mml:mo><mml:mi mathvariant="normal"> </mml:mi><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:mi mathvariant="normal"> </mml:mi><mml:mn>2.5</mml:mn></mml:mrow></mml:mfenced></mml:math></inline-formula></p></list-item>
</list>
<p>We did not conduct a meta-regression using age as a moderator because of the limited number of studies, heterogeneity in age reporting, and insufficient information on age distribution in several samples.</p>
<p>We examined the magnitude of age-related development in IRTH sensitivity (RQ1) by fitting a Bayesian three-level meta-analytic model using the brms package in R. Small effects (<inline-formula><mml:math id="m17"><mml:mi>d</mml:mi><mml:mi> </mml:mi><mml:mo>≈</mml:mo><mml:mi> </mml:mi><mml:mn>0.2</mml:mn></mml:math></inline-formula>) are often considered the minimum threshold for practical relevance in developmental research (e.g., <xref ref-type="bibr" rid="r23">Gignac &amp; Szodorai, 2016</xref>), and the average difference in IRTH sensitivity between older and younger participants meets or exceeds the benchmark for a small effect. Insufficient information reported in the primary studies prevented us from conducting a meta-regression with musical training as a moderator (RQ2). Therefore, the impact of musical training on IRTH development remains an open research question.</p>
<p>To address RQ3, we estimated the impact of operationalization on effect size using a Bayesian three-level meta-regression in brms. The model included operationalization as a moderator, accounted for the nesting of effect sizes within studies, and incorporated their standard errors. Random effects were specified at the study and within-study levels.</p>
<p>We examined RQ4 using <xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref>, who report notable within-study heterogeneity, to compare learning-theory-informed models using data from. The dataset comprised four age groups assessed across five probe tone conditions. Based on age-specific difference scores, we fitted linear (linear, quadratic, cubic) and non-linear (sigmoidal, logistic, mixed, saturated) functions to model the development of tone judgment stability. Analyses were conducted using the R packages lme4 (<xref ref-type="bibr" rid="r3">Bates et al., 2015</xref>) and nlme (<xref ref-type="bibr" rid="r67">Pinheiro &amp; Bates, 2024</xref>; see S7 for data and S8 for code).</p></sec></sec>
<sec sec-type="results"><title>Results</title>
<p>Our search process yielded <italic>h</italic> = 3,635 hits. We excluded articles based on a range of criteria (see <xref ref-type="fig" rid="f1">Figure 1</xref> for details). Ultimately, we included <italic>i</italic> = 13 articles reporting <italic>j</italic> = 16 studies with <italic>y</italic> = 60 effect sizes for <italic>N</italic> = 1,287 participants.</p>
	
	<fig id="f1" position="anchor" fig-type="figure" orientation="portrait"><label>Figure 1</label><caption>
<title>Study Selection Flowchart</title></caption><graphic xlink:href="jbdgm.205-f1" position="anchor" orientation="portrait"/></fig>
	
<p><xref ref-type="table" rid="t1">Table 1</xref> presents the descriptive statistics for the effect sizes of the included studies. All studies were cross-sectional, with no longitudinal studies fulfilling the eligibility criteria. The sample sizes of the included studies ranged from <italic>n</italic> = 24 (<xref ref-type="bibr" rid="r65">Paananen, 2009</xref>; <xref ref-type="bibr" rid="r83">Speer &amp; Meeks, 1985</xref>) to <italic>n</italic> = 285 (<xref ref-type="bibr" rid="r49">Lamont &amp; Cross, 1994</xref>). The studies’ contributions to the pooled effect size estimation differed, with weights ranging from approximately 2% (<xref ref-type="bibr" rid="r65">Paananen, 2009</xref>; <xref ref-type="bibr" rid="r83">Speer &amp; Meeks, 1985</xref>) to 20% (<xref ref-type="bibr" rid="r49">Lamont &amp; Cross, 1994</xref>). Effect sizes varied widely, 0 ≤ <italic>d</italic> ≤ 3.9 with 0.14 ≤ υ ≤ 0.41, indicating substantial variance.</p>
	
	<?figure f1?>
	
<table-wrap id="t1" position="anchor" orientation="portrait">
<label>Table 1</label><caption><title>Descriptive Statistics of Effect Sizes in Primary Studies and the Multi-Level Data Structure</title></caption>
<table frame="hsides" rules="groups">
<col width="40%" align="left"/>
<col width="10%"/>
<col width="10%"/>
<col width="10%"/>
<col width="10%"/>
<col width="10%"/>
<col width="10%"/>
<thead>
<tr>
<th valign="bottom" rowspan="2" scope="rowgroup" align="left">Author (Year)</th>
	<th valign="bottom" colspan="3" scope="colgroup">ID<hr/></th>
	<th valign="bottom" rowspan="2"><inline-formula><mml:math id="m27"><mml:mi>d</mml:mi></mml:math></inline-formula></th>
	<th valign="bottom" rowspan="2"><inline-formula><mml:math id="m28"><mml:msup><mml:mrow><mml:mi>s</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msup></mml:math></inline-formula></th>
	<th valign="bottom" rowspan="2"><inline-formula><mml:math id="m29"><mml:mi>N</mml:mi></mml:math></inline-formula></th>
</tr>
<tr>
<th scope="colgroup">Article</th>
<th>Study</th>
<th>ES</th>
</tr>
</thead>
<tbody>
<tr>
<td><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref></td>
<td>1</td>
<td>1</td>
<td>1</td>
<td align="char" char=".">2.35</td>
<td align="char" char=".">0.24</td>
<td>28</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref></td>
<td>1</td>
<td>1</td>
<td>2</td>
<td align="char" char=".">1.78</td>
<td align="char" char=".">0.20</td>
<td>28</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref></td>
<td>1</td>
<td>1</td>
<td>3</td>
<td align="char" char=".">0.00</td>
<td align="char" char=".">0.14</td>
<td>28</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref></td>
<td>1</td>
<td>1</td>
<td>4</td>
<td align="char" char=".">0.00</td>
<td align="char" char=".">0.14</td>
<td>28</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref></td>
<td>1</td>
<td>1</td>
<td>5</td>
<td align="char" char=".">0.00</td>
<td align="char" char=".">0.14</td>
<td>28</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref></td>
<td>1</td>
<td>1</td>
<td>6</td>
<td align="char" char=".">0.87</td>
<td align="char" char=".">0.16</td>
<td>28</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref></td>
<td>1</td>
<td>1</td>
<td>7</td>
<td align="char" char=".">1.10</td>
<td align="char" char=".">0.16</td>
<td>28</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref></td>
<td>1</td>
<td>1</td>
<td>8</td>
<td align="char" char=".">0.56</td>
<td align="char" char=".">0.15</td>
<td>28</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref></td>
<td>1</td>
<td>1</td>
<td>9</td>
<td align="char" char=".">0.00</td>
<td align="char" char=".">0.14</td>
<td>28</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref></td>
<td>1</td>
<td>1</td>
<td>10</td>
<td align="char" char=".">0.00</td>
<td align="char" char=".">0.14</td>
<td>28</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref></td>
<td>1</td>
<td>1</td>
<td>11</td>
<td align="char" char=".">3.90</td>
<td align="char" char=".">0.41</td>
<td>28</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref></td>
<td>1</td>
<td>1</td>
<td>12</td>
<td align="char" char=".">3.02</td>
<td align="char" char=".">0.31</td>
<td>28</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref></td>
<td>1</td>
<td>1</td>
<td>13</td>
<td align="char" char=".">0.72</td>
<td align="char" char=".">0.15</td>
<td>28</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref></td>
<td>1</td>
<td>1</td>
<td>14</td>
<td align="char" char=".">0.60</td>
<td align="char" char=".">0.15</td>
<td>28</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref></td>
<td>1</td>
<td>1</td>
<td>15</td>
<td align="char" char=".">1.24</td>
<td align="char" char=".">0.17</td>
<td>28</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r83">Speer and Meeks (1985)</xref></td>
<td>2</td>
<td>2</td>
<td>16</td>
<td align="char" char=".">0.66</td>
<td align="char" char=".">0.18</td>
<td>24</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r14">Cuddy and Badertscher (1987)</xref></td>
<td>3</td>
<td>3</td>
<td>17</td>
<td align="char" char=".">0.50</td>
<td align="char" char=".">0.10</td>
<td>41</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r14">Cuddy and Badertscher (1987)</xref></td>
<td>3</td>
<td>3</td>
<td>18</td>
<td align="char" char=".">0.58</td>
<td align="char" char=".">0.14</td>
<td>33</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r81">Schwarzer et al. (1993)</xref></td>
<td>4</td>
<td>4</td>
<td>19</td>
<td align="char" char=".">1.21</td>
<td align="char" char=".">0.10</td>
<td>46</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r81">Schwarzer et al. (1993)</xref></td>
<td>4</td>
<td>4</td>
<td>20</td>
<td align="char" char=".">1.49</td>
<td align="char" char=".">0.11</td>
<td>46</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r81">Schwarzer et al. (1993)</xref></td>
<td>4</td>
<td>4</td>
<td>21</td>
<td align="char" char=".">1.70</td>
<td align="char" char=".">0.12</td>
<td>46</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r49">Lamont and Cross (1994)</xref></td>
<td>5</td>
<td>5</td>
<td>22</td>
<td align="char" char=".">0.69</td>
<td align="char" char=".">0.02</td>
<td>285</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r99">Wilson and Wales (1995)</xref></td>
<td>6</td>
<td>6</td>
<td>23</td>
<td align="char" char=".">0.10</td>
<td align="char" char=".">0.07</td>
<td>54</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r63">Paananen (2003)</xref></td>
<td>7</td>
<td>7</td>
<td>24</td>
<td align="char" char=".">0.61</td>
<td align="char" char=".">0.17</td>
<td>24</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r63">Paananen (2003)</xref></td>
<td>7</td>
<td>7</td>
<td>25</td>
<td align="char" char=".">0.78</td>
<td align="char" char=".">0.18</td>
<td>24</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r63">Paananen (2003)</xref></td>
<td>7</td>
<td>7</td>
<td>26</td>
<td align="char" char=".">0.53</td>
<td align="char" char=".">0.17</td>
<td>24</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r63">Paananen (2003)</xref></td>
<td>7</td>
<td>7</td>
<td>27</td>
<td align="char" char=".">0.40</td>
<td align="char" char=".">0.17</td>
<td>24</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r63">Paananen (2003)</xref></td>
<td>7</td>
<td>7</td>
<td>28</td>
<td align="char" char=".">0.49</td>
<td align="char" char=".">0.17</td>
<td>24</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r63">Paananen (2003)</xref></td>
<td>7</td>
<td>7</td>
<td>29</td>
<td align="char" char=".">0.31</td>
<td align="char" char=".">0.17</td>
<td>24</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r63">Paananen (2003)</xref></td>
<td>7</td>
<td>7</td>
<td>30</td>
<td align="char" char=".">0.30</td>
<td align="char" char=".">0.17</td>
<td>24</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r63">Paananen (2003)</xref></td>
<td>7</td>
<td>7</td>
<td>31</td>
<td align="char" char=".">0.28</td>
<td align="char" char=".">0.17</td>
<td>24</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r63">Paananen (2003)</xref></td>
<td>7</td>
<td>7</td>
<td>32</td>
<td align="char" char=".">0.43</td>
<td align="char" char=".">0.17</td>
<td>24</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r63">Paananen (2003)</xref></td>
<td>7</td>
<td>7</td>
<td>33</td>
<td align="char" char=".">0.23</td>
<td align="char" char=".">0.17</td>
<td>24</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r79">Schellenberg et al. (2005)</xref> I</td>
<td>8</td>
<td>8</td>
<td>34</td>
<td align="char" char=".">0.68</td>
<td align="char" char=".">0.19</td>
<td>23</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r79">Schellenberg et al. (2005)</xref> II</td>
<td>8</td>
<td>9</td>
<td>35</td>
<td align="char" char=".">0.53</td>
<td align="char" char=".">0.12</td>
<td>36</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r79">Schellenberg et al. (2005)</xref> III</td>
<td>8</td>
<td>10</td>
<td>36</td>
<td align="char" char=".">0.43</td>
<td align="char" char=".">0.09</td>
<td>44</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r65">Paananen (2009)</xref></td>
<td>9</td>
<td>11</td>
<td>37</td>
<td align="char" char=".">0.46</td>
<td align="char" char=".">0.26</td>
<td>17</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r65">Paananen (2009)</xref></td>
<td>9</td>
<td>11</td>
<td>38</td>
<td align="char" char=".">-0.05</td>
<td align="char" char=".">0.26</td>
<td>17</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r65">Paananen (2009)</xref></td>
<td>9</td>
<td>11</td>
<td>39</td>
<td align="char" char=".">-0.36</td>
<td align="char" char=".">0.18</td>
<td>23</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r65">Paananen (2009)</xref></td>
<td>9</td>
<td>11</td>
<td>40</td>
<td align="char" char=".">0.62</td>
<td align="char" char=".">0.18</td>
<td>23</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r65">Paananen (2009)</xref></td>
<td>9</td>
<td>11</td>
<td>41</td>
<td align="char" char=".">1.56</td>
<td align="char" char=".">0.27</td>
<td>20</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r65">Paananen (2009)</xref></td>
<td>9</td>
<td>11</td>
<td>42</td>
<td align="char" char=".">0.78</td>
<td align="char" char=".">0.22</td>
<td>20</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r54">Maier-Karius and Schwarzer (2011)</xref></td>
<td>10</td>
<td>12</td>
<td>43</td>
<td align="char" char=".">0.71</td>
<td align="char" char=".">0.06</td>
<td>72</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r54">Maier-Karius and Schwarzer (2011)</xref></td>
<td>10</td>
<td>12</td>
<td>44</td>
<td align="char" char=".">1.23</td>
<td align="char" char=".">0.15</td>
<td>42</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r38">James et al. (2012)</xref></td>
<td>11</td>
<td>13</td>
<td>45</td>
<td align="char" char=".">0.77</td>
<td align="char" char=".">0.04</td>
<td>112</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r38">James et al. (2012)</xref></td>
<td>11</td>
<td>13</td>
<td>46</td>
<td align="char" char=".">0.11</td>
<td align="char" char=".">0.04</td>
<td>112</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r38">James et al. (2012)</xref></td>
<td>11</td>
<td>13</td>
<td>47</td>
<td align="char" char=".">0.45</td>
<td align="char" char=".">0.04</td>
<td>112</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> I</td>
<td>12</td>
<td>14</td>
<td>48</td>
<td align="char" char=".">0.69</td>
<td align="char" char=".">0.09</td>
<td>48</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> I</td>
<td>12</td>
<td>14</td>
<td>49</td>
<td align="char" char=".">0.46</td>
<td align="char" char=".">0.08</td>
<td>50</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> I</td>
<td>12</td>
<td>14</td>
<td>50</td>
<td align="char" char=".">-0.04</td>
<td align="char" char=".">0.08</td>
<td>52</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> I</td>
<td>12</td>
<td>14</td>
<td>51</td>
<td align="char" char=".">0.29</td>
<td align="char" char=".">0.09</td>
<td>48</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> I</td>
<td>12</td>
<td>14</td>
<td>52</td>
<td align="char" char=".">0.63</td>
<td align="char" char=".">0.09</td>
<td>48</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> II</td>
<td>12</td>
<td>15</td>
<td>53</td>
<td align="char" char=".">-0.37</td>
<td align="char" char=".">0.08</td>
<td>51</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> II</td>
<td>12</td>
<td>15</td>
<td>54</td>
<td align="char" char=".">0.18</td>
<td align="char" char=".">0.09</td>
<td>44</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> II</td>
<td>12</td>
<td>15</td>
<td>55</td>
<td align="char" char=".">0.71</td>
<td align="char" char=".">0.10</td>
<td>42</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> II</td>
<td>12</td>
<td>15</td>
<td>56</td>
<td align="char" char=".">-0.09</td>
<td align="char" char=".">0.08</td>
<td>49</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> II</td>
<td>12</td>
<td>15</td>
<td>57</td>
<td align="char" char=".">0.67</td>
<td align="char" char=".">0.08</td>
<td>52</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r11">Corrigall et al. (2022)</xref></td>
<td>13</td>
<td>16</td>
<td>58</td>
<td align="char" char=".">0.33</td>
<td align="char" char=".">0.04</td>
<td>97</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r11">Corrigall et al. (2022)</xref></td>
<td>13</td>
<td>16</td>
<td>59</td>
<td align="char" char=".">-0.25</td>
<td align="char" char=".">0.04</td>
<td>97</td>
</tr>
<tr>
<td><xref ref-type="bibr" rid="r11">Corrigall et al. (2022)</xref></td>
<td>13</td>
<td>16</td>
<td>60</td>
<td align="char" char=".">0.82</td>
<td align="char" char=".">0.04</td>
<td>97</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The studies included participants from various age groups, ranging from age 6 (e.g., <xref ref-type="bibr" rid="r45">Krumhansl &amp; Keil, 1982</xref>) to age 15 (<xref ref-type="bibr" rid="r65">Paananen, 2009</xref>). Adults were used as the treatment group in five studies (e.g., <xref ref-type="bibr" rid="r56">Matsunaga et al., 2020</xref>) because they were assumed to have fully developed IRTH, making them a suitable reference population. However, as suggested by our subsequent model comparison analyses, this assumption appears to be only partially accurate, as adults do not consistently demonstrate superior performance in tasks with higher cognitive demands. For a visualization of the correlation between the age of the treatment group, the age of the control group, and the effect sizes, see the scatter plot in Supplemental Material S9. Most studies used the probe tone technique for the dependent variable, either with a rating scale (<italic>j</italic> = 5) or by asking the participants to produce the most appropriate probe tone (<italic>j</italic> = 1). This includes studies using goodness-of-fit ratings for syntax violations and three studies using creative tasks, such as composition, improvisation, or harmonization (<xref ref-type="table" rid="t2">Table 2</xref>).</p>
<table-wrap id="t2" position="anchor" orientation="landscape">
<label>Table 2</label><caption><title>Characteristics of Primary Studies</title></caption>
<table frame="hsides" rules="groups">
<col width="5%" align="left"/>
<col width="32%"/>
<col width="9%"/>
<col width="9%"/>
<col width="9%"/>
<col width="9%"/>
<col width="9%"/>
<col width="9%"/>
<col width="9%"/>
<thead>
<tr>
<th valign="bottom" rowspan="2" scope="rowgroup" align="left">ID</th>
	<th valign="bottom" rowspan="2" align="left">Author (Year)</th>
	<th valign="bottom" rowspan="2">DV</th>
	<th valign="bottom" colspan="2" scope="colgroup"><italic>n</italic><hr/></th>
	<th valign="bottom" colspan="2" scope="colgroup">Mean Age<hr/></th>
	<th valign="bottom" colspan="2" scope="colgroup">Children with Formal Musical Training (%)<hr/></th>
</tr>
<tr>
<th>Treat</th>
<th>Cont</th>
<th>Treat</th>
<th>Cont</th>
<th>Treat</th>
<th>Cont</th>
</tr>
</thead>
<tbody>
<tr>
<td>1</td>
	<td align="left"><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref>, comp. 1</td>
<td>PT</td>
<td>14</td>
<td>14</td>
	<td align="char" char=".">8.5</td>
	<td align="char" char=".">6.5</td>
<td>71</td>
<td>43</td>
</tr>
<tr>
<td>1</td>
	<td align="left"><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref>, comp. 2</td>
<td>PT</td>
<td>14</td>
<td>14</td>
<td align="char" char=".">10.5</td>
<td align="char" char=".">8.5</td>
<td>79</td>
<td>71</td>
</tr>
<tr>
<td>1</td>
	<td align="left"><xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref>, comp. 3</td>
<td>PT</td>
<td>14</td>
<td>14</td>
<td>20</td>
<td align="char" char=".">10.5</td>
<td>86</td>
<td>79</td>
</tr>
<tr>
<td>2</td>
	<td align="left"><xref ref-type="bibr" rid="r83">Speer and Meeks (1985)</xref><sup>a</sup></td>
<td>PT</td>
<td>12</td>
<td>12</td>
<td>10</td>
<td>7</td>
<td>42</td>
<td>33</td>
</tr>
<tr>
<td>3</td>
	<td align="left"><xref ref-type="bibr" rid="r14">Cuddy and Badertscher (1987)</xref>, comp. 1</td>
<td>PT</td>
<td>21</td>
<td>20</td>
<td align="char" char=".">8.5</td>
<td align="char" char=".">6.5</td>
<td>43</td>
<td>45</td>
</tr>
<tr>
<td>3</td>
	<td align="left"><xref ref-type="bibr" rid="r14">Cuddy and Badertscher (1987)</xref>, comp. 2</td>
<td>PT</td>
<td>12</td>
<td>21</td>
<td align="char" char=".">10.5</td>
<td align="char" char=".">8.5</td>
<td>42</td>
<td>43</td>
</tr>
<tr>
<td>4</td>
	<td align="left"><xref ref-type="bibr" rid="r81">Schwarzer et al. (1993)</xref><sup>a</sup></td>
<td>PTP</td>
<td>20</td>
<td>26</td>
<td>20</td>
<td>9</td>
<td>25</td>
<td>23</td>
</tr>
<tr>
<td>5</td>
	<td align="left"><xref ref-type="bibr" rid="r49">Lamont and Cross (1994)</xref><sup>b</sup></td>
<td>PT</td>
<td>285</td>
<td>—</td>
<td>6-9</td>
<td>—</td>
<td>n/a</td>
<td>n/a</td>
</tr>
<tr>
<td>6</td>
	<td align="left"><xref ref-type="bibr" rid="r99">Wilson and Wales (1995)</xref></td>
<td>Comp</td>
<td>36</td>
<td>37</td>
<td>9</td>
<td>7</td>
<td>42</td>
<td>62</td>
</tr>
<tr>
<td>7</td>
	<td align="left"><xref ref-type="bibr" rid="r63">Paananen (2003)</xref>, comp. 1</td>
<td>Imp</td>
<td>12</td>
<td>12</td>
<td align="char" char=".">8.5</td>
<td align="char" char=".">6.5</td>
<td>n/a</td>
<td>n/a</td>
</tr>
<tr>
<td>7</td>
	<td align="left"><xref ref-type="bibr" rid="r63">Paananen (2003)</xref>, comp. 2</td>
<td>Imp</td>
<td>12</td>
<td>12</td>
<td align="char" char=".">10.5</td>
<td align="char" char=".">8.5</td>
<td>n/a</td>
<td>n/a</td>
</tr>
<tr>
<td>8</td>
	<td align="left"><xref ref-type="bibr" rid="r79">Schellenberg et al. (2005)</xref> I</td>
<td>RT</td>
<td>13</td>
<td>10</td>
<td align="char" char=".">10.5</td>
<td align="char" char=".">6.5</td>
<td>100</td>
<td>0</td>
</tr>
<tr>
<td>9</td>
	<td align="left"><xref ref-type="bibr" rid="r79">Schellenberg et al. (2005)</xref> II</td>
<td>RT</td>
<td>19</td>
<td>17</td>
<td align="char" char=".">10.5</td>
<td align="char" char=".">7.5</td>
<td>47</td>
<td>41</td>
</tr>
<tr>
<td>10</td>
	<td align="left"><xref ref-type="bibr" rid="r79">Schellenberg et al. (2005)</xref> III</td>
<td>RT</td>
<td>22</td>
<td>22</td>
<td align="char" char=".">10.5</td>
<td align="char" char=".">7.5</td>
<td>59</td>
<td>50</td>
</tr>
<tr>
<td>11</td>
	<td align="left"><xref ref-type="bibr" rid="r65">Paananen (2009)</xref>, comp. 1</td>
<td>Harm</td>
<td>12</td>
<td>11</td>
<td align="char" char=".">8.5</td>
<td align="char" char=".">6.5</td>
<td>n/a</td>
<td>n/a</td>
</tr>
<tr>
<td>11</td>
	<td align="left"><xref ref-type="bibr" rid="r65">Paananen (2009)</xref>, comp. 2</td>
<td>Harm</td>
<td>12</td>
<td>11</td>
<td align="char" char=".">10.5</td>
<td>8.5</td>
<td>n/a</td>
<td>n/a</td>
</tr>
<tr>
<td>11</td>
	<td align="left"><xref ref-type="bibr" rid="r65">Paananen (2009)</xref>, comp. 3</td>
<td>Harm</td>
<td>8</td>
<td>12</td>
<td align="char" char=".">14.5</td>
<td align="char" char=".">10.5</td>
<td>n/a</td>
<td>n/a</td>
</tr>
<tr>
<td>12</td>
	<td align="left"><xref ref-type="bibr" rid="r54">Maier-Karius and Schwarzer (2011)</xref>, comp. 1</td>
<td>PT</td>
<td>32</td>
<td>40</td>
<td align="char" char=".">9.5</td>
<td align="char" char=".">6.5</td>
<td>25</td>
<td>18</td>
</tr>
<tr>
<td>15</td>
	<td align="left"><xref ref-type="bibr" rid="r54">Maier-Karius and Schwarzer (2011)</xref><sup>a</sup>, comp. 2</td>
<td>PT</td>
<td>10</td>
<td>32</td>
<td>20</td>
<td align="char" char=".">9.5</td>
<td>100</td>
<td>25</td>
</tr>
<tr>
<td>13</td>
	<td align="left"><xref ref-type="bibr" rid="r38">James et al. (2012)</xref><sup>b</sup></td>
<td>GoF</td>
<td>112</td>
<td>—</td>
<td>6-10</td>
<td>—</td>
<td>n/a</td>
<td>n/a</td>
</tr>
<tr>
<td>14</td>
	<td align="left"><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> I, comp. 1</td>
<td>GoF</td>
<td>24</td>
<td>24</td>
<td>9</td>
<td>7</td>
<td>0</td>
<td>08</td>
</tr>
<tr>
<td>14</td>
	<td align="left"><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> I, comp. 2</td>
<td>GoF</td>
<td>26</td>
<td>24</td>
<td align="char" char=".">10.5</td>
<td>9</td>
<td>0</td>
<td>0</td>
</tr>
<tr>
<td>14</td>
	<td align="left"><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> I, comp. 3</td>
<td>GoF</td>
<td>28</td>
<td>26</td>
<td align="char" char=".">12.5</td>
<td align="char" char=".">10.5</td>
<td>0</td>
<td>0</td>
</tr>
<tr>
<td>14</td>
	<td align="left"><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> I, comp. 4</td>
<td>GoF</td>
<td>20</td>
<td>28</td>
<td>14</td>
<td align="char" char=".">13.5</td>
<td>0</td>
<td>0</td>
</tr>
<tr>
<td>14</td>
	<td align="left"><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> I, comp. 5</td>
<td>GoF</td>
<td>28</td>
<td>28</td>
<td>20</td>
<td>14</td>
<td>0</td>
<td>0</td>
</tr>
<tr>
<td>15</td>
	<td align="left"><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> II, comp. 1</td>
<td>GoF</td>
<td>25</td>
<td>26</td>
<td>9</td>
<td>7</td>
<td>0</td>
<td>0</td>
</tr>
<tr>
<td>15</td>
	<td align="left"><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> II, comp. 2</td>
<td>GoF</td>
<td>19</td>
<td>25</td>
<td>11</td>
<td>9</td>
<td>0</td>
<td>0</td>
</tr>
<tr>
<td>15</td>
	<td align="left"><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref>, II, comp. 3</td>
<td>GoF</td>
<td>23</td>
<td>19</td>
<td>13</td>
<td>11</td>
<td>0</td>
<td>0</td>
</tr>
<tr>
<td>15</td>
	<td align="left"><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> II, comp. 4</td>
<td>GoF</td>
<td>26</td>
<td>23</td>
<td>15</td>
<td>13</td>
<td>0</td>
<td>0</td>
</tr>
<tr>
<td>15</td>
	<td align="left"><xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> II, comp. 5</td>
<td>GoF</td>
<td>26</td>
<td>26</td>
<td>20</td>
<td>15</td>
<td>0</td>
<td>0</td>
</tr>
<tr>
<td>16</td>
	<td align="left"><xref ref-type="bibr" rid="r11">Corrigall et al. (2022)</xref></td>
<td>RT, GoF</td>
<td>49</td>
<td>48</td>
<td align="char" char=".">6.5</td>
<td align="char" char=".">10.5</td>
<td>55</td>
<td>45</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>Note.</italic> comp. = age group comparison in case of multi-arm studies; 1 = youngest group; 2 = next oldest group, etc., up to comp. 5; DV = dependent variable; PT = probe tone rating; PTP = probe tone production (participants played the probe tone on a keyboard); Imp = improvisation; Comp = composition; Harm = harmonization; RT = response time; GoF = goodness-of-fit ratings; Treat = treatment group (older participants); Cont = control group (younger children); <inline-formula><mml:math id="m33"><mml:mi>n</mml:mi><mml:mi> </mml:mi></mml:math></inline-formula>= number of participants in each group; n/a in the columns of musical training: the available information is insufficient to reproduce the number of musically trained participants in each subgroup. Formal musical training is operationalized differently in each study.</p>
<p><sup>a</sup>indicates sudies, in which the mean age for adults was set to 20 years due to insufficient information, in detail, <xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982</xref>, p. 246) reported only undergraduate or graduate students as adults, <xref ref-type="bibr" rid="r54">Maier-Karius and Schwarzer (2011</xref>, p. 172) graduate students, and <xref ref-type="bibr" rid="r81">Schwarzer et al. (1993</xref>, p. 77) provided an age range of 19–45 years. <sup>b</sup>provided only a global effect size for primary school students; therefore, the age of the youngest and oldest participants were coded.</p>
</table-wrap-foot>
</table-wrap>
<p>The control variables differed significantly across studies. Some researchers, such as <xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref>, did not explicitly control for prior formal musical training. In contrast, others, such as <xref ref-type="bibr" rid="r11">Corrigall et al. (2022)</xref>, treated it as a key variable. The participants with formal musical training in each sample ranged from none (coded as 0; <xref ref-type="bibr" rid="r56">Matsunaga et al., 2020</xref>) to all (coded as 1; <xref ref-type="bibr" rid="r54">Maier-Karius &amp; Schwarzer, 2011</xref>). Three studies reported the percentage of musically trained participants only across the sample: <xref ref-type="bibr" rid="r63">Paananen (2003)</xref>, 13.89%; <xref ref-type="bibr" rid="r65">Paananen (2009)</xref>, 13.63%; and <xref ref-type="bibr" rid="r38">James et al. (2012)</xref>, 16.96%. Formal musical training could not be included as a moderator in the statistical model, owing to limited data and a lack of an apparent long-term sampling practice considering these variables (<xref ref-type="bibr" rid="r32">Harrer et al., 2021</xref>)</p>
<p>Study quality was evaluated using various criteria (see Supplemental Material S2), with an average score of <italic>M</italic> = 19.3 (<italic>SD</italic> = 2.3) out of 43. Overall, study quality was relatively homogeneous; however, only one study reported psychometric quality criteria (<xref ref-type="bibr" rid="r99">Wilson &amp; Wales, 1995</xref>).</p>
<sec><title>Bayesian Three-Level Meta-Analysis</title>
<p>We initially estimated a four-level meta-analysis to aggregate effect sizes, as two articles (<xref ref-type="bibr" rid="r56">Matsunaga et al., 2020</xref>; <xref ref-type="bibr" rid="r79">Schellenberg et al., 2005</xref>) reported independent studies, suggesting potential within-article heterogeneity. However, although a comparison between the initial four-level model and a three-level meta-analysis model showed that the Bayes factor, <italic>BF</italic><sub>10</sub> = 1.92, provided insufficient evidence to decisively favor either model (for a general discussion, see <xref ref-type="bibr" rid="r89">van Doorn et al., 2021</xref>), the three-level model was ultimately chosen because of its slightly better data fit and based on the principle of parsimony (<xref ref-type="bibr" rid="r90">Vandekerckhove et al., 2015</xref>). The model comparison did not support further simplifying the model to a random-effects structure<xref ref-type="fn" rid="fn4"><sup>4</sup></xref><fn id="fn4"><label>4</label>
<p>A Bayes factor comparing both models provided strong evidence in favor of the three-level model (<italic>BF</italic><sub>10</sub> = 33,283.83).</p></fn>.</p>
<p>Before interpreting the results, we confirmed model convergence for our three-level structure by conducting posterior predictive checks and examining the <inline-formula><mml:math id="m37"><mml:mover accent="true"><mml:mrow><mml:mi>R</mml:mi></mml:mrow><mml:mo>^</mml:mo></mml:mover></mml:math></inline-formula>-values of the parameter estimates (<xref ref-type="bibr" rid="r32">Harrer et al., 2021</xref>). All <inline-formula><mml:math id="m38"><mml:mover accent="true"><mml:mrow><mml:mi>R</mml:mi></mml:mrow><mml:mo>^</mml:mo></mml:mover></mml:math></inline-formula>-values <inline-formula><mml:math id="m39"><mml:mfenced separators="|"><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>R</mml:mi></mml:mrow><mml:mo>^</mml:mo></mml:mover><mml:mo>≤</mml:mo><mml:mn>1.01</mml:mn></mml:mrow></mml:mfenced></mml:math></inline-formula> indicated successful convergence (<xref ref-type="bibr" rid="r9">Bürkner, 2017</xref>). Additionally, visual inspection confirmed that the posterior distributions aligned with the initial unimodal normal distribution, supporting our assumption of normality (see Appendix Figure A2-1). Sensitivity analyses using different weakly informed priors further support the robustness assumption of our results (<xref ref-type="table" rid="t3">Table 3</xref>).</p>
<table-wrap id="t3" position="anchor" orientation="landscape">
<label>Table 3</label><caption><title>Prior and Posterior Model Parameters of Three-Level Meta-Analysis Model and Sensitivity Analyses</title></caption>
<table frame="hsides" rules="groups">
<col width="15%" align="left"/>
<col width="15%"/>
<col width="15%"/>
<col width="15%"/>
<col width="15%"/>
<col width="25%"/>
<thead>
<tr>
<th valign="bottom" rowspan="3" scope="rowgroup" align="left">Model Parameter</th>
	<th valign="bottom" colspan="2" scope="colgroup">Priors of the Three-Level Model <hr/></th>
	<th valign="bottom" colspan="2" scope="colgroup">Alternatives in Prior Choice<hr/></th>
	<th valign="bottom" rowspan="3" align="left">Conclusions</th>
</tr>
<tr>
<th scope="colgroup">Prior 1</th>
<th>Prior 2</th>
<th>Prior 3</th>
<th>Prior 4</th>
</tr>
<tr>
<th scope="colgroup">N(0, 1)</th>
	<th>HalfCauchy(0, 0.5)</th>
<th>N(0, 0.5)</th>
<th><italic>t</italic>(3, 0, 2.5)</th>
</tr>
</thead>
<tbody>
<tr>
<td>Intercept (µ)</td>
<td><italic>Mdn</italic> = 0.57 (0.37, 0.77)</td>
<td>—</td>
	<td><italic>Mdn</italic> = 0.56 (0.36, 0.75)</td>
<td><italic>Mdn</italic> = 0.58 (0.37, 0.78)</td>
	<td align="left">Small, but practically negligible difference for both estimates. Prior 3 goes along with a slightly different, but insignificant shrinkage of the point estimates towards the center of the prior)</td>
</tr>
	<tr style="transparent-border-top">
<td>Between-study <inline-formula><mml:math id="m48"><mml:mo>(</mml:mo><mml:msub><mml:mrow><mml:mi mathvariant="normal">τ</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:math></inline-formula></td>
<td>—</td>
		<td><italic>Mdn</italic> = 0.20 (0.00, 0.40)</td>
<td><italic>Mdn</italic> = 0.20 (0.04, 0.40)</td>
<td><italic>Mdn</italic> = 0.21 (0.04, 0.42)</td>
	<td align="left">Minor, but practically negligible differences between both parameter estimates. Prior 4 produced a slightly wider 95% credible interval, reflecting marginally more uncertainty.</td>
</tr>
<tr style="transparent-border-top">
<td>Within-study <inline-formula><mml:math id="m52"><mml:mo>(</mml:mo><mml:msub><mml:mrow><mml:mi mathvariant="normal">τ</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:math></inline-formula></td>
<td>—</td>
	<td><italic>Mdn</italic> = 0.43 (0.27, 0.60)</td>
	<td><italic>Mdn</italic> = 0.43 (0.28, 0.60)</td>
	<td><italic>Mdn</italic> = 0.45 (0.27, 0.61)</td>
	<td align="left">Minor, but practically negligible variation across priors.</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
	<p><italic>Note.</italic> Posterior medians (<italic>Mdn</italic>) are used as point estimates; 95% credible intervals are presented in parentheses; for Priors 3 and 4, half-distributions were used for modeling τ<sub>1</sub> and τ<sub>2</sub>.</p>
</table-wrap-foot>
</table-wrap>
<p>We assessed publication bias using a Bayesian Egger test, which indicated a significant intercept (β<sub>1</sub> = 7.46, 95% <italic>CI</italic> [3.12, 11.67]), suggesting potential publication bias. However, previous studies have recommended conducting this approach on a corpus of at least 30 studies because asymmetry tests for standardized mean differences are prone to inflated Type I error rates (<xref ref-type="bibr" rid="r72">Pustejovsky &amp; Rodgers, 2019</xref>; <xref ref-type="bibr" rid="r75">Renkewitz &amp; Keiner, 2019</xref>). A visual inspection of the funnel plot (see Appendix Figure A2-2), showing the standard error of the reported effect sizes as a function of their magnitude, suggests the potential for slight asymmetry; however, this is primarily driven by <xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982</xref>; Study ID 1). Thus, we found no significant evidence of general publication bias caused by selective reporting.</p>
	<p>We further explored potential sources of bias by examining the model-based relationships between μ and τ<sub>1</sub> (<xref ref-type="fig" rid="f2">Figure 2a</xref>), and μ and τ<sub>2</sub> (<xref ref-type="fig" rid="f2">Figure 2b</xref>). Although visual inspection suggested only marginal associations, Pearson correlations revealed statistically significant but negligible effects in both cases: μ and τ<sub>1</sub>, <italic>r</italic>(11998) = -.09, <italic>p</italic> &lt; .001, 95% <italic>CI</italic> (-.11, -.07); μ and τ<sub>2</sub>, <italic>r</italic>(11998) = .08, <italic>p</italic> &lt; .001, 95% <italic>CI</italic> (.06, .10). These results indicated that any potential relationship between effect sizes and heterogeneity is minimal, thus providing little evidence of systematic publication bias.</p>
	
	<fig id="f2" position="anchor" fig-type="figure" orientation="portrait"><label>Figure 2</label><caption>
			<title>Heatmap of the Joint Posterior Distribution of Model Parameters μ (x-axis) and Standard Deviations τ (y-axis)</title><p><italic>Note.</italic> <xref ref-type="fig" rid="f2">Figure 2a</xref> depicts the relationship between μ and τ<sub>1</sub> (between-study standard deviation). <xref ref-type="fig" rid="f2">Figure 2b</xref> shows the relationship between μ and τ<sub>2</sub> (within-study standard deviation). The color gradient reflects the density scale, with higher values (lighter regions) indicating higher density and lower values (darker regions) indicating lower density. Red lines in each plot represent the maximum likelihood point estimates of both parameters.</p></caption><graphic xlink:href="jbdgm.205-f2" position="anchor" orientation="portrait"/></fig>
	

<p>Based on the observed data, hierarchical model, and prior choices, we produced a point estimation for the pooled medium-sized effect (<italic>Mdn</italic><sub><italic>d</italic></sub> = 0.57). As indicated by the credible intervals of the pooled effect size (<xref ref-type="table" rid="t3">Table 3</xref>), we could further conclude that the general so-called “true” effect size—expressed as Cohen’s <italic>d</italic>—reflects a medium to nearly large difference in IRTH sensitivity between younger and older participants. Moreover, the 95% credible interval for the effect lies entirely above zero (0.37, 0.77)<xref ref-type="fn" rid="fn5"><sup>5</sup></xref><fn id="fn5"><label>5</label>
<p>The 95% credible interval (95% CrI) is a highest density interval, i.e., the smallest possible interval containing the probability mass of 95% of the most probable values in the posterior parameter distribution. It represents the region where every point has a higher probability density than any point outside, reflecting the uncertainty in the estimate (<xref ref-type="bibr" rid="r89">van Doorn et al., 2021</xref>, p. 822).</p></fn> along with decisive evidence against a point-null hypothesis (<italic>BF</italic><sub>10</sub> = 11999). We further assess whether the age-related increase in IRTH sensitivity exceeds a negligible magnitude, that is, whether it is neither trivially different from zero nor within the range of a small effect <inline-formula><mml:math id="m74"><mml:mfenced separators="|"><mml:mrow><mml:msub><mml:mrow><mml:mi>H</mml:mi></mml:mrow><mml:mrow><mml:mn>0</mml:mn></mml:mrow></mml:msub><mml:mo>:</mml:mo><mml:mn>0</mml:mn><mml:mi> </mml:mi><mml:mo>≤</mml:mo><mml:mi> </mml:mi><mml:mfenced open="|" close="|" separators="|"><mml:mrow><mml:mi>d</mml:mi></mml:mrow></mml:mfenced><mml:mi> </mml:mi><mml:mo>&lt;</mml:mo><mml:mi> </mml:mi><mml:mn>0.2</mml:mn><mml:mo>,</mml:mo><mml:mi> </mml:mi><mml:msub><mml:mrow><mml:mi>B</mml:mi><mml:mi>F</mml:mi></mml:mrow><mml:mrow><mml:mn>01</mml:mn></mml:mrow></mml:msub><mml:mi> </mml:mi><mml:mo>&gt;</mml:mo><mml:mi> </mml:mi><mml:mn>10</mml:mn></mml:mrow></mml:mfenced></mml:math></inline-formula>. Therefore, we used Bayes factors to quantify the evidence that the result exceeded the small-effect threshold <inline-formula><mml:math id="m75"><mml:mfenced separators="|"><mml:mrow><mml:msub><mml:mrow><mml:mi>H</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>:</mml:mo><mml:mi> </mml:mi><mml:mfenced open="|" close="|" separators="|"><mml:mrow><mml:mi>d</mml:mi></mml:mrow></mml:mfenced><mml:mi> </mml:mi><mml:mo>≥</mml:mo><mml:mi> </mml:mi><mml:mn>0.2</mml:mn><mml:mo>,</mml:mo><mml:mi> </mml:mi><mml:msub><mml:mrow><mml:mi>B</mml:mi><mml:mi>F</mml:mi></mml:mrow><mml:mrow><mml:mn>10</mml:mn></mml:mrow></mml:msub><mml:mi> </mml:mi><mml:mo>&gt;</mml:mo><mml:mi> </mml:mi><mml:mn>10</mml:mn></mml:mrow></mml:mfenced></mml:math></inline-formula> by using a Bayesian model comparison approach. Our analyses revealed a Bayes Factor providing decisive support for the alternative assumption (<italic>BF</italic><sub>10</sub> = 1332.33) indicating that the age-related increase in IRTH sensitivity is unlikely to be marginal. Instead, it should be best interpreted as a substantively meaningful skill-development effect with a high probability of at least medium-to-strong magnitude. We further illustrated the cumulative posterior evidence by plotting the empirical cumulative distribution functions for <inline-formula><mml:math id="m77"><mml:mi mathvariant="normal">µ</mml:mi></mml:math></inline-formula>, <inline-formula><mml:math id="m78"><mml:msub><mml:mrow><mml:mi mathvariant="normal">τ</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:math></inline-formula> and <inline-formula><mml:math id="m79"><mml:msub><mml:mrow><mml:mi mathvariant="normal">τ</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub></mml:math></inline-formula> (see Appendix Figure A2-3) to facilitate the interpretation of the probability that these parameters exceed meaningful thresholds.</p>
<p>Furthermore, based on the hierarchical model and its estimated parameters, we revealed a model with parameter estimates as solution in which at least one effect size estimate from each study falls within the 95% credible interval of the pooled effect size (<xref ref-type="fig" rid="f3">Figure 3</xref>). At first glance, <xref ref-type="bibr" rid="r81">Schwarzer et al. (1993)</xref> appear to be an exception; however, although the point estimates of effect sizes in their study are predicted to fall well outside the 95% credible interval of the pooled effect size, their respective 95% credible intervals still intersect with this range.</p>
	
	<fig id="f3" position="anchor" fig-type="figure" orientation="portrait"><label>Figure 3</label><caption>
			<title>Forest Plot of the Bayesian Three-Level Model With Estimated Effect Sizes of Individual Studies and the Pooled Effect Size</title><p><italic>Note.</italic> The densities represent their respective posterior distributions. Medians serve as point estimates for the effect sizes. Blue shading highlights estimated effect sizes and parts of the posterior distributions that fall within the 95% credible interval of the pooled effect size.</p></caption><graphic xlink:href="jbdgm.205-f3" position="anchor" orientation="portrait"/></fig>
	
	
<p>Although the vast majority of the effect sizes reported in investigated studies fall within the expected 50–80% credible intervals according to our hierarchical model (<xref ref-type="fig" rid="f4">Figure 4</xref>), some observed effect sizes reported by <xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref> deviate from this pattern. Specifically, the results of two studies (ID 11 and ID 12) exhibit exceptionally high effect sizes. Although our model considers these values possible, they are highly unlikely from a statistical standpoint. For example, according to our model, the probability that the estimate for the effect size for ID 12 in <xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref>, denoted as <inline-formula><mml:math id="m80"><mml:msub><mml:mrow><mml:mi mathvariant="normal">θ</mml:mi></mml:mrow><mml:mrow><mml:mn>1,12</mml:mn></mml:mrow></mml:msub></mml:math></inline-formula> in the posterior samples, is greater than or equal to the observed effect size <inline-formula><mml:math id="m81"><mml:mo>(</mml:mo><mml:msub><mml:mrow><mml:mtext>ES</mml:mtext></mml:mrow><mml:mrow><mml:mn>1,12</mml:mn></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mn>3.02</mml:mn><mml:mo>)</mml:mo></mml:math></inline-formula> is relatively low at 2.1%, <inline-formula><mml:math id="m82"><mml:mi>P</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">θ</mml:mi></mml:mrow><mml:mrow><mml:mn>1,12</mml:mn></mml:mrow></mml:msub><mml:mo>≥</mml:mo><mml:msub><mml:mrow><mml:mtext>ES</mml:mtext></mml:mrow><mml:mrow><mml:mn>1,12</mml:mn></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:mi>y</mml:mi><mml:mo>,</mml:mo><mml:mi>M</mml:mi></mml:mrow></mml:mfenced><mml:mo>=</mml:mo><mml:mn>0.021</mml:mn></mml:math></inline-formula>. In contrast, the observed effect size for ID 11 has an even lower probability of occurring, at less than 1% <inline-formula><mml:math id="m83"><mml:mo>(</mml:mo><mml:mi>P</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:msub><mml:mrow><mml:mi>θ</mml:mi></mml:mrow><mml:mrow><mml:mn>1,11</mml:mn></mml:mrow></mml:msub><mml:mo>≥</mml:mo><mml:msub><mml:mrow><mml:mtext>ES</mml:mtext></mml:mrow><mml:mrow><mml:mn>1,11</mml:mn></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:mi>y</mml:mi><mml:mo>,</mml:mo><mml:mi>M</mml:mi></mml:mrow></mml:mfenced><mml:mo>=</mml:mo><mml:mn>0.005</mml:mn><mml:mo>)</mml:mo></mml:math></inline-formula>.</p>
	
	<?figure f3?>
	
	<fig id="f4" position="anchor" fig-type="figure" orientation="portrait"><label>Figure 4</label><caption>
			<title>Model-Based Probability Predictions for the Occurrence of Each Effect Size</title><p><italic>Note.</italic> Whereas the vast majority of effect sizes have a high probability of occurrence based on the model-based expectations, some values have extremely low statistical probability, such as ID 11 and ID 12.</p></caption><graphic xlink:href="jbdgm.205-f4" position="anchor" orientation="portrait"/></fig>

	
<p>The multilevel model revealed significant heterogeneity, divided into between- and within-study heterogeneity. Although the median between-study variance, <inline-formula><mml:math id="m84"><mml:msubsup><mml:mrow><mml:mi mathvariant="normal">τ</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0.04</mml:mn><mml:mo>,</mml:mo><mml:mi mathvariant="normal"> </mml:mi><mml:mn>95</mml:mn><mml:mi mathvariant="normal">%</mml:mi><mml:mi mathvariant="normal"> </mml:mi><mml:mi>C</mml:mi><mml:mi>r</mml:mi><mml:mi>I</mml:mi><mml:mi mathvariant="normal"> </mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>00</mml:mn><mml:mo>,</mml:mo><mml:mi mathvariant="normal"> </mml:mi><mml:mn>0.16</mml:mn></mml:mrow></mml:mfenced><mml:mo>,</mml:mo></mml:math></inline-formula> accounted for only 18% of the total variance, the majority of the heterogeneity (82%) could be attributed to within-study variance, <inline-formula><mml:math id="m85"><mml:msubsup><mml:mrow><mml:mi mathvariant="normal">τ</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0.18</mml:mn><mml:mo>,</mml:mo><mml:mi mathvariant="normal"> </mml:mi><mml:mn>95</mml:mn><mml:mi mathvariant="normal">%</mml:mi><mml:mi mathvariant="normal"> </mml:mi><mml:mi>C</mml:mi><mml:mi>r</mml:mi><mml:mi>I</mml:mi><mml:mi mathvariant="normal"> </mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>07</mml:mn><mml:mo>,</mml:mo><mml:mi mathvariant="normal"> </mml:mi><mml:mn>0.36</mml:mn></mml:mrow></mml:mfenced></mml:math></inline-formula>.</p>
<p>However, differences in age-group compositions across studies prevented us from answering RQ2 using this analytical approach, which is discussed below. Furthermore, RQ3 could only be addressed in an exploratory manner, as the limited number of studies and inconsistent reporting of relevant sample characteristics hindered formal statistical testing. <xref ref-type="table" rid="t2">Table 2</xref> summarizes the proportions of musically trained and untrained individuals across the included samples.</p>
	<p>We addressed RQ4 by examining whether differences in IRTH measurement type could explain the variability in effect sizes. The central goal of a meta-analysis is to account for heterogeneity in the data (<xref ref-type="bibr" rid="r5">Borenstein, 2019</xref>). Therefore, we followed <xref ref-type="bibr" rid="r11">Corrigall et al. (2022)</xref> and introduced a categorical moderator representing six measurement types: probe tone, response time, goodness-of-fit rating, composition, improvisation, and harmonization. The analysis revealed largely overlapping 95% credible intervals and only small differences in posterior means, suggesting that the measurement type had no systematic effect (<xref ref-type="fig" rid="f5">Figure 5</xref>). However, comparing model fit using R<sup>2</sup> values (<xref ref-type="bibr" rid="r34">Hayes, 2022</xref>) showed a slight improvement in the moderated model, <italic>R</italic><sup>2</sup> = .51, 95% <italic>CrI</italic> (.30, .72), compared to the model without a moderator, <italic>R</italic><sup>2</sup> = .48, 95% <italic>CrI</italic> (.27, .70). Although the Bayes factor of <italic>BF</italic><sub>10</sub> = 38.80 indicated a strong statistical preference for the moderated model (<xref ref-type="bibr" rid="r89">van Doorn et al., 2021</xref>), the practical significance of this improvement remained uncertain, given the modest differences in parameter estimates. Therefore, we directly addressed RQ4 by comparing the response time measures with all other operationalizations. These comparisons yielded weak-to-moderate evidence against a systematic difference for goodness-of-fit ratings (<italic>BF</italic><sub>10</sub> = 0.48), harmonization (<italic>BF</italic><sub>10</sub> = 1.00), and improvisation (<italic>BF</italic><sub>10</sub> = 0.84) in lower estimates for response time measures compared to probe tone ratings <inline-formula><mml:math id="m92"><mml:msub><mml:mrow><mml:mo>(</mml:mo><mml:mi>B</mml:mi><mml:mi>F</mml:mi></mml:mrow><mml:mrow><mml:mn>10</mml:mn><mml:mi> </mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi> </mml:mi><mml:mn>12.99</mml:mn><mml:mo>)</mml:mo></mml:math></inline-formula>. Overall, the results indicated smaller effect sizes for response time measurements in probe tone ratings only, with no consistent reduction in effect sizes for response time measurements.</p>
	
	<fig id="f5" position="anchor" fig-type="figure" orientation="portrait"><label>Figure 5</label><caption>
			<title>Posterior Distributions of the Intercept and Moderator Levels of the Bayesian Three-Level Moderated Meta-Analysis</title><p><italic>Note</italic>. Effect sizes are standardized mean differences (<italic>d</italic>). Thin error bars are 50% <italic>CrI</italic> of <italic>d</italic>. Thick error bars indicate 95% <italic>CrI</italic> of <italic>d</italic>.</p></caption><graphic xlink:href="jbdgm.205-f5" position="anchor" orientation="portrait"/></fig>

	
<p>Taken together, these results suggest that response time measurements do not consistently yield lower IRTH sensitivity estimates compared to more explicit operationalizations. Therefore, the current evidence does not support RQ4, except for a notable difference in probe tone ratings.</p>
<p>The observed within- and between-study heterogeneity was likely caused by specific artifacts, such as sample and characteristics. However, we cannot pinpoint these factors more precisely because of the limited information in the primary studies. However, certain possibilities were excluded based on the model comparison analysis presented below.</p>
<p>Thus far, we have reported evidence of a medium-to-strong age-related increase in IRTH sensitivity, although the high variance somewhat obscures this trend. However, these analyses do not clarify whether age-specific learning gains are present, particularly (1) whether acquisition continues beyond age 9 and (2) whether there are sensitive periods during school years that would be reflected in a non-linear learning trajectory. Thus, we conducted further analyses to address these uncertainties.</p></sec>
<sec><title>Model Comparison Analysis</title>
<p>Based on the <italic>AIC</italic>, <italic>BIC</italic>, and <italic>RMSEA</italic> model comparison criteria, the non-linear mixed model best fits <xref ref-type="bibr" rid="r45">Krumhansl and Keil’s (1982)</xref> data (see Appendix Table A1-1), suggesting no linear or sigmoidal increase in IRTH sensitivity between ages 6 and 20. <xref ref-type="fig" rid="f6">Figure 6</xref> shows the age-related development of various IRTH sensitivity outcomes according to the non-linear mixed model. Based on the maximum increase in IRTH sensitivity at age 20 (<italic>k</italic> = 0.08), we concluded that IRTH continues to develop into adulthood and is not fully developed by age 9.</p>
	
	<fig id="f6" position="anchor" fig-type="figure" orientation="portrait"><label>Figure 6</label><caption>
			<title>Development of IRTH Modelled as a Non-Linear Function of Age</title><p><italic>Note</italic>. Standardized mean differences (<italic>d</italic>) as indicator of tonal recognition stability based on reanalyzed cross-sectional data of <xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982</xref>, pp. 247–248) as measured with the two sample tones probe tone paradigm (see section procedure for explanation).</p></caption><graphic xlink:href="jbdgm.205-f6" position="anchor" orientation="portrait"/></fig>
	
<p>Furthermore, the distinct trajectories shown in <xref ref-type="fig" rid="f6">Figure 6</xref> suggest that outcomes may strongly depend on specific task characteristics, even within a single-measurement paradigm. Although the differentiation between pairs of diatonic and non-diatonic tones, as well as the tonic triad versus other diatonic tones, shows a steep increase, more subtle IRTHs, such as the preference for the tonic over other tonic triad tones, show little to no increase, even in adults.</p>

<?figure f6?>

</sec></sec>
<sec sec-type="discussion"><title>Discussion</title>
<p>Our study aimed to synthesize 40 years of research examining the impact of age-related experience with Western tonal music on IRTH acquisition in school-aged children. Additionally, we explored sources of variance both within and between studies to better understand the heterogeneity in study outcomes.</p>
	<p>In a first approach, we aggregated eligible studies in a Bayesian three-level meta-analysis to precisely quantify the mean increase in IRTH sensitivity between younger and older participants. On average, the results indicated a moderate increase in IRTH acquisition during one’s school years, depending on the cognitive demands of the tasks measuring IRTH sensitivity. This finding has significant educational implications. The observed medium effect size supports the implementation of targeted programs (e.g., <xref ref-type="bibr" rid="r25">Government of the UK, Department of Education, 2021</xref>) to enhance tonal sensitivity in school-aged children, as this is sufficiently substantial to be practically relevant for educational initiatives (<xref ref-type="bibr" rid="r33">Hattie, 2012</xref>). Future research should further investigate these acquisitional trajectories and explore potential critical periods beyond the age range covered in our study (<xref ref-type="bibr" rid="r31">Hargreaves &amp; Lamont, 2017</xref>).</p>
<p>Subsequently, we conducted a model comparison of single-study results to explore the timing and potential shapes of learning trajectories within IRTH acquisition as a function of task characteristics. The findings provide converging evidence against early closure models that assume a fixed endpoint of acquisition by age 7 or 9 (<xref ref-type="bibr" rid="r22">Gembris, 2017b</xref>; <xref ref-type="bibr" rid="r24">Gordon, 2012</xref>). Our findings indicate that IRTH sensitivity instead continues to develop through adolescence and into adulthood, supporting gradual or open-ended models of acquisition (e.g., <xref ref-type="bibr" rid="r30">Hargreaves, 1996</xref>) and aligning with neurocognitive and educational frameworks of lifelong learning (<xref ref-type="bibr" rid="r1">Altenmüller, 2022</xref>; <xref ref-type="bibr" rid="r52">Mack et al., 2025</xref>). We also observed improvements among participants without formal musical training, underscoring the role of enculturation and mere exposure (<xref ref-type="bibr" rid="r16">Demorest &amp; Morrison, 2016</xref>). Furthermore, data from participants with ongoing formal training—such as the adult volunteers in <xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref>, who had 7.8 years of musical training on average—indicate that IRTH performance remains trainable beyond early childhood. These patterns suggest a skill development process shaped not only by exposure but also by the cognitive demands of the task. Higher task complexity may require a level of expertise that emerges only through extended, potentially formalized practice. Consequently, the observed plateau effects likely reflect task-specific thresholds rather than universal developmental limits.</p>
<p>A more detailed analysis using a model comparison approach revealed that a task-specific non-linear model best captured the developmental trajectory, a pattern also observed in other musical contexts, such as the development of melody perception (<xref ref-type="bibr" rid="r51">Lin, 2023</xref>). Notably, our analysis revealed substantial differences in IRTH developmental trajectories, which varied not only as a non-linear function of age but also as a function of specific task characteristics. <xref ref-type="bibr" rid="r56">Matsunaga et al. (2020)</xref> also reported variations across tasks, who found that Japanese children recognized Western diatonic tones at age 7 but identified the tonic only at age 13. In contrast, implicit measures of IRTH demonstrated sensitivity to the tonic in ages 6 to 7 (<xref ref-type="bibr" rid="r11">Corrigall et al., 2022</xref>; <xref ref-type="bibr" rid="r79">Schellenberg et al., 2005</xref>), suggesting that implicit processes may precede explicit ones in tonal development (<xref ref-type="bibr" rid="r11">Corrigall et al., 2022</xref>). Neuroscientific (<xref ref-type="bibr" rid="r13">Corrigall &amp; Trainor, 2014</xref>) and behavioral studies using implicit measures (<xref ref-type="bibr" rid="r86">Trainor &amp; Trehub, 1992</xref>) further support the notion that some tonal abilities might develop earlier than others. Our meta-analysis, which focused primarily on explicit tasks, aligns with research showing later acquisition in explicit tonal processing.</p>
<p>However, data from all reviewed studies currently lack sufficient evidence to determine the correlative relationship between the various operationalizations used or whether they can be attributed to a single latent variable (IRTH) to which all prior operationalizations conceptually refer. To date, no statistical examination has been conducted to determine whether all operationalizations capture the same latent variable, assuming that IRTH follows a general factor model. Alternatively, these operationalizations may represent dimensions of a composite factor model or discrete partially uncorrelated constructs associated with different latent variables. A test-theoretical approach would be valuable to address this question across age groups (e.g., <xref ref-type="bibr" rid="r4">Bond &amp; Fox, 2015</xref>), enabling the subsequent examination of developmental trajectories of IRTH in a longitudinal study. Owing to insufficient statistical information in the primary studies, RQ3 regarding the effects of formal musical training on IRTH acquisition could not be answered fully based on the available evidence. However, it can be inferred from our findings that although IRTH sensitivity develops in children without formal musical training (e.g., <xref ref-type="bibr" rid="r56">Matsunaga et al., 2020</xref>), formal musical training may enhance explicit judgments (e.g., <inline-formula><mml:math id="m100"><mml:mi>d</mml:mi><mml:mo>=</mml:mo><mml:mn>1.23</mml:mn></mml:math></inline-formula> for musical experts in <xref ref-type="bibr" rid="r54">Maier-Karius &amp; Schwarzer, 2011</xref>). However, it has minimal impact on implicit response times (e.g., <inline-formula><mml:math id="m101"><mml:mi>d</mml:mi><mml:mo>=</mml:mo><mml:mn>0.68</mml:mn></mml:math></inline-formula> falling within the 95% CrI of the modeled mean in <xref ref-type="bibr" rid="r79">Schellenberg et al., 2005</xref>). This pattern is consistent with <xref ref-type="bibr" rid="r11">Corrigall et al.’s (2022)</xref> findings and is further supported by studies employing productive IRTH operationalizations (e.g., <xref ref-type="bibr" rid="r26">Guilbault, 2009</xref>; <xref ref-type="bibr" rid="r99">Wilson &amp; Wales, 1995</xref>). However, several studies have reported no advantage of formal musical training for goodness-of-fit ratings (<xref ref-type="bibr" rid="r37">James et al., 2015</xref>; <xref ref-type="bibr" rid="r79">Schellenberg et al., 2005</xref>; <xref ref-type="bibr" rid="r84">Stalinski &amp; Schellenberg, 2010</xref>) or observed improvements in implicit measures such as brain function in musically trained participants (<xref ref-type="bibr" rid="r42">Koelsch et al., 2005</xref>; <xref ref-type="bibr" rid="r53">Magne et al., 2006</xref>; <xref ref-type="bibr" rid="r73">Putkinen et al., 2014</xref>; <xref ref-type="bibr" rid="r96">Wehrum et al., 2011</xref>).</p>
<p>Although the limited data prevented us from disentangling the individual contributions of age, informal and formal musical training, and their interactions, our analyses underscore the need for further research in this area. The recurrent absence of data emphasizes the importance of transparent and sustainable research data management (<xref ref-type="bibr" rid="r17">Eerola, 2025</xref>), including practices such as verbatim reporting of instructions, providing original stimuli, reporting means and standard deviations for each condition and treatment group (or supplying raw data), and specifying test quality criteria (e.g., test-retest correlation for repeated measurements). By addressing these aspects, future studies will enable meta-analyses such as ours to be conducted more broadly and provide more precise estimates.</p>
<p>The following limitations should be considered when interpreting the results. Generally, meta-analyses inherit the methodological limitations of primary studies. For example, all included studies used cross-sectional quasi-randomized or observational study designs. Although common in this field (<xref ref-type="bibr" rid="r7">Boutron et al., 2022</xref>), these methods may introduce additional variance (<xref ref-type="bibr" rid="r62">Murad et al., 2016</xref>). Another example is the predominantly low statistical power of the primary studies (<xref ref-type="bibr" rid="r18">Ellis, 2010</xref>). Although meta-analytic weighting procedures account for sampling errors by assigning lower weights to less precise estimates, studies with small samples remain more susceptible to extreme or unstable effect size estimates owing to higher random variability (<xref ref-type="bibr" rid="r32">Harrer et al., 2021</xref>). Therefore, a high proportion of such studies may increase heterogeneity, particularly if their estimates are systematically biased or selectively reported. This highlights the importance of adequately designed and reported primary studies and calls for caution when interpreting highly variable or inconsistent findings stemming from small samples. From a conceptual standpoint, a limitation of our study lies in the treatment of age as an independent variable based on its frequent reporting in several studies. Age influences various cognitive factors, such as maturation, enculturation, exposure, and musical skill acquisition, that are likely to affect IRTH acquisition (<xref ref-type="bibr" rid="r16">Demorest &amp; Morrison, 2016</xref>; <xref ref-type="bibr" rid="r27">Halford, 2014</xref>; <xref ref-type="bibr" rid="r29">Hannon &amp; Trainor, 2007</xref>; <xref ref-type="bibr" rid="r100">Zajonc, 2001</xref>). However, the specific contributions of these factors remain unclear in both the primary studies and our own analyses. For example, formal musical training is known to enhance IRTH (<xref ref-type="bibr" rid="r12">Corrigall &amp; Trainor, 2009</xref>; <xref ref-type="bibr" rid="r43">Kraus &amp; Chandrasekaran, 2010</xref>; <xref ref-type="bibr" rid="r59">Müllensiefen, 2022</xref>; <xref ref-type="bibr" rid="r93">Virtala et al., 2012</xref>) but likely interacts with age and informal musical activities (<xref ref-type="bibr" rid="r48">Lamont, 1998</xref>). Future research should aim to disentangle the contributions of these factors and clarify their interactions to better understand IRTH acquisition. Another limitation is the substantial heterogeneity observed in the Bayesian three-level meta-analysis, which may have obscured the overall effect. This heterogeneity can be primarily attributed to <xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref>.</p>
<p>In summary, although our research question regarding smaller effect sizes for response time measurements compared to other more explicit measurements remains partially unanswered, with probe tone ratings being the exception, the model comparison analysis of <xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref> indicates task-specific differences. Our findings underscore the pivotal influence of task characteristics on IRTH measurements reported over the past 40 years. This aligns with prior research highlighting performance variations stemming from differences in probe tone instructions (<xref ref-type="bibr" rid="r44">Kristop et al., 2020</xref>) and supports insights gained from re-analyses of measurement instruments (<xref ref-type="bibr" rid="r69">Platz et al., 2022</xref>). Reviewing the knowledge gained from 40 years of research in a structured manner is worthwhile because it provides specific insights for the profitable continuation of the research tradition and general findings for appropriately handling data that enable fruitful re-analyses. This discussion highlights key challenges in IRTH research and underscores the importance of employing validated methodological approaches to accurately model and interpret data. Future studies should address these limitations and focus on developing more precise and comprehensive models based on valid measures to better capture the complex dynamics of IRTH development.</p>

</sec>
</body>
<back>
	
	<sec sec-type="ethics-statement">
		<title>Ethics Statement</title>
		<p>No ethical issues and/or ethics approvals need to be disclosed.</p>
	</sec>
	
<app-group>
<app id="app"><title>Appendix</title>
<sec id="secA.1"><title>A1. Table</title>
<table-wrap id="tA.1" position="anchor" orientation="portrait">
<label>Table A1-1</label><caption><title>Comparison of Statistical Models Based on Their Fit to the Data for Describing the Growth Trajectories Observed in <xref ref-type="bibr" rid="r45">Krumhansl and Keil (1982)</xref></title></caption>
<table frame="hsides" rules="groups">
<col width="40%" align="left"/>
<col width="20%"/>
<col width="20%"/>
<col width="20%"/>
<thead>
<tr>
<th>Model</th>
<th>AIC</th>
<th>BIC</th>
<th>RMSEA</th>
</tr>
</thead>
<tbody>
<tr>
<td>Non-linear mixed model</td>
<td align="char" char=".">6.61</td>
<td align="char" char=".">10.60</td>
<td align="char" char=".">0.03</td>
</tr>
<tr>
<td>Logistic model</td>
<td align="char" char=".">39.97</td>
<td align="char" char=".">43.96</td>
<td align="char" char=".">0.09</td>
</tr>
<tr>
<td>Quadratic model</td>
<td align="char" char=".">42.37</td>
<td align="char" char=".">47.35</td>
<td align="char" char=".">0.09</td>
</tr>
<tr>
<td>Cubic model</td>
<td align="char" char=".">44.09</td>
<td align="char" char=".">50.07</td>
<td align="char" char=".">0.09</td>
</tr>
<tr>
<td>Linear model</td>
<td align="char" char=".">47.07</td>
<td align="char" char=".">51.05</td>
<td align="char" char=".">0.09</td>
</tr>
<tr>
<td>Non-linear saturation model</td>
<td align="char" char=".">48.94</td>
<td align="char" char=".">52.92</td>
<td align="char" char=".">0.12</td>
</tr>
<tr>
<td>Sigmoidal model</td>
<td align="char" char=".">49.83</td>
<td align="char" char=".">53.81</td>
<td align="char" char=".">0.17</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>Note.</italic> AIC: Akaike Information Criterion; BIC: Bayesian Information Criterion; RMSEA: Root Mean Square Error of Approximation.</p>
</table-wrap-foot>
</table-wrap></sec>
<sec id="secA.2"><title>A2. Figures</title>
	
	<fig id="fA.2" position="anchor" fig-type="figure" orientation="portrait"><label>Figure A2-1</label><caption>
<title>Posterior Probability Density for Modeled Parameters for the Bayesian Three-Level Model: (a) <inline-formula><mml:math id="m102"><mml:mi mathvariant="bold-italic">μ</mml:mi></mml:math></inline-formula> for the Mean, (b) <inline-formula><mml:math id="m103"><mml:msub><mml:mrow><mml:mi mathvariant="bold-italic">τ</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:math></inline-formula> for Between-Study Standard Deviation, and (c) <inline-formula><mml:math id="m104"><mml:msub><mml:mrow><mml:mi mathvariant="bold-italic">τ</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub></mml:math></inline-formula> for the Within-Study Standard Deviation</title></caption><graphic xlink:href="jbdgm.205-fA2.1" position="anchor" orientation="portrait"/></fig>
	
	<fig id="fA.2___1" position="anchor" fig-type="figure" orientation="portrait"><label>Figure A2-2</label><caption>
			<title>Funnel Plot of Reported Study Estimates by Standard Errors</title><p><italic>Note.</italic> Solid line: modelled mean effect; dashed lines (outer): 95% CI; dotted lines (inner): 80% CI. Each point represents an individual study, color-coded by Study ID.</p></caption><graphic xlink:href="jbdgm.205-fA2.2" position="anchor" orientation="portrait"/></fig>
	

	<fig id="fA.2___2" position="anchor" fig-type="figure" orientation="portrait"><label>Figure A2-3</label><caption>
<title>Empirical Cumulative Probability Function for Modeled Parameters for the Bayesian Three-Level Model: (a) <inline-formula><mml:math id="m105"><mml:mi mathvariant="bold-italic">μ</mml:mi></mml:math></inline-formula> for the Mean, (b) <inline-formula><mml:math id="m106"><mml:msub><mml:mrow><mml:mi mathvariant="bold-italic">τ</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:math></inline-formula> for Between-Study Standard Deviation, and (c) <inline-formula><mml:math id="m107"><mml:msub><mml:mrow><mml:mi mathvariant="bold-italic">τ</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub></mml:math></inline-formula> for the Within-Study Standard Deviation</title></caption><graphic xlink:href="jbdgm.205-fA2.3" position="anchor" orientation="portrait"/></fig></sec>
</app>
</app-group><ack><title>Other Support/Acknowledgement</title>
<p>We would like to thank Editage (<ext-link ext-link-type="uri" xlink:href="http://www.editage.com">www.editage.com</ext-link>) for English language editing.</p></ack>
<ref-list><title>References</title>
<ref id="r1"><mixed-citation publication-type="book">Altenmüller, E. (2022). Brain mechanisms of music learning and performing. In G. E. McPherson (Ed.), <italic>The Oxford handbook of music performance: Development and learning, proficiencies, performance practices, and psychology</italic> (Vol. 2, pp. 157–178). Oxford University Press.<pub-id pub-id-type="doi">10.1093/oxfordhb/9780190056285.013.24</pub-id></mixed-citation></ref>
<ref id="r2"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Asztalos</surname>, <given-names>K.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Csapo</surname>, <given-names>B.</given-names></string-name></person-group> (<year>2017</year>). <article-title>Development of musical abilities: Cross-sectional computer-based assessments in educational contexts.</article-title> <source>Psychology of Music</source>, <volume>45</volume>(<issue>5</issue>), <fpage>682</fpage>–<lpage>698</lpage>. <pub-id pub-id-type="doi">10.1177/0305735616678055</pub-id></mixed-citation></ref>
<ref id="r3"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Bates</surname>, <given-names>D.</given-names></string-name>, <string-name name-style="western"><surname>Mächler</surname>, <given-names>M.</given-names></string-name>, <string-name name-style="western"><surname>Bolker</surname>, <given-names>B.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Walker</surname>, <given-names>S.</given-names></string-name></person-group> (<year>2015</year>). <article-title>Fitting linear mixed-effects models using lme4.</article-title> <source>Journal of Statistical Software</source>, <volume>67</volume>(<issue>1</issue>). <pub-id pub-id-type="doi">10.18637/jss.v067.i01</pub-id></mixed-citation></ref>
<ref id="r4"><mixed-citation publication-type="book">Bond, T., &amp; Fox, C. M. (2015). <italic>Applying the Rasch model: Fundamental measurement in the human sciences</italic> (3rd ed.). Taylor &amp; Francis Group.</mixed-citation></ref>
<ref id="r5"><mixed-citation publication-type="book">Borenstein, M. (2019). Heterogeneity in meta-analysis. In H. Cooper, L. V. Hedges, &amp; J. C. Valentine (Eds.), <italic>The handbook of research synthesis and meta-analysis</italic> (3rd ed., pp. 453–470). Russell Sage Foundation.</mixed-citation></ref>
<ref id="r6"><mixed-citation publication-type="book">Borenstein, M., &amp; Hedges, L. V. (2019). Effect sizes for meta-analysis. In H. Cooper, L. V. Hedges, &amp; J. C. Valentine (Eds.), <italic>The handbook of research synthesis and meta-analysis</italic> (3rd ed., pp. 207–243). Russell Sage Foundation.</mixed-citation></ref>
<ref id="r7"><mixed-citation publication-type="book">Boutron, I., Page, M. J., Higgins, J. P. T., Altman, D. G., Lundh, A., &amp; Hróbjartsson, A. (2022). Chapter 7: Considering bias and conflicts of interest among the included studies. In J. P. T. Higgins, J. Thomas, J. Chandler, M. Chumpston, T. Li, M. J. Page, &amp; V. Welch (Eds.), <italic>Cochrane handbook for systematic reviews of interventions</italic> (Version 6.3, updated February 2022). Cochrane. <ext-link ext-link-type="uri" xlink:href="https://www.cochrane.org/authors/handbooks-and-manuals/handbook/archive/v6.3">https://www.cochrane.org/authors/handbooks-and-manuals/handbook/archive/v6.3</ext-link></mixed-citation></ref>
<ref id="r8"><mixed-citation publication-type="book">Brehmer, F. (1925). <italic>Melodieauffassung und melodische Begabung des Kindes</italic> [Melodic perception and melodic giftedness in the child]. Barth.</mixed-citation></ref>
<ref id="r9"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Bürkner</surname>, <given-names>P.-C.</given-names></string-name></person-group> (<year>2017</year>). <article-title>brms: An R package for Bayesian multilevel models using Stan.</article-title> <source>Journal of Statistical Software</source>, <volume>80</volume>, <fpage>1</fpage>–<lpage>28</lpage>. <pub-id pub-id-type="doi">10.18637/jss.v080.i01</pub-id></mixed-citation></ref>
<ref id="r10"><mixed-citation publication-type="book">Corrigall, K. A., &amp; Schellenberg, E. G. (2016). Music cognition in childhood. In S. Hallam, I. Cross, &amp; M. H. Thaut (Eds.), <italic>The child as musician: A handbook of musical development</italic> (2nd ed., pp. 81–101). Oxford University Press.</mixed-citation></ref>
<ref id="r11"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Corrigall</surname>, <given-names>K. A.</given-names></string-name>, <string-name name-style="western"><surname>Tillmann</surname>, <given-names>B.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Schellenberg</surname>, <given-names>E. G.</given-names></string-name></person-group> (<year>2022</year>). <article-title>Measuring children’s harmonic knowledge with implicit and explicit tests.</article-title> <source>Music Perception</source>, <volume>39</volume>(<issue>4</issue>), <fpage>361</fpage>–<lpage>370</lpage>. <pub-id pub-id-type="doi">10.1525/mp.2022.39.4.361</pub-id></mixed-citation></ref>
<ref id="r12"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Corrigall</surname>, <given-names>K. A.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Trainor</surname>, <given-names>L. J.</given-names></string-name></person-group> (<year>2009</year>). <article-title>Effects of musical training on key and harmonic perception.</article-title> <source>Annals of the New York Academy of Sciences</source>, <volume>1169</volume>(<issue>1</issue>), <fpage>164</fpage>–<lpage>168</lpage>. <pub-id pub-id-type="doi">10.1111/j.1749-6632.2009.04769.x</pub-id><pub-id pub-id-type="pmid">19673773</pub-id></mixed-citation></ref>
<ref id="r13"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Corrigall</surname>, <given-names>K. A.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Trainor</surname>, <given-names>L. J.</given-names></string-name></person-group> (<year>2014</year>). <article-title>Enculturation to musical pitch structure in young children: Evidence from behavioral and electrophysiological methods.</article-title> <source>Developmental Science</source>, <volume>17</volume>(<issue>1</issue>), <fpage>142</fpage>–<lpage>158</lpage>. <pub-id pub-id-type="doi">10.1111/desc.12100</pub-id><pub-id pub-id-type="pmid">24205955</pub-id></mixed-citation></ref>
<ref id="r14"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Cuddy</surname>, <given-names>L. L.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Badertscher</surname>, <given-names>B.</given-names></string-name></person-group> (<year>1987</year>). <article-title>Recovery of the tonal hierarchy: Some comparisons across age and levels of musical experience.</article-title> <source>Perception &amp; Psychophysics</source>, <volume>41</volume>(<issue>6</issue>), <fpage>609</fpage>–<lpage>620</lpage>. <pub-id pub-id-type="doi">10.3758/BF03210493</pub-id></mixed-citation></ref>
<ref id="r15"><mixed-citation publication-type="web">Cui, A.-X. (2019). <italic>Characterizing statistical learning of music</italic> [Dissertation, Queen’s University]. ProQuest Dissertations Publishing. <ext-link ext-link-type="uri" xlink:href="https://www.proquest.com/openview/89fa1699a21bf11f4c790d98c5fcab6a/1?pq-origsite=gscholar&amp;cbl=18750&amp;diss=y">https://www.proquest.com/openview/89fa1699a21bf11f4c790d98c5fcab6a/1?pq-origsite=gscholar&amp;cbl=18750&amp;diss=y</ext-link></mixed-citation></ref>
<ref id="r16"><mixed-citation publication-type="book">Demorest, S. M., &amp; Morrison, S. J. (2016). Quantifying culture: The cultural distance hypothesis of melodic expectancy. In J. Y. Chiao, S.-C. Li, R. Seligman, &amp; R. Turner (Eds.), <italic>The Oxford handbook of cultural neuroscience</italic> (pp. 183–194). Oxford University Press.</mixed-citation></ref>
<ref id="r17"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Eerola</surname>, <given-names>T.</given-names></string-name></person-group> (<year>2025</year>). <article-title>Prevalence of transparency and reproducibility-related research practices in music psychology (2017–2022).</article-title> <source>Musicae Scientiae</source>, <volume>29</volume>(<issue>2</issue>), <fpage>385</fpage>–<lpage>399</lpage>. <pub-id pub-id-type="doi">10.1177/10298649241300885</pub-id></mixed-citation></ref>
<ref id="r18"><mixed-citation publication-type="book">Ellis, P. D. (2010). <italic>The essential guide to effect sizes: Statistical power, meta-analysis, and the interpretation of research results</italic>. Cambridge University Press.</mixed-citation></ref>
<ref id="r19"><mixed-citation publication-type="book">Gardner, H. (1973). <italic>The arts and human development: A psychological study of the artistic process</italic>. John Wiley &amp; Sons.</mixed-citation></ref>
<ref id="r20"><mixed-citation publication-type="book">Gelman, A., Carlin, J. B., Stern, H. S., Dunson, D. B., Vehtari, A., &amp; Rubin, D. B. (2015). <italic>Bayesian data analysis</italic> (3rd ed.). Chapman and Hall/CRC.</mixed-citation></ref>
<ref id="r21"><mixed-citation publication-type="book">Gembris, H. (2017a). Entwicklungstheorien und empirische Befunde [Developmental theories and empirical results]. In H. Gembris (Ed.), <italic>Grundlagen musikalischer Entwicklung und Begabung</italic> (5th ed., pp. 233–265). Wißner.</mixed-citation></ref>
<ref id="r22"><mixed-citation publication-type="book">Gembris, H. (2017b). <italic>Grundlagen musikalischer Begabung und Entwicklung [Foundations of musical giftedness and development]</italic> (5th ed.). Wißner.</mixed-citation></ref>
<ref id="r23"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Gignac</surname>, <given-names>G. E.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Szodorai</surname>, <given-names>E. T.</given-names></string-name></person-group> (<year>2016</year>). <article-title>Effect size guidelines for individual differences researchers.</article-title> <source>Personality and Individual Differences</source>, <volume>102</volume>, <fpage>74</fpage>–<lpage>78</lpage>. <pub-id pub-id-type="doi">10.1016/j.paid.2016.06.069</pub-id></mixed-citation></ref>
<ref id="r24"><mixed-citation publication-type="book">Gordon, E. E. (2012). <italic>Learning sequences in music: A contemporary music learning theory</italic> (8th ed.). Gia Publications.</mixed-citation></ref>
<ref id="r25"><mixed-citation publication-type="web">Government of the UK, Department of Education. (2021). <italic>National curriculum in England: Music programmes of study</italic>. <ext-link ext-link-type="uri" xlink:href="https://www.gov.uk/government/publications/national-curriculum-in-england-music-programmes-of-study/national-curriculum-in-england-music-programmes-of-study">https://www.gov.uk/government/publications/national-curriculum-in-england-music-programmes-of-study/national-curriculum-in-england-music-programmes-of-study</ext-link></mixed-citation></ref>
<ref id="r26"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Guilbault</surname>, <given-names>D. M.</given-names></string-name></person-group> (<year>2009</year>). <article-title>The effects of harmonic accompaniment on the tonal improvisations of students in first through sixth grade.</article-title> <source>Journal of Research in Music Education</source>, <volume>57</volume>(<issue>2</issue>), <fpage>81</fpage>–<lpage>91</lpage>. <pub-id pub-id-type="doi">10.1177/0022429409337201</pub-id></mixed-citation></ref>
<ref id="r27"><mixed-citation publication-type="book">Halford, G. S. (2014). <italic>Children’s understanding: The development of mental models</italic>. Psychology Press.</mixed-citation></ref>
<ref id="r28"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Hanna-Pladdy</surname>, <given-names>B.</given-names></string-name>, &amp; <string-name name-style="western"><surname>MacKay</surname>, <given-names>A.</given-names></string-name></person-group> (<year>2011</year>). <article-title>The relation between instrumental musical activity and cognitive aging.</article-title> <source>Neuropsychology</source>, <volume>25</volume>(<issue>3</issue>), <fpage>378</fpage>–<lpage>386</lpage>. <pub-id pub-id-type="doi">10.1037/a0021895</pub-id><pub-id pub-id-type="pmid">21463047</pub-id></mixed-citation></ref>
<ref id="r29"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Hannon</surname>, <given-names>E. E.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Trainor</surname>, <given-names>L. J.</given-names></string-name></person-group> (<year>2007</year>). <article-title>Music acquisition: Effects of enculturation and formal training on development.</article-title> <source>Trends in Cognitive Sciences</source>, <volume>11</volume>(<issue>11</issue>), <fpage>466</fpage>–<lpage>472</lpage>. <pub-id pub-id-type="doi">10.1016/j.tics.2007.08.008</pub-id><pub-id pub-id-type="pmid">17981074</pub-id></mixed-citation></ref>
<ref id="r30"><mixed-citation publication-type="book">Hargreaves, D. J. (1996). The development of artistic and musical competence. In I. Deliege &amp; J. A. Sloboda (Eds.), <italic>Musical beginnings: Origins and development of musical competence</italic> (pp. 145–170). Oxford University Press.</mixed-citation></ref>
<ref id="r31"><mixed-citation publication-type="book">Hargreaves, D. J., &amp; Lamont, A. (2017). Cognition, perception, and learning. In D. J. Hargreaves &amp; A. Lamont (Eds.), <italic>The psychology of musical development</italic> (1st ed., pp. 14–57). Cambridge University Press. <pub-id pub-id-type="doi">10.1017/9781107281868</pub-id></mixed-citation></ref>
<ref id="r32"><mixed-citation publication-type="web">Harrer, M., Cuijpers, P., Furukawa, T. A., &amp; Ebert, D. D. (2021). <italic>Doing meta-analysis in R: A hands-on guide</italic>. Chapman and Hall/CRC. <ext-link ext-link-type="uri" xlink:href="https://bookdown.org/MathiasHarrer/Doing_Meta_Analysis_in_R/bayesianma.html">https://bookdown.org/MathiasHarrer/Doing_Meta_Analysis_in_R/bayesianma.html</ext-link></mixed-citation></ref>
<ref id="r33"><mixed-citation publication-type="book">Hattie, J. (2012). <italic>Visible learning</italic>. Routledge.</mixed-citation></ref>
<ref id="r34"><mixed-citation publication-type="book">Hayes, A. F. (2022). <italic>Introduction to mediation, moderation, and conditional process analysis: A regression-based approach</italic> (3rd ed.). Guilford Press.</mixed-citation></ref>
<ref id="r35"><mixed-citation publication-type="book">Hedges, L. V. (2019). Stochastically dependent effect sizes. In H. Cooper, L. V. Hedges, &amp; J. C. Valentine (Eds.), <italic>The handbook of research synthesis and meta-analysis</italic> (3rd ed., pp. 281–298). Russell Sage Foundation.</mixed-citation></ref>
<ref id="r36"><mixed-citation publication-type="web">Hyer, B. (2021). <italic>Tonality</italic> [Online Dictionary]. Grove Music Online. <ext-link ext-link-type="uri" xlink:href="https://www.oxfordmusiconline.com/grovemusic/view/10.1093/gmo/9781561592630.001.0001/omo-9781561592630-e-0000028102">https://www.oxfordmusiconline.com/grovemusic/view/10.1093/gmo/9781561592630.001.0001/omo-9781561592630-e-0000028102</ext-link></mixed-citation></ref>
<ref id="r37"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>James</surname>, <given-names>C. E.</given-names></string-name>, <string-name name-style="western"><surname>Cereghetti</surname>, <given-names>D. M.</given-names></string-name>, <string-name name-style="western"><surname>Tribes</surname>, <given-names>E. R.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Oechslin</surname>, <given-names>M. S.</given-names></string-name></person-group> (<year>2015</year>). <article-title>Electrophysiological evidence for a specific neural correlate of musical violation expectation in primary-school children.</article-title> <source>NeuroImage</source>, <volume>104</volume>, <fpage>386</fpage>–<lpage>397</lpage>. <pub-id pub-id-type="doi">10.1016/j.neuroimage.2014.09.047</pub-id><pub-id pub-id-type="pmid">25278251</pub-id></mixed-citation></ref>
<ref id="r38"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>James</surname>, <given-names>C. E.</given-names></string-name>, <string-name name-style="western"><surname>Dupuis-Lozeron</surname>, <given-names>E.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Hauert</surname>, <given-names>C.-A.</given-names></string-name></person-group> (<year>2012</year>). <article-title>Appraisal of musical syntax violations by primary school children: Effects of age and practice.</article-title> <source>Swiss Journal of Psychology</source>, <volume>71</volume>(<issue>3</issue>), <fpage>161</fpage>–<lpage>168</lpage>. <pub-id pub-id-type="doi">10.1024/1421-0185/a000084</pub-id></mixed-citation></ref>
<ref id="r39"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Janata</surname>, <given-names>P.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Reisberg</surname>, <given-names>D.</given-names></string-name></person-group> (<year>1988</year>). <article-title>Response-time measures as a means of exploring tonal hierarchies.</article-title> <source>Music Perception</source>, <volume>6</volume>(<issue>2</issue>), <fpage>161</fpage>–<lpage>172</lpage>. <pub-id pub-id-type="doi">10.2307/40285423</pub-id></mixed-citation></ref>
<ref id="r40"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Jentschke</surname>, <given-names>S.</given-names></string-name>, <string-name name-style="western"><surname>Koelsch</surname>, <given-names>S.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Friederici</surname>, <given-names>A. D.</given-names></string-name></person-group> (<year>2005</year>). <article-title>Investigating the relationship of music and language in children: Influences of musical training and language impairment.</article-title> <source>Annals of the New York Academy of Sciences</source>, <volume>1060</volume>(<issue>1</issue>), <fpage>231</fpage>–<lpage>242</lpage>. <pub-id pub-id-type="doi">10.1196/annals.1360.016</pub-id><pub-id pub-id-type="pmid">16597770</pub-id></mixed-citation></ref>
<ref id="r41"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Jonaitis</surname>, <given-names>E. M.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Saffran</surname>, <given-names>J. R.</given-names></string-name></person-group> (<year>2009</year>). <article-title>Learning harmony: The role of serial statistics.</article-title> <source>Cognitive Science</source>, <volume>33</volume>(<issue>5</issue>), <fpage>951</fpage>–<lpage>968</lpage>. <pub-id pub-id-type="doi">10.1111/j.1551-6709.2009.01036.x</pub-id><pub-id pub-id-type="pmid">21585492</pub-id></mixed-citation></ref>
<ref id="r42"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Koelsch</surname>, <given-names>S.</given-names></string-name>, <string-name name-style="western"><surname>Fritz</surname>, <given-names>T.</given-names></string-name>, <string-name name-style="western"><surname>Schulze</surname>, <given-names>K.</given-names></string-name>, <string-name name-style="western"><surname>Alsop</surname>, <given-names>D.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Schlaug</surname>, <given-names>G.</given-names></string-name></person-group> (<year>2005</year>). <article-title>Adults and children processing music: An fMRI study.</article-title> <source>NeuroImage</source>, <volume>25</volume>(<issue>4</issue>), <fpage>1068</fpage>–<lpage>1076</lpage>. <pub-id pub-id-type="doi">10.1016/j.neuroimage.2004.12.050</pub-id><pub-id pub-id-type="pmid">15850725</pub-id></mixed-citation></ref>
<ref id="r43"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Kraus</surname>, <given-names>N.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Chandrasekaran</surname>, <given-names>B.</given-names></string-name></person-group> (<year>2010</year>). <article-title>Music training for the development of auditory skills.</article-title> <source>Nature Reviews. Neuroscience</source>, <volume>11</volume>(<issue>8</issue>), <fpage>599</fpage>–<lpage>605</lpage>. <pub-id pub-id-type="doi">10.1038/nrn2882</pub-id><pub-id pub-id-type="pmid">20648064</pub-id></mixed-citation></ref>
<ref id="r44"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Kristop</surname>, <given-names>C. A.</given-names></string-name>, <string-name name-style="western"><surname>Moreno</surname>, <given-names>S. J.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Anta</surname>, <given-names>J. F.</given-names></string-name></person-group> (<year>2020</year>). <article-title>What do listeners understand by “continuity” and “closure?” Tracking down the links between tonal expectancy, music training, and conceptualization.</article-title> <source>Psychology of Music</source>, <volume>48</volume>(<issue>3</issue>), <fpage>344</fpage>–<lpage>357</lpage>. <pub-id pub-id-type="doi">10.1177/0305735618803000</pub-id></mixed-citation></ref>
<ref id="r45"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Krumhansl</surname>, <given-names>C. L.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Keil</surname>, <given-names>F. C.</given-names></string-name></person-group> (<year>1982</year>). <article-title>Acquisition of the hierarchy of tonal functions in music.</article-title> <source>Memory &amp; Cognition</source>, <volume>10</volume>(<issue>3</issue>), <fpage>243</fpage>–<lpage>251</lpage>. <pub-id pub-id-type="doi">10.3758/BF03197636</pub-id><pub-id pub-id-type="pmid">7121246</pub-id></mixed-citation></ref>
<ref id="r46"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Krumhansl</surname>, <given-names>C. L.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Kessler</surname>, <given-names>E. J.</given-names></string-name></person-group> (<year>1982</year>). <article-title>Tracing the dynamic changes in perceived tonal organization in a spatial representation of musical keys.</article-title> <source>Psychological Review</source>, <volume>89</volume>(<issue>4</issue>), <fpage>334</fpage>–<lpage>368</lpage>. <pub-id pub-id-type="doi">10.1037/0033-295X.89.4.334</pub-id><pub-id pub-id-type="pmid">7134332</pub-id></mixed-citation></ref>
<ref id="r47"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Krumhansl</surname>, <given-names>C. L.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Shepard</surname>, <given-names>R. N.</given-names></string-name></person-group> (<year>1979</year>). <article-title>Quantification of the hierarchy of tonal functions within a diatonic context.</article-title> <source>Journal of Experimental Psychology. Human Perception and Performance</source>, <volume>5</volume>(<issue>4</issue>), <fpage>579</fpage>–<lpage>594</lpage>. <pub-id pub-id-type="doi">10.1037/0096-1523.5.4.579</pub-id><pub-id pub-id-type="pmid">528960</pub-id></mixed-citation></ref>
<ref id="r48"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Lamont</surname>, <given-names>A.</given-names></string-name></person-group> (<year>1998</year>). <article-title>Music, education, and the development of pitch perception: The role of context, age, and musical experience.</article-title> <source>Psychology of Music</source>, <volume>26</volume>(<issue>1</issue>), <fpage>7</fpage>–<lpage>25</lpage>. <pub-id pub-id-type="doi">10.1177/0305735698261003</pub-id></mixed-citation></ref>
<ref id="r49"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Lamont</surname>, <given-names>A.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Cross</surname>, <given-names>I.</given-names></string-name></person-group> (<year>1994</year>). <article-title>Children’s cognitive representations of musical pitch.</article-title> <source>Music Perception</source>, <volume>12</volume>(<issue>1</issue>), <fpage>27</fpage>–<lpage>55</lpage>. <pub-id pub-id-type="doi">10.2307/40285754</pub-id></mixed-citation></ref>
<ref id="r50"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Landis</surname>, <given-names>J. R.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Koch</surname>, <given-names>G. G.</given-names></string-name></person-group> (<year>1977</year>). <article-title>The measurement of observer agreement for categorical data.</article-title> <source>Biometrics</source>, <volume>33</volume>(<issue>1</issue>), <fpage>159</fpage>–<lpage>174</lpage>. <pub-id pub-id-type="doi">10.2307/2529310</pub-id><pub-id pub-id-type="pmid">843571</pub-id></mixed-citation></ref>
<ref id="r51"><mixed-citation publication-type="confproc">Lin, H.-R. (2023, September 8–10). <italic>Bedeutung von Geschlecht und sozioökonomischem Status für die Entwicklung musikalischer Fähigkeiten bei Jugendlichen: Vorläufige Ergebnisse der Langzeitstudie LongGold</italic> [Relevance of gender and socioeconomic status for the development of musical skills in adolescence: Preliminary results of the longitudinal study LongGold] [Paper presentation]. The 39th annual meeting of the German Society for Music Psychology, Hannover.</mixed-citation></ref>
<ref id="r52"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Mack</surname>, <given-names>M.</given-names></string-name>, <string-name name-style="western"><surname>Marie</surname>, <given-names>D.</given-names></string-name>, <string-name name-style="western"><surname>Worschech</surname>, <given-names>F.</given-names></string-name>, <string-name name-style="western"><surname>Krüger</surname>, <given-names>T. H. C.</given-names></string-name>, <string-name name-style="western"><surname>Sinke</surname>, <given-names>C.</given-names></string-name>, <string-name name-style="western"><surname>Altenmüller</surname>, <given-names>E.</given-names></string-name>, <string-name name-style="western"><surname>James</surname>, <given-names>C. E.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Kliegel</surname>, <given-names>M.</given-names></string-name></person-group> (<year>2025</year>). <article-title>Effects of a 1-year piano intervention on cognitive flexibility in older adults.</article-title> <source>Psychology and Aging</source>, <volume>40</volume>(<issue>2</issue>), <fpage>218</fpage>–<lpage>235</lpage>. <pub-id pub-id-type="doi">10.1037/pag0000871</pub-id><pub-id pub-id-type="pmid">39679985</pub-id></mixed-citation></ref>
<ref id="r53"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Magne</surname>, <given-names>C.</given-names></string-name>, <string-name name-style="western"><surname>Schon</surname>, <given-names>D.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Besson</surname>, <given-names>M.</given-names></string-name></person-group> (<year>2006</year>). <article-title>Musician children detect pitch violations in both music and language better than nonmusician children: Behavioral and electrophysiological approaches.</article-title> <source>Journal of Cognitive Neuroscience</source>, <volume>18</volume>(<issue>2</issue>), <fpage>199</fpage>–<lpage>211</lpage>. <pub-id pub-id-type="doi">10.1162/jocn.2006.18.2.199</pub-id><pub-id pub-id-type="pmid">16494681</pub-id></mixed-citation></ref>
<ref id="r54"><mixed-citation publication-type="book">Maier-Karius, J., &amp; Schwarzer, G. (2011). Die Beziehung zwischen Tonalitätsverstehen und kognitiven Fähigkeiten [The correlation between tonal understanding and cognitive abilities]. In W. Auhagen, C. Bullerjahn, &amp; H. Höge (Eds.), <italic>Jahrbuch der Deutschen Gesellschaft für Musikpsychologie</italic> (Vol. 21, pp. 164–184). Hogrefe. <pub-id pub-id-type="doi">10.23668/psycharchives.2940</pub-id></mixed-citation></ref>
<ref id="r55"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Mandikal Vasuki</surname>, <given-names>P. R.</given-names></string-name>, <string-name name-style="western"><surname>Sharma</surname>, <given-names>M.</given-names></string-name>, <string-name name-style="western"><surname>Demuth</surname>, <given-names>K.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Arciuli</surname>, <given-names>J.</given-names></string-name></person-group> (<year>2016</year>). <article-title>Musicians’ edge: A comparison of auditory processing, cognitive abilities, and statistical learning.</article-title> <source>Hearing Research</source>, <volume>342</volume>, <fpage>112</fpage>–<lpage>123</lpage>. <pub-id pub-id-type="doi">10.1016/j.heares.2016.10.008</pub-id><pub-id pub-id-type="pmid">27770623</pub-id></mixed-citation></ref>
<ref id="r56"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Matsunaga</surname>, <given-names>R.</given-names></string-name>, <string-name name-style="western"><surname>Hartono</surname>, <given-names>P.</given-names></string-name>, <string-name name-style="western"><surname>Yokosawa</surname>, <given-names>K.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Abe</surname>, <given-names>J.</given-names></string-name></person-group> (<year>2020</year>). <article-title>The development of sensitivity to tonality structure of music: Evidence from Japanese children raised in a simultaneous and unbalanced bi-musical environment.</article-title> <source>Music Perception</source>, <volume>37</volume>(<issue>3</issue>), <fpage>225</fpage>–<lpage>239</lpage>. <pub-id pub-id-type="doi">10.1525/mp.2020.37.3.225</pub-id></mixed-citation></ref>
<ref id="r57"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Miles</surname>, <given-names>S. A.</given-names></string-name>, <string-name name-style="western"><surname>Miranda</surname>, <given-names>R. A.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Ullman</surname>, <given-names>M. T.</given-names></string-name></person-group> (<year>2016</year>). <article-title>Sex differences in music: A female advantage at recognizing familiar melodies.</article-title> <source>Frontiers in Psychology</source>, <volume>7</volume>, <elocation-id>278</elocation-id>. <pub-id pub-id-type="doi">10.3389/fpsyg.2016.00278</pub-id><pub-id pub-id-type="pmid">26973574</pub-id></mixed-citation></ref>
<ref id="r58"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Morgan</surname>, <given-names>E.</given-names></string-name>, <string-name name-style="western"><surname>Fogel</surname>, <given-names>A.</given-names></string-name>, <string-name name-style="western"><surname>Nair</surname>, <given-names>A.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Patel</surname>, <given-names>A. D.</given-names></string-name></person-group> (<year>2019</year>). <article-title>Statistical learning and Gestalt-like principles predict melodic expectations.</article-title> <source>Cognition</source>, <volume>189</volume>, <fpage>23</fpage>–<lpage>34</lpage>. <pub-id pub-id-type="doi">10.1016/j.cognition.2018.12.015</pub-id><pub-id pub-id-type="pmid">30913527</pub-id></mixed-citation></ref>
<ref id="r59"><mixed-citation publication-type="web">Müllensiefen, D. (2022, September 2–4). <italic>Die Entwicklung kognitiver und musikalischer Fähigkeiten: Vorläufige Ergebnisse einer Langzeitstudie</italic> [The development of cognitive and musical abilities: Preliminary results from a long-term study] [Paper Presentation]. The 38th annual meeting of the German Society for Music Psychology, Würzburg. <ext-link ext-link-type="uri" xlink:href="https://longgoldstudy.files.wordpress.com/2022/09/dgm2022_muellensiefen-et-al_vorlaeufige-ergebnisse.pdf">https://longgoldstudy.files.wordpress.com/2022/09/dgm2022_muellensiefen-et-al_vorlaeufige-ergebnisse.pdf</ext-link></mixed-citation></ref>
<ref id="r60"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Müllensiefen</surname>, <given-names>D.</given-names></string-name>, <string-name name-style="western"><surname>Elvers</surname>, <given-names>P.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Frieler</surname>, <given-names>K.</given-names></string-name></person-group> (<year>2022</year>). <article-title>Musical development during adolescence: Perceptual skills, cognitive resources, and musical training.</article-title> <source>Annals of the New York Academy of Sciences</source>, <volume>1518</volume>(<issue>1</issue>), <fpage>264</fpage>–<lpage>281</lpage>. <pub-id pub-id-type="doi">10.1111/nyas.14911</pub-id><pub-id pub-id-type="pmid">36251356</pub-id></mixed-citation></ref>
<ref id="r61"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Müllensiefen</surname>, <given-names>D.</given-names></string-name>, <string-name name-style="western"><surname>Gingras</surname>, <given-names>B.</given-names></string-name>, <string-name name-style="western"><surname>Musil</surname>, <given-names>J.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Stewart</surname>, <given-names>L.</given-names></string-name></person-group> (<year>2014</year>). <article-title>The musicality of non-musicians: An index for assessing musical sophistication in the general population.</article-title> <source>PLoS One</source>, <volume>9</volume>(<issue>2</issue>), <elocation-id>e89642</elocation-id>. <pub-id pub-id-type="doi">10.1371/journal.pone.0089642</pub-id><pub-id pub-id-type="pmid">24586929</pub-id></mixed-citation></ref>
<ref id="r62"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Murad</surname>, <given-names>M. H.</given-names></string-name>, <string-name name-style="western"><surname>Asi</surname>, <given-names>N.</given-names></string-name>, <string-name name-style="western"><surname>Alsawas</surname>, <given-names>M.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Alahdab</surname>, <given-names>F.</given-names></string-name></person-group> (<year>2016</year>). <article-title>New evidence pyramid.</article-title> <source>BMJ Evidence-Based Medicine</source>, <volume>21</volume>(<issue>4</issue>), <fpage>125</fpage>–<lpage>127</lpage>. <pub-id pub-id-type="doi">10.1136/ebmed-2016-110401</pub-id><pub-id pub-id-type="pmid">27339128</pub-id></mixed-citation></ref>
<ref id="r63"><mixed-citation publication-type="web">Paananen, P. (2003). <italic>Monta polkua musiikkiin: Tonaalisen musiikin perusrakenteiden kehittyminen musiikin tuottamis- ja improvisaatiotehtävissä ikävuosina 6–11</italic> [Many paths to music: The development of the basic structures of tonal music in music production and improvisation tasks in ages 6–11] [Unpublished doctoral dissertation, University of Jyväskylä, Finland]. <ext-link ext-link-type="uri" xlink:href="http://search.ebscohost.com/login.aspx?direct=true&amp;db=rih&amp;AN=A534346&amp;site=ehost-live">http://search.ebscohost.com/login.aspx?direct=true&amp;db=rih&amp;AN=A534346&amp;site=ehost-live</ext-link></mixed-citation></ref>
<ref id="r64"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Paananen</surname>, <given-names>P.</given-names></string-name></person-group> (<year>2007</year>). <article-title>Melodic improvisation at the age of 6–11 years: Development of pitch and rhythm.</article-title> <source>Musicae Scientiae</source>, <volume>11</volume>(<issue>1</issue>), <fpage>89</fpage>–<lpage>119</lpage>. <pub-id pub-id-type="doi">10.1177/102986490701100104</pub-id></mixed-citation></ref>
<ref id="r65"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Paananen</surname>, <given-names>P.</given-names></string-name></person-group> (<year>2009</year>). <article-title>Children’s and adolescents’ harmonisation of a tonal melody.</article-title> <source>Music Education Research</source>, <volume>11</volume>(<issue>2</issue>), <fpage>153</fpage>–<lpage>174</lpage>. <pub-id pub-id-type="doi">10.1080/14613800902923294</pub-id></mixed-citation></ref>
<ref id="r66"><mixed-citation publication-type="confproc">Patel, A. D. (2021, July 28–21). <italic>Measuring and modeling melodic expectation using singing: Surprising findings and new opportunities for cross-cultural research</italic> [Keynote]. ICMPC16-ESCOM11. Connectivity and diversity in music cognition, University of Sheffield, UK.</mixed-citation></ref>
<ref id="r67"><mixed-citation publication-type="web">Pinheiro, J., &amp; Bates, D. (2024). <italic>nlme: Linear and nonlinear mixed effects models</italic> (Version 3.1–166) [Computer software]. <ext-link ext-link-type="uri" xlink:href="https://CRAN.R-project.org/package=nlme">https://CRAN.R-project.org/package=nlme</ext-link></mixed-citation></ref>
<ref id="r68"><mixed-citation publication-type="book">Piston, W. (1978). <italic>Harmony</italic> (4th ed.). Norton.</mixed-citation></ref>
<ref id="r69"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Platz</surname>, <given-names>F.</given-names></string-name>, <string-name name-style="western"><surname>Kopiez</surname>, <given-names>R.</given-names></string-name>, <string-name name-style="western"><surname>Lehmann</surname>, <given-names>A. C.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Wolf</surname>, <given-names>A.</given-names></string-name></person-group> (<year>2022</year>). <article-title>Measuring audiation or tonal memory? Evaluation of the discriminant validity of Edwin E. Gordon’s “Advanced Measures of Music Audiation.”</article-title>. <source>Music &amp; Science</source>, <volume>5</volume>, <elocation-id>20592043221105270</elocation-id>. <pub-id pub-id-type="doi">10.1177/20592043221105270</pub-id></mixed-citation></ref>
<ref id="r70"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Politimou</surname>, <given-names>N.</given-names></string-name>, <string-name name-style="western"><surname>Douglass-Kirk</surname>, <given-names>P.</given-names></string-name>, <string-name name-style="western"><surname>Pearce</surname>, <given-names>M.</given-names></string-name>, <string-name name-style="western"><surname>Stewart</surname>, <given-names>L.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Franco</surname>, <given-names>F.</given-names></string-name></person-group> (<year>2021</year>). <article-title>Melodic expectations in 5- and 6-year-old children.</article-title> <source>Journal of Experimental Child Psychology</source>, <volume>203</volume>, <elocation-id>105020</elocation-id>. <pub-id pub-id-type="doi">10.1016/j.jecp.2020.105020</pub-id><pub-id pub-id-type="pmid">33271397</pub-id></mixed-citation></ref>
<ref id="r71"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Prince</surname>, <given-names>J. B.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Schmuckler</surname>, <given-names>M. A.</given-names></string-name></person-group> (<year>2014</year>). <article-title>The tonal-metric hierarchy.</article-title> <source>Music Perception</source>, <volume>31</volume>(<issue>3</issue>), <fpage>254</fpage>–<lpage>270</lpage>. <pub-id pub-id-type="doi">10.1525/mp.2014.31.3.254</pub-id></mixed-citation></ref>
<ref id="r72"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Pustejovsky</surname>, <given-names>J. E.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Rodgers</surname>, <given-names>M. A.</given-names></string-name></person-group> (<year>2019</year>). <article-title>Testing for funnel plot asymmetry of standardized mean differences.</article-title> <source>Research Synthesis Methods</source>, <volume>10</volume>(<issue>1</issue>), <fpage>57</fpage>–<lpage>71</lpage>. <pub-id pub-id-type="doi">10.1002/jrsm.1332</pub-id><pub-id pub-id-type="pmid">30506832</pub-id></mixed-citation></ref>
<ref id="r73"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Putkinen</surname>, <given-names>V.</given-names></string-name>, <string-name name-style="western"><surname>Tervaniemi</surname>, <given-names>M.</given-names></string-name>, <string-name name-style="western"><surname>Saarikivi</surname>, <given-names>K.</given-names></string-name>, <string-name name-style="western"><surname>Ojala</surname>, <given-names>P.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Huotilainen</surname>, <given-names>M.</given-names></string-name></person-group> (<year>2014</year>). <article-title>Enhanced development of auditory change detection in musically trained school-aged children: A longitudinal event-related potential study.</article-title> <source>Developmental Science</source>, <volume>17</volume>(<issue>2</issue>), <fpage>282</fpage>–<lpage>297</lpage>. <pub-id pub-id-type="doi">10.1111/desc.12109</pub-id><pub-id pub-id-type="pmid">24283257</pub-id></mixed-citation></ref>
<ref id="r74"><mixed-citation publication-type="web">R Core Team. (2022). <italic>R: A language and environment for statistical computing</italic> (Version 4.2.1) [Computer software]. <ext-link ext-link-type="uri" xlink:href="https://www.R-project.org/">https://www.R-project.org/</ext-link></mixed-citation></ref>
<ref id="r75"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Renkewitz</surname>, <given-names>F.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Keiner</surname>, <given-names>M.</given-names></string-name></person-group> (<year>2019</year>). <article-title>How to detect publication bias in psychological research.</article-title> <source>Zeitschrift für Psychologie</source>, <volume>227</volume>(<issue>4</issue>), <fpage>261</fpage>–<lpage>279</lpage>. <pub-id pub-id-type="doi">10.1027/2151-2604/a000386</pub-id></mixed-citation></ref>
<ref id="r76"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Röver</surname>, <given-names>C.</given-names></string-name></person-group> (<year>2020</year>). <article-title>Bayesian random-effects meta-analysis using the bayesmeta R package.</article-title> <source>Journal of Statistical Software</source>, <volume>93</volume>(<issue>6</issue>), <fpage>1</fpage>–<lpage>51</lpage>. <pub-id pub-id-type="doi">10.18637/jss.v093.i06</pub-id></mixed-citation></ref>
<ref id="r77"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Saffran</surname>, <given-names>J. R.</given-names></string-name>, <string-name name-style="western"><surname>Johnson</surname>, <given-names>E. K.</given-names></string-name>, <string-name name-style="western"><surname>Aslin</surname>, <given-names>R. N.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Newport</surname>, <given-names>E. L.</given-names></string-name></person-group> (<year>1999</year>). <article-title>Statistical learning of tone sequences by human infants and adults.</article-title> <source>Cognition</source>, <volume>70</volume>(<issue>1</issue>), <fpage>27</fpage>–<lpage>52</lpage>. <pub-id pub-id-type="doi">10.1016/S0010-0277(98)00075-4</pub-id><pub-id pub-id-type="pmid">10193055</pub-id></mixed-citation></ref>
<ref id="r78"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Sauvé</surname>, <given-names>S. A.</given-names></string-name>, <string-name name-style="western"><surname>Cho</surname>, <given-names>A.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Zendel</surname>, <given-names>B. R.</given-names></string-name></person-group> (<year>2021</year>). <article-title>Mapping tonal hierarchy in the brain.</article-title> <source>Neuroscience</source>, <volume>465</volume>, <fpage>187</fpage>–<lpage>202</lpage>. <pub-id pub-id-type="doi">10.1016/j.neuroscience.2021.03.019</pub-id><pub-id pub-id-type="pmid">33774126</pub-id></mixed-citation></ref>
<ref id="r79"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Schellenberg</surname>, <given-names>E. G.</given-names></string-name>, <string-name name-style="western"><surname>Bigand</surname>, <given-names>E.</given-names></string-name>, <string-name name-style="western"><surname>Poulin-Charronnat</surname>, <given-names>B.</given-names></string-name>, <string-name name-style="western"><surname>Garnier</surname>, <given-names>C.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Stevens</surname>, <given-names>C.</given-names></string-name></person-group> (<year>2005</year>). <article-title>Children’s implicit knowledge of harmony in western music.</article-title> <source>Developmental Science</source>, <volume>8</volume>(<issue>6</issue>), <fpage>551</fpage>–<lpage>566</lpage>. <pub-id pub-id-type="doi">10.1111/j.1467-7687.2005.00447.x</pub-id><pub-id pub-id-type="pmid">16246247</pub-id></mixed-citation></ref>
<ref id="r80"><mixed-citation publication-type="book">Schmuckler, M. A. (2016). Tonality and contour in melodic processing. In S. Hallam, I. Cross, &amp; M. H. Thaut (Eds.), <italic>The Oxford handbook of music psychology</italic> (2nd ed., pp. 143–165). Oxford University Press.</mixed-citation></ref>
<ref id="r81"><mixed-citation publication-type="book">Schwarzer, G., Siegiesmund, A., &amp; Wilkening, F. (1993). Entwicklung des Tonalitätsverstehens bei der Beurteilung und Produktion von Liedschlüssen [Development of tonal understanding measured by ratings and productions of song endings]. In K.-E. Behne, G. Kleinen, &amp; H. de La Motte-Haber (Eds.), <italic>Jahrbuch der Deutschen Gesellschaft für Musikpsychologie. Empirische Forschungen—Ästhetische Experimente</italic> (Vol. 10, pp. 75–90). Florian Noetzel.</mixed-citation></ref>
<ref id="r82"><mixed-citation publication-type="book">Serafine, M. L. (1988). <italic>Music as cognition: The development of thought in sound</italic>. Columbia University Press.</mixed-citation></ref>
<ref id="r83"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Speer</surname>, <given-names>J. R.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Meeks</surname>, <given-names>P. U.</given-names></string-name></person-group> (<year>1985</year>). <article-title>School children’s perception of pitch in music.</article-title> <source>Psychomusicology: Music, Mind, and Brain</source>, <volume>5</volume>(<issue>1</issue>), <fpage>49</fpage>–<lpage>56</lpage>. <pub-id pub-id-type="doi">10.1037/h0094200</pub-id></mixed-citation></ref>
<ref id="r84"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Stalinski</surname>, <given-names>S. M.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Schellenberg</surname>, <given-names>E. G.</given-names></string-name></person-group> (<year>2010</year>). <article-title>Shifting perceptions: Developmental changes in judgments of melodic similarity.</article-title> <source>Developmental Psychology</source>, <volume>46</volume>(<issue>6</issue>), <fpage>1799</fpage>–<lpage>1803</lpage>. <pub-id pub-id-type="doi">10.1037/a0020658</pub-id><pub-id pub-id-type="pmid">20822211</pub-id></mixed-citation></ref>
<ref id="r85"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Swanwick</surname>, <given-names>K.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Tillman</surname>, <given-names>J.</given-names></string-name></person-group> (<year>1986</year>). <article-title>The sequence of musical development: A study of children’s composition.</article-title> <source>British Journal of Music Education</source>, <volume>3</volume>(<issue>3</issue>), <fpage>305</fpage>–<lpage>339</lpage>. <pub-id pub-id-type="doi">10.1017/S0265051700000814</pub-id></mixed-citation></ref>
<ref id="r86"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Trainor</surname>, <given-names>L. J.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Trehub</surname>, <given-names>S. E.</given-names></string-name></person-group> (<year>1992</year>). <article-title>A comparison of infants’ and adults’ sensitivity to western musical structure.</article-title> <source>Journal of Experimental Psychology. Human Perception and Performance</source>, <volume>18</volume>(<issue>2</issue>), <fpage>394</fpage>–<lpage>402</lpage>. <pub-id pub-id-type="doi">10.1037/0096-1523.18.2.394</pub-id><pub-id pub-id-type="pmid">1593226</pub-id></mixed-citation></ref>
<ref id="r87"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Trehub</surname>, <given-names>S. E.</given-names></string-name>, <string-name name-style="western"><surname>Schellenberg</surname>, <given-names>E. G.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Kamenetsky</surname>, <given-names>S. B.</given-names></string-name></person-group> (<year>1999</year>). <article-title>Infants’ and adults’ perception of scale structure.</article-title> <source>Journal of Experimental Psychology. Human Perception and Performance</source>, <volume>25</volume>(<issue>4</issue>), <fpage>965</fpage>–<lpage>975</lpage>. <pub-id pub-id-type="doi">10.1037/0096-1523.25.4.965</pub-id><pub-id pub-id-type="pmid">10464941</pub-id></mixed-citation></ref>
<ref id="r88"><mixed-citation publication-type="book">Turner, R. M., &amp; Higgins, J. P. T. (2019). Bayesian meta-analysis. In H. Cooper, L. V. Hedges, &amp; J. C. Valentine (Eds.), <italic>The handbook of research synthesis and meta-analysis</italic> (3rd ed., pp. 299–314). Russell Sage Foundation.</mixed-citation></ref>
<ref id="r89"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>van Doorn</surname> , <given-names>J.</given-names></string-name>, <string-name name-style="western"><surname>van den Bergh</surname>, <given-names>D.</given-names></string-name>, <string-name name-style="western"><surname>Böhm</surname>, <given-names>U.</given-names></string-name>, <string-name name-style="western"><surname>Dablander</surname>, <given-names>F.</given-names></string-name>, <string-name name-style="western"><surname>Derks</surname>, <given-names>K.</given-names></string-name>, <string-name name-style="western"><surname>Draws</surname>, <given-names>T.</given-names></string-name>, <string-name name-style="western"><surname>Etz</surname>, <given-names>A.</given-names></string-name>, <string-name name-style="western"><surname>Evans</surname>, <given-names>N. J.</given-names></string-name>, <string-name name-style="western"><surname>Gronau</surname>, <given-names>Q. F.</given-names></string-name>, <string-name name-style="western"><surname>Haaf</surname>, <given-names>J. M.</given-names></string-name>, <string-name name-style="western"><surname>Hinne</surname>, <given-names>M.</given-names></string-name>, <string-name name-style="western"><surname>Kucharský</surname>, <given-names>Š.</given-names></string-name>, <string-name name-style="western"><surname>Ly</surname>, <given-names>A.</given-names></string-name>, <string-name name-style="western"><surname>Marsman</surname>, <given-names>M.</given-names></string-name>, <string-name name-style="western"><surname>Matzke</surname>, <given-names>D.</given-names></string-name>, <string-name name-style="western"><surname>Gupta</surname>, <given-names>A. R. K. N.</given-names></string-name>, <string-name name-style="western"><surname>Sarafoglou</surname>, <given-names>A.</given-names></string-name>, <string-name name-style="western"><surname>Stefan</surname>, <given-names>A.</given-names></string-name>, <string-name name-style="western"><surname>Voelkel</surname>, <given-names>J. G.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Wagenmakers</surname>, <given-names>E.-J.</given-names></string-name></person-group> (<year>2021</year>). <article-title>The JASP guidelines for conducting and reporting a Bayesian analysis.</article-title> <source>Psychonomic Bulletin and Review</source>, <volume>28</volume>(<issue>3</issue>), <fpage>813</fpage>–<lpage>826</lpage>. <pub-id pub-id-type="doi">10.3758/s13423-020-01798-5</pub-id></mixed-citation></ref>
<ref id="r90"><mixed-citation publication-type="book">Vandekerckhove, J., Matzke, D., &amp; Wagenmakers, E.-J. (2015). Model comparison and the principle of parsimony. In J. R. Busemeyer, Z. Wang, J. T. Townsend, &amp; A. Eidels (Eds.), <italic>Model comparison and the principle of parsimony</italic> (Vol. 1, pp. 300–319). Oxford University Press. <pub-id pub-id-type="doi">10.1093/oxfordhb/9780199957996.013.14</pub-id></mixed-citation></ref>
<ref id="r91"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Verosky</surname>, <given-names>N. J.</given-names></string-name></person-group> (<year>2021</year>). <article-title>Interpreting the tonal hierarchy through corpus analysis.</article-title> <source>Psychomusicology: Music, Mind, and Brain</source>, <volume>31</volume>(<issue>2</issue>), <fpage>96</fpage>–<lpage>106</lpage>. <pub-id pub-id-type="doi">10.1037/pmu0000276</pub-id></mixed-citation></ref>
<ref id="r92"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Viechtbauer</surname>, <given-names>W.</given-names></string-name></person-group> (<year>2010</year>). <article-title>Conducting meta-analyses in R with the metafor package.</article-title> <source>Journal of Statistical Software</source>, <volume>36</volume>(<issue>3</issue>). <pub-id pub-id-type="doi">10.18637/jss.v036.i03</pub-id><pub-id pub-id-type="pmid">20808728</pub-id></mixed-citation></ref>
<ref id="r93"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Virtala</surname>, <given-names>P.</given-names></string-name>, <string-name name-style="western"><surname>Huotilainen</surname>, <given-names>M.</given-names></string-name>, <string-name name-style="western"><surname>Putkinen</surname>, <given-names>V.</given-names></string-name>, <string-name name-style="western"><surname>Makkonen</surname>, <given-names>T.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Tervaniemi</surname>, <given-names>M.</given-names></string-name></person-group> (<year>2012</year>). <article-title>Musical training facilitates the neural discrimination of major versus minor chords in 13-year-old children.</article-title> <source>Psychophysiology</source>, <volume>49</volume>(<issue>8</issue>), <fpage>1125</fpage>–<lpage>1132</lpage>. <pub-id pub-id-type="doi">10.1111/j.1469-8986.2012.01386.x</pub-id><pub-id pub-id-type="pmid">22681183</pub-id></mixed-citation></ref>
<ref id="r94"><mixed-citation publication-type="book">von Helmholtz, H. (1896). <italic>Die Lehre von den Tonempfindungen als physiologische Grundlage für die Theorie der Musik</italic> [On the sensations of tone as a physiological basis for the theory of music] (5th ed.). Friedrich Vieweg und Sohn.</mixed-citation></ref>
<ref id="r95"><mixed-citation publication-type="book">Vuvan, D. T. A. (2013). <italic>The statistical learning of musical expectancy</italic> [Doctoral dissertation]. University of Toronto (Canada). <ext-link ext-link-type="uri" xlink:href="https://utoronto.scholaris.ca/server/api/core/bitstreams/fc3e21ef-4769-4fb1-9475-684fb229f7cf/content">https://utoronto.scholaris.ca/server/api/core/bitstreams/fc3e21ef-4769-4fb1-9475-684fb229f7cf/content</ext-link></mixed-citation></ref>
<ref id="r96"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Wehrum</surname>, <given-names>S.</given-names></string-name>, <string-name name-style="western"><surname>Degé</surname>, <given-names>F.</given-names></string-name>, <string-name name-style="western"><surname>Ott</surname>, <given-names>U.</given-names></string-name>, <string-name name-style="western"><surname>Walter</surname>, <given-names>B.</given-names></string-name>, <string-name name-style="western"><surname>Stippekohl</surname>, <given-names>B.</given-names></string-name>, <string-name name-style="western"><surname>Kagerer</surname>, <given-names>S.</given-names></string-name>, <string-name name-style="western"><surname>Schwarzer</surname>, <given-names>G.</given-names></string-name>, <string-name name-style="western"><surname>Vaitl</surname>, <given-names>D.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Stark</surname>, <given-names>R.</given-names></string-name></person-group> (<year>2011</year>). <article-title>Can you hear a difference? Neuronal correlates of melodic deviance processing in children.</article-title> <source>Brain Research</source>, <volume>1402</volume>, <fpage>80</fpage>–<lpage>92</lpage>. <pub-id pub-id-type="doi">10.1016/j.brainres.2011.05.057</pub-id><pub-id pub-id-type="pmid">21676378</pub-id></mixed-citation></ref>
<ref id="r97"><mixed-citation publication-type="web">What Works Clearinghouse. (2020). <italic>What Works Clearinghouse<sup>TM</sup> procedures handbook, Version 4.1</italic>. U.S. Department of Education, Institute of Education Science, National Center for Education Evaluation and Regional Assistance. <ext-link ext-link-type="uri" xlink:href="https://ies.ed.gov/ncee/wwc/Docs/referenceresources/WWC-Procedures-Handbook-v4-1-508.pdf">https://ies.ed.gov/ncee/wwc/Docs/referenceresources/WWC-Procedures-Handbook-v4-1-508.pdf</ext-link></mixed-citation></ref>
<ref id="r98"><mixed-citation publication-type="preprint">Williams, D. R., Rast, P., &amp; Bürkner, P.-C. (2018). <italic>Bayesian meta-analysis with weakly informative prior distributions</italic>. PsyArXiv. <pub-id pub-id-type="doi">10.31234/osf.io/7tbrm</pub-id></mixed-citation></ref>
<ref id="r99"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Wilson</surname>, <given-names>S. J.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Wales</surname>, <given-names>R. J.</given-names></string-name></person-group> (<year>1995</year>). <article-title>An exploration of children’s musical compositions.</article-title> <source>Journal of Research in Music Education</source>, <volume>43</volume>(<issue>2</issue>), <fpage>94</fpage>–<lpage>111</lpage>. <pub-id pub-id-type="doi">10.2307/3345672</pub-id></mixed-citation></ref>
<ref id="r100"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Zajonc</surname>, <given-names>R. B.</given-names></string-name></person-group> (<year>2001</year>). <article-title>Mere exposure: A gateway to the subliminal.</article-title> <source>Current Directions in Psychological Science</source>, <volume>10</volume>(<issue>6</issue>), <fpage>224</fpage>–<lpage>228</lpage>. <pub-id pub-id-type="doi">10.1111/1467-8721.00154</pub-id></mixed-citation></ref>
<ref id="r101"><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name name-style="western"><surname>Zhang</surname>, <given-names>J. D.</given-names></string-name>, <string-name name-style="western"><surname>Susino</surname>, <given-names>M.</given-names></string-name>, <string-name name-style="western"><surname>McPherson</surname>, <given-names>G. E.</given-names></string-name>, &amp; <string-name name-style="western"><surname>Schubert</surname>, <given-names>E.</given-names></string-name></person-group> (<year>2020</year>). <article-title>The definition of a musician in music psychology: A literature review and the six-year rule.</article-title> <source>Psychology of Music</source>, <volume>48</volume>(<issue>3</issue>), <fpage>389</fpage>–<lpage>409</lpage>. <pub-id pub-id-type="doi">10.1177/0305735618804038</pub-id></mixed-citation></ref>
</ref-list>
	<sec sec-type="data-availability" id="das"><title>Data Availability</title>
		<p>For this article, data and codebook are freely available (see <xref ref-type="bibr" rid="sp1_r1">Mütze et al., 2025a</xref>).</p>
	</sec>	

	
	
	
	<sec sec-type="supplementary-material" id="sp1"><title>Supplementary Materials</title>
		<p>For this article, the following Supplementary Materials are available:</p>
		
		<list list-type="bullet">
			<list-item><p>the raw data of the effect sizes, additionally coded variables of the meta-analysis (“Supplemental Material S4”), the raw data of the model comparison analysis (“Supplemental Material S7”) as well as the associated codebooks (see <xref ref-type="bibr" rid="sp1_r1">Mütze et al., 2025a</xref>)</p></list-item>
			<list-item><p>the R markdown with the code of the associated statistical analyses of the meta-analysis (“Supplemental Material S5”) as well as the R markdown with the code for the associated statistical analysis of the model comparison analysis (“Supplemental Material S8”) (see <xref ref-type="bibr" rid="sp1_r2">Mütze et al., 2025b</xref>)</p></list-item>
			<list-item><p>the review protocol (referred to as “Supplemental Material S1” in the manuscript), the coding protocol (“Supplemental Material S2”), the methods of effect size calculations (“Supplemental Material S3”), and the formal description of the mathematical model (“Supplemental Material S6”) (see <xref ref-type="bibr" rid="sp1_r3">Mütze et al., 2025c</xref>)</p></list-item>
			<list-item><p>the Scatterplot (“Supplemental Material S9”) (see <xref ref-type="bibr" rid="sp1_r4">Mütze et al., 2025d</xref>)</p></list-item>
		</list>
		
		
		<ref-list content-type="supplementary-material" id="suppl-ref-list">
			<ref id="sp1_r1">
				<mixed-citation publication-type="supplementary-material">
					<person-group person-group-type="author">
							<name name-style="western">
								<surname>Mütze</surname>
								<given-names>H.</given-names>
							</name>
							<name name-style="western">
								<surname>Platz</surname>
								<given-names>F.</given-names>
							</name>
							<name name-style="western">
								<surname>Busch</surname>
								<given-names>V.</given-names>
							</name>
					</person-group> (<year>2025a</year>). <source>Supplementary materials to "The acquisition of tonal hierarchies in western music during school years: A re-analysis of 40 years of research"</source> <comment>[Data, codebook]</comment>. <publisher-name>PsychArchives</publisher-name>. <pub-id pub-id-type="doi" xlink:href="https://doi.org/10.23668/psycharchives.21181">10.23668/psycharchives.21181</pub-id>		
				</mixed-citation>
			</ref>
			
			
			<ref id="sp1_r2">
				<mixed-citation publication-type="supplementary-material">
					<person-group person-group-type="author">
						<name name-style="western">
							<surname>Mütze</surname>
							<given-names>H.</given-names>
						</name>
						<name name-style="western">
							<surname>Platz</surname>
							<given-names>F.</given-names>
						</name>
						<name name-style="western">
							<surname>Busch</surname>
							<given-names>V.</given-names>
						</name>
					</person-group> (<year>2025b</year>). <source>Supplementary materials to "The acquisition of tonal hierarchies in western music during school years: A re-analysis of 40 years of research"</source> <comment>[Code]</comment>. <publisher-name>PsychArchives</publisher-name>. <pub-id pub-id-type="doi" xlink:href="https://doi.org/10.23668/psycharchives.21336">10.23668/psycharchives.21336</pub-id>		
				</mixed-citation>
			</ref>
			
			<ref id="sp1_r3">
				<mixed-citation publication-type="supplementary-material">
					<person-group person-group-type="author">
						<name name-style="western">
							<surname>Mütze</surname>
							<given-names>H.</given-names>
						</name>
						<name name-style="western">
							<surname>Platz</surname>
							<given-names>F.</given-names>
						</name>
						<name name-style="western">
							<surname>Busch</surname>
							<given-names>V.</given-names>
						</name>
					</person-group> (<year>2025c</year>). <source>Supplementary materials to "The acquisition of tonal hierarchies in western music during school years: A re-analysis of 40 years of research"</source> <comment>[Protocols, additional materials]</comment>. <publisher-name>PsychArchives</publisher-name>. <pub-id pub-id-type="doi" xlink:href="https://doi.org/10.23668/psycharchives.21183">10.23668/psycharchives.21183</pub-id>		
				</mixed-citation>
			</ref>
			
			<ref id="sp1_r4">
				<mixed-citation publication-type="supplementary-material">
					<person-group person-group-type="author">
						<name name-style="western">
							<surname>Mütze</surname>
							<given-names>H.</given-names>
						</name>
						<name name-style="western">
							<surname>Platz</surname>
							<given-names>F.</given-names>
						</name>
						<name name-style="western">
							<surname>Busch</surname>
							<given-names>V.</given-names>
						</name>
					</person-group> (<year>2025d</year>). <source>Supplementary materials to "The acquisition of tonal hierarchies in western music during school years: A re-analysis of 40 years of research"</source> <comment>[Scatterplot]</comment>. <publisher-name>PsychArchives</publisher-name>. <pub-id pub-id-type="doi" xlink:href="https://doi.org/10.23668/psycharchives.21184">10.23668/psycharchives.21184</pub-id>		
				</mixed-citation>
			</ref>
		</ref-list>
	</sec>
			

<fn-group>
<fn fn-type="financial-disclosure"><p>The authors have no funding to report.</p></fn>
</fn-group>
<fn-group>
<fn fn-type="conflict"><p>The authors have declared that no competing interests exist.</p></fn>
</fn-group>
</back>
</article>
