<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Hum. Neurosci.</journal-id>
<journal-title>Frontiers in Human Neuroscience</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Hum. Neurosci.</abbrev-journal-title>
<issn pub-type="epub">1662-5161</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fnhum.2017.00481</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Neuroscience</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Characterizing Neural Entrainment to Hierarchical Linguistic Units using Electroencephalography (EEG)</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Ding</surname> <given-names>Nai</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/111510/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Melloni</surname> <given-names>Lucia</given-names></name>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref>
<xref ref-type="aff" rid="aff8"><sup>8</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/32689/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Yang</surname> <given-names>Aotian</given-names></name>
<xref ref-type="aff" rid="aff9"><sup>9</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Yu</given-names></name>
<xref ref-type="aff" rid="aff10"><sup>10</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/435453/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname> <given-names>Wen</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Poeppel</surname> <given-names>David</given-names></name>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
<xref ref-type="aff" rid="aff9"><sup>9</sup></xref>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>College of Biomedical Engineering and Instrument Sciences, Zhejiang University</institution>, <addr-line>Hangzhou</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>State Key Laboratory of Industrial Control Technology, Zhejiang University</institution>, <addr-line>Hangzhou</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>Key Laboratory for Biomedical Engineering of Ministry of Education, Zhejiang University</institution>, <addr-line>Hangzhou</addr-line>, <country>China</country></aff>
<aff id="aff4"><sup>4</sup><institution>Interdisciplinary Center for Social Sciences, Zhejiang University</institution>, <addr-line>Hangzhou</addr-line>, <country>China</country></aff>
<aff id="aff5"><sup>5</sup><institution>Neuro and Behavior EconLab, Zhejiang University of Finance and Economics</institution>, <addr-line>Hangzhou</addr-line>, <country>China</country></aff>
<aff id="aff6"><sup>6</sup><institution>Neuroscience Department, Max-Planck Institute for Empirical Aesthetics</institution>, <addr-line>Frankfurt</addr-line>, <country>Germany</country></aff>
<aff id="aff7"><sup>7</sup><institution>Department of Neurology, New York University Langone Medical Center</institution>, <addr-line>New York, NY</addr-line>, <country>United States</country></aff>
<aff id="aff8"><sup>8</sup><institution>Department of Neurophysiology, Max-Planck Institute for Brain Research</institution>, <addr-line>Frankfurt</addr-line>, <country>Germany</country></aff>
<aff id="aff9"><sup>9</sup><institution>Department of Psychology, New York University</institution>, <addr-line>New York, NY</addr-line>, <country>United States</country></aff>
<aff id="aff10"><sup>10</sup><institution>School of Computer and Information Engineering, Zhejiang Gongshang University</institution>, <addr-line>Hangzhou</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Qing Cai, East China Normal University, China</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Liping Wang, Institute of Neuroscience, Shanghai, Chinese Academy of Sciences, China; Milene Bonte, Maastricht University, Netherlands</p></fn>
<fn fn-type="corresp" id="fn001"><p>&#x0002A;Correspondence: Nai Ding <email>ding_nai&#x00040;zju.edu.cn</email></p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>28</day>
<month>09</month>
<year>2017</year>
</pub-date>
<pub-date pub-type="collection">
<year>2017</year>
</pub-date>
<volume>11</volume>
<elocation-id>481</elocation-id>
<history>
<date date-type="received">
<day>30</day>
<month>04</month>
<year>2017</year>
</date>
<date date-type="accepted">
<day>19</day>
<month>09</month>
<year>2017</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2017 Ding, Melloni, Yang, Wang, Zhang and Poeppel.</copyright-statement>
<copyright-year>2017</copyright-year>
<copyright-holder>Ding, Melloni, Yang, Wang, Zhang and Poeppel</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) or licensor are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract><p>To understand speech, listeners have to combine the words they hear into phrases and sentences. Recent magnetoencephalography (MEG) and electrocorticography (ECoG) studies show that cortical activity is concurrently entrained/synchronized to the rhythms of multiple levels of linguistic units including words, phrases, and sentences. Here we investigate whether this phenomenon can be observed using electroencephalography (EEG), a technique that is more widely available than MEG and ECoG. We show that the EEG responses concurrently track the rhythms of hierarchical linguistic units such as syllables/words, phrases, and sentences. The strength of the sentential-rate response correlates with how well each subject can detect random words embedded in a sequence of sentences. In contrast, only a syllabic-rate response is observed for an unintelligible control stimulus. In sum, EEG provides a useful tool to characterize neural encoding of hierarchical linguistic units, potentially even in individual participants.</p></abstract>
<kwd-group>
<kwd>EEG</kwd>
<kwd>entrainment</kwd>
<kwd>speech</kwd>
<kwd>phrase</kwd>
<kwd>hierarchical structures</kwd>
</kwd-group>
<contract-num rid="cn001">31500873</contract-num>
<contract-sponsor id="cn001">National Natural Science Foundation of China<named-content content-type="fundref-id">10.13039/501100001809</named-content></contract-sponsor>
<counts>
<fig-count count="5"/>
<table-count count="0"/>
<equation-count count="4"/>
<ref-count count="36"/>
<page-count count="9"/>
<word-count count="5307"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>A critical feature of human language is that it can concatenate smaller units, e.g., words, into larger structures, e.g., phrases, and recursively bind such units into larger structures like sentences, governed by the constraints of a grammatical system (Chomsky, <xref ref-type="bibr" rid="B8">1957</xref>; Fitch and Friederici, <xref ref-type="bibr" rid="B16">2012</xref>; Berwick et al., <xref ref-type="bibr" rid="B4">2013</xref>; Everaert et al., <xref ref-type="bibr" rid="B13">2015</xref>). During speech comprehension, the acoustic speech signal is first mapped onto phonetic features, which are then deployed to retrieve lexical information (Poeppel et al., <xref ref-type="bibr" rid="B32">2008</xref>). To understand sentences, words have to be further combined into phrases and sentences, based on tacit grammatical knowledge (Townsend and Bever, <xref ref-type="bibr" rid="B35">2001</xref>; Phillips, <xref ref-type="bibr" rid="B31">2003</xref>). A number of studies have investigated the cortical network involved in the process of combining words into phrases and sentences (Friederici et al., <xref ref-type="bibr" rid="B18">2000</xref>; Lerner et al., <xref ref-type="bibr" rid="B24">2011</xref>; Pallier et al., <xref ref-type="bibr" rid="B29">2011</xref>; Nelson et al., <xref ref-type="bibr" rid="B28">2017</xref>). Those studies have shown increased activation in a distributed network involving the inferior frontal gyrus and the superior and middle temporal gyri when words combine into phrases. 
In terms of the neurophysiological processes, studies have shown that when syllables combine into words, the first syllable in a word elicits larger electroencephalography (EEG) responses at latency of around 100 ms (Sanders et al., <xref ref-type="bibr" rid="B33">2002</xref>) and that cortical activity tracks the rhythms of both syllables and words (Buiatti et al., <xref ref-type="bibr" rid="B6">2009</xref>; Kabdebon et al., <xref ref-type="bibr" rid="B20">2015</xref>; Farthouat et al., <xref ref-type="bibr" rid="B14">2016</xref>; Batterink and Paller, <xref ref-type="bibr" rid="B3">2017</xref>).</p>
<p>When investigating phrase-level neurophysiological processing, an EEG component, i.e., the closure positive shift (CPS), is observed at the boundary of prosodic phrases, which has been interpreted as a marker for phonological level processing of phrases (Steinhauer et al., <xref ref-type="bibr" rid="B34">1999</xref>; Li and Yang, <xref ref-type="bibr" rid="B25">2009</xref>). Recent magnetoencephalography (MEG) and electrocorticography (ECoG) experiments show that low-frequency cortical activity is concurrently entrained, i.e., synchronized, to the rhythms of multiple linguistic units, e.g., words, phrases, and sentences, even without any prosodic cues at the phrasal/sentential boundaries (Ding et al., <xref ref-type="bibr" rid="B12">2016</xref>). Furthermore, within a linguistic structure, the power of electrophysiological activity shows a sustained increase or build up in the theta, beta (Bastiaansen et al., <xref ref-type="bibr" rid="B2">2010</xref>; Bastiaansen and Hagoort, <xref ref-type="bibr" rid="B1">2015</xref>; Ding et al., <xref ref-type="bibr" rid="B12">2016</xref>), gamma (Pe&#x000F1;a and Melloni, <xref ref-type="bibr" rid="B30">2012</xref>), and high-gamma bands (Ding et al., <xref ref-type="bibr" rid="B12">2016</xref>; Nelson et al., <xref ref-type="bibr" rid="B28">2017</xref>). Neural tracking in different frequency bands may reflect the neural coupling across frequencies (Lakatos et al., <xref ref-type="bibr" rid="B22">2005</xref>; Canolty et al., <xref ref-type="bibr" rid="B7">2006</xref>), but it has also been suggested that beta and gamma bands may preferentially process syntactic and semantic information (Bastiaansen and Hagoort, <xref ref-type="bibr" rid="B1">2015</xref>; Ding et al., <xref ref-type="bibr" rid="B12">2016</xref>). 
These results indicate that during listening to connected speech, the brain can construct phrasal/sentential structure purely based on grammatical cues and entrain cortical rhythms to track the rhythms of these internally constructed linguistic units.</p>
<p>Concurrent cortical entrainment to hierarchical linguistic units provides a plausible neural marker to characterize how linguistic structure building is affected by factors such as attention and memory, and also affords a measure to study developmental and aging effects on linguistic structure building. One limitation of this neural marker, however, is that it has only been validated using MEG and ECoG, which are not commonly available recording techniques. Here we test whether cortical tracking of hierarchical linguistic units (Figure <xref ref-type="fig" rid="F1">1A</xref>) can also be observed using EEG.</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p>Stimulus. <bold>(A)</bold> Linguistic structure of the sentence stimuli. Each sentence contains a two-word noun phrase and a two-word verb phrase. All words are monosyllabic. <bold>(B)</bold> Auditory spectrogram of an example segment of the sentence stimulus (upper) and the control stimulus (lower). The acoustic control stimulus has spectro-temporal properties similar to the sentence materials. <bold>(C)</bold> Power spectrum of the stimulus envelope. Both the sentence stimulus and the control stimulus show temporal modulations at the syllabic rate, i.e., 1/0.32 Hz, but not at the phrasal or sentential rates.</p></caption>
<graphic xlink:href="fnhum-11-00481-g0001.tif"/>
</fig>
</sec>
<sec sec-type="methods" id="s2">
<title>Methods</title>
<sec>
<title>Subjects</title>
<p>Sixteen native American English speaking New York University undergraduate students (4 males; 2 left-handed; age range 18&#x02013;22) participated in this study. They were given course credit for participation. The institutional review board of New York University approved the study protocol, and written informed consent was obtained from all participants before the study.</p>
</sec>
<sec>
<title>Stimuli</title>
<p>The stimuli and procedures were identical to experiment 6 (sentence condition and shuffled sequence condition) of a recent MEG study (Ding et al., <xref ref-type="bibr" rid="B12">2016</xref>). In the sentence condition, each English sentence contains 4 monosyllabic words (Figure <xref ref-type="fig" rid="F1">1A</xref>). The first two words form a noun phrase (adjective/pronoun &#x0002B; noun) and the last two words form a verb phrase (verb &#x0002B; noun). English words were synthesized independently using the MacinTalk Synthesizer (male voice Alex, in Mac OS X 10.7.5). Each monosyllabic word was adjusted to 320 ms in duration. In each trial, 12 sentences were presented without any acoustic gap between sentences (continuous, isochronous presentation). Therefore, each trial is 15.36 s in duration. Thirty trials were played, eight of which contained outliers. An outlier trial was the same as a normal trial except that 3 consecutive words from a roved position were replaced with 3 random words. The behavioral response was correct in 72% (<italic>SD</italic> &#x0003D; 9%) of the trials for the sentence condition.</p>
<p>In the control condition, each syllable in the sentence condition was cut into 5 slices (72-ms in duration with a 10-ms overlap between neighboring slices, which is smoothed by a 10-ms linear ramp) and slices at the same position within a sentence were shuffled across sentences. The control stimulus is not intelligible speech but has similar acoustic properties as the 4-syllable sentences (Figures <xref ref-type="fig" rid="F1">1B,C</xref>). Detailed procedures of how the control stimuli were made are described in Ding et al. (<xref ref-type="bibr" rid="B12">2016</xref>). The control stimulus has the same duration as the sentence stimulus and 30 trials were presented. Eight trials contained outliers consisting of 4 randomly chosen English words embedded in the stimulus. The behavioral response was correct in 81% (<italic>SD</italic> &#x0003D; 14%) of the trials for the control condition. The behavioral score of one subject (33%) clearly differed from other subjects. If this subject was excluded, the mean correct rate was 84% (<italic>SD</italic> &#x0003D; 6%).</p>
<p>The spectrogram of an example segment of a stimulus is shown in Figure <xref ref-type="fig" rid="F1">1B</xref> for both conditions. The spectrogram is calculated using an auditory model (Yang et al., <xref ref-type="bibr" rid="B36">1992</xref>). The power spectrum of the temporal envelope of the stimuli is shown in Figure <xref ref-type="fig" rid="F1">1C</xref>. The temporal envelope is the average of the spectrogram over frequencies, and the power spectrum is calculated using the Discrete Fourier Transform (DFT) without any smoothing window. The power spectrum in Figure <xref ref-type="fig" rid="F1">1C</xref> is averaged over all 15.36-s duration trials. The stimulus envelope shows a spectral peak only at the syllabic/word rate.</p>
</sec>
<sec>
<title>Procedures</title>
<p>The experiment was conducted in a quiet room. The sentence condition and the control condition were presented in separate sessions and the order of these two sessions was counterbalanced over subjects. The participants were instructed to distinguish normal trials from outlier trials by pressing a response key at the end of each trial.</p>
</sec>
<sec>
<title>EEG recording</title>
<p>EEG was continuously recorded with a 128-channel EEG system (EGI, Inc., Eugene, OR), digitized at a sampling rate of 1,000 Hz (bandpass filter &#x0003D; 0.01&#x02013;400 Hz) and referenced to the vertex (Cz). The impedance of electrodes was kept below 40 k&#x003A9; (Ferree et al., <xref ref-type="bibr" rid="B15">2001</xref>). EOG artifacts were removed from the EEG recordings using ICA (Delorme and Makeig, <xref ref-type="bibr" rid="B10">2004</xref>). Specifically, the 128-channel EEG signals were dimension reduced to 80 components using PCA and then the 80 principal components were further decomposed using ICA. An independent component was removed if in its topography the mean power over the most frontal 14 channels was more than 10 times stronger than the mean power over all other channels.</p>
<p>The EEG signal was lowpass filtered to 25 Hz, since the signals of interest are in the low-frequency region, at 1/1.28, 2/1.28, and 4/1.28 Hz. Data were re-referenced offline to a common average reference. The response to each trial was epoched. The recorded data from the first sentence of each trial was removed to avoid the transient EEG response to sound onset.</p>
</sec>
<sec>
<title>Response power and inter-trial phase coherence</title>
<p>The EEG response in each trial was converted into the frequency domain using the DFT. After the first sentence was removed, each trial was 14.08 s in duration (11 sentences &#x000D7; 1.28 s/sentence) and therefore the frequency resolution of the DFT of the entire trial is 0.071 Hz, i.e., 1/14.08 Hz. If the DFT of the response in trial <italic>k</italic> is denoted as <italic>X</italic><sub><italic>k</italic></sub>(<italic>f</italic>), the evoked power spectrum is shown in equation (1), where <italic>K</italic> is the total number of trials. <italic>X</italic><sub><italic>k</italic></sub>(<italic>f</italic>) is a complex-valued Fourier coefficient and is a function of frequency <italic>f</italic>. The evoked power reflects the power of EEG responses that are synchronized to the speech input. It is the same as the power spectrum of the EEG response waveform averaged over trials.</p>
<disp-formula id="E1"><label>(1)</label><mml:math id="M1"><mml:mrow><mml:mi>E</mml:mi><mml:mo stretchy='false'>(</mml:mo><mml:mi>f</mml:mi><mml:mo stretchy='false'>)</mml:mo><mml:mo>=</mml:mo><mml:mo>&#x0007C;</mml:mo><mml:msub><mml:mo>&#x003A3;</mml:mo><mml:mi>k</mml:mi></mml:msub><mml:msub><mml:mi>X</mml:mi><mml:mi>k</mml:mi></mml:msub><mml:mo stretchy='false'>(</mml:mo><mml:mi>f</mml:mi><mml:mo stretchy='false'>)</mml:mo><mml:msup><mml:mo>&#x0007C;</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:mo>/</mml:mo><mml:mi>K</mml:mi></mml:mrow></mml:math></disp-formula>
<p>The inter-trial phase coherence is defined in equation (2), where &#x003B8;<sub><italic>k</italic></sub> is the phase angle of each complex-valued Fourier coefficient, i.e., &#x003B8;<sub><italic>k</italic></sub> &#x0003D; &#x02220;<italic>X</italic><sub><italic>k</italic></sub>(<italic>f</italic>).</p>
<disp-formula id="E2"><label>(2)</label><mml:math id="M2"><mml:mrow><mml:mi>R</mml:mi><mml:mo stretchy='false'>(</mml:mo><mml:mi>f</mml:mi><mml:mo stretchy='false'>)</mml:mo><mml:mo>=</mml:mo><mml:msup><mml:mrow><mml:mo stretchy='false'>(</mml:mo><mml:msub><mml:mo>&#x003A3;</mml:mo><mml:mi>k</mml:mi></mml:msub><mml:mtext>cos</mml:mtext><mml:mo stretchy='false'>(</mml:mo><mml:msub><mml:mo>&#x003B8;</mml:mo><mml:mi>k</mml:mi></mml:msub><mml:mo stretchy='false'>)</mml:mo><mml:mo stretchy='false'>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup><mml:mo>/</mml:mo><mml:mi>K</mml:mi><mml:mo>+</mml:mo><mml:msup><mml:mrow><mml:mo stretchy='false'>(</mml:mo><mml:msub><mml:mo>&#x003A3;</mml:mo><mml:mi>k</mml:mi></mml:msub><mml:mtext>sin</mml:mtext><mml:mo stretchy='false'>(</mml:mo><mml:msub><mml:mo>&#x003B8;</mml:mo><mml:mi>k</mml:mi></mml:msub><mml:mo stretchy='false'>)</mml:mo><mml:mo stretchy='false'>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup><mml:mo>/</mml:mo><mml:mi>K</mml:mi></mml:mrow></mml:math></disp-formula>
<p>The induced power, i.e., the power of EEG responses not synchronized to the speech input, is also calculated using the following formula, where &#x0003C;X(<italic>f</italic>)&#x0003E; denotes the mean over trials.</p>
<disp-formula id="E3"><label>(3)</label><mml:math id="M3"><mml:mrow><mml:mi>I</mml:mi><mml:mo stretchy='false'>(</mml:mo><mml:mi>f</mml:mi><mml:mo stretchy='false'>)</mml:mo><mml:mo>=</mml:mo><mml:msub><mml:mo>&#x003A3;</mml:mo><mml:mi>k</mml:mi></mml:msub><mml:mo>&#x0007C;</mml:mo><mml:msub><mml:mi>X</mml:mi><mml:mi>k</mml:mi></mml:msub><mml:mo stretchy='false'>(</mml:mo><mml:mi>f</mml:mi><mml:mo stretchy='false'>)</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:mo>&#x02212;</mml:mo><mml:mo>&#x0003C;</mml:mo><mml:mtext>&#x0200B;</mml:mtext><mml:mi>X</mml:mi><mml:mo stretchy='false'>(</mml:mo><mml:mi>f</mml:mi><mml:mo stretchy='false'>)</mml:mo><mml:mtext>&#x0200B;</mml:mtext><mml:mo>&#x0003E;</mml:mo><mml:mtext>&#x0200B;</mml:mtext><mml:msup><mml:mo>&#x0007C;</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:mo>/</mml:mo><mml:mi>K</mml:mi></mml:mrow></mml:math></disp-formula>
</sec>
<sec>
<title>Significance testing</title>
<p>The statistical significance of neural entrainment at a target frequency was tested for evoked power and inter-trial phase coherence, respectively. In the power test, to remove the 1/f trend of the response power spectrum, the response power at each frequency was normalized by the neighboring 14 frequency bins (7 bins on each side, which is equivalent to 0.5 Hz). The normalized power (equation 4), which can be viewed as a signal-to-noise measure, is:</p>
<disp-formula id="E4"><label>(4)</label><mml:math id="M4"><mml:mrow><mml:msub><mml:mi>E</mml:mi><mml:mi>n</mml:mi></mml:msub><mml:mo stretchy='false'>(</mml:mo><mml:mi>f</mml:mi><mml:mo stretchy='false'>)</mml:mo><mml:mo>=</mml:mo><mml:mi>E</mml:mi><mml:mo stretchy='false'>(</mml:mo><mml:mi>f</mml:mi><mml:mo stretchy='false'>)</mml:mo><mml:mo>/</mml:mo><mml:msub><mml:mo>&#x003A3;</mml:mo><mml:mo>&#x003C9;</mml:mo></mml:msub><mml:mi>E</mml:mi><mml:mo stretchy='false'>(</mml:mo><mml:mo>&#x003C9;</mml:mo><mml:mo stretchy='false'>)</mml:mo><mml:mo>,</mml:mo><mml:mo>&#x0007C;</mml:mo><mml:mo>&#x003C9;</mml:mo><mml:mo>&#x02212;</mml:mo><mml:mi>f</mml:mi><mml:mo>&#x0007C;</mml:mo><mml:mo>&#x0003C;</mml:mo><mml:mtext>&#x0200B;&#x0200B;</mml:mtext><mml:mn>0.5</mml:mn><mml:mtext>Hz</mml:mtext><mml:mo>,</mml:mo><mml:mo>&#x003C9;</mml:mo><mml:mo>&#x02260;</mml:mo><mml:mi>f</mml:mi></mml:mrow></mml:math></disp-formula>
<p>where &#x003C9; denotes frequencies around the target frequency <italic>f</italic>.</p>
<p>In the phase coherence test, phase coherence values are not normalized by the neighboring frequency bins, since the inter-trial phase coherence spectrum has no 1/f fall-off.</p>
<p>For the power test, the null hypothesis is that the power at the target frequency is not significantly larger than the power in neighboring frequencies. Under the null hypothesis, the normalized power <italic>E</italic><sub><italic>n</italic></sub>(<italic>f</italic>) is subject to an <italic>F</italic><sub>(32, 448)</sub> distribution for each channel. When the response power is averaged over channels, since the EEG response is correlated over channels, we conservatively assume that the normalized power calculated based on the power averaged over channels is also subject to an <italic>F</italic><sub>(32, 448)</sub> distribution. For the phase coherence test, the null hypothesis is that the response phase is not synchronized to the stimulus and the null distribution of &#x003B8;<sub><italic>k</italic></sub> is a uniform distribution. Therefore, we employed the <italic>F</italic>-test and the Rayleigh test, respectively, to evaluate the statistical significance of the evoked power and phase coherence at each target frequency.</p>
<p>For the response averaged over channels, the null distribution of the evoked power or phase coherence cannot be easily described by a parametric distribution due to the correlation between channels. Therefore, the null distribution of normalized power (or inter-trial phase coherence) is estimated based on the response at non-target frequencies, i.e., the responses at frequencies that are not harmonically related to the sentential rate. The chance-level normalized power (or phase coherence) is pooled over frequencies. When the significance test is applied to individual subjects, the chance-level power (or phase coherence) is pooled over subjects. The statistical significance of the response at a target frequency is the probability that the target-frequency response differs from a chance-level response.</p>
<p>A linear classification analysis is employed to test if the topographic patterns at two frequencies or in two conditions are significantly different. In this analysis, the topographic plots averaged over half of the trials (e.g., the first or last 15 trials) are used to train a classifier. Each subject is viewed as a sample. The classifier&#x00027;s performance is evaluated based on the data averaged over the other half of the trials. A binomial test (<italic>N</italic> &#x0003D; 16, probability: 0.5) is used to test if the classifier can discriminate the two classes of topographic plots with higher than chance performance.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<p>We first analyzed the global field power of EEG responses (Figure <xref ref-type="fig" rid="F2">2A</xref>). In this analysis, the power spectrum is calculated for each electrode and then averaged over electrodes. In the grand average over subjects, the response to sentences shows three clear peaks at the sentential, phrasal, and syllabic rates, respectively [<italic>P</italic> &#x0003C; 0.001, <italic>F</italic><sub>(32, 448)</sub> &#x0003D; 8.9, 6.1, and 111.9, respectively]. The response to the acoustic control shows a single statistically significant peak at the syllabic rate [<italic>P</italic> &#x0003C; 0.001, <italic>F</italic><sub>(32, 448)</sub> &#x0003D; 47.6]. The responses at the sentential and phrasal rates are not significantly stronger than the power in neighboring frequency bins [<italic>P</italic> &#x0003E; 0.3, <italic>F</italic><sub>(32, 448)</sub> &#x0003D; 1.1, and 1.1 respectively]. Comparing the sentence condition and the control condition, it is revealed that the response is stronger for the sentence condition at the sentential [<italic>P</italic> &#x0003C; 0.001, <italic>F</italic><sub>(32, 32)</sub> &#x0003D; 7.9], phrasal [<italic>P</italic> &#x0003C; 0.001, <italic>F</italic><sub>(32, 32)</sub> &#x0003D; 4.5], and syllabic rates [<italic>P</italic> &#x0003D; 0.03, <italic>F</italic><sub>(32, 32)</sub> &#x0003D; 2.0].</p>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p>EEG responses to sentences and the acoustic control (grand average over all subjects and channels). <bold>(A)</bold> The evoked power spectrum of EEG responses. The bold black line shows the grand average over subjects, the two thin black lines delimit the 75th and 25th percentiles. Green lines show the data from individual subjects. The responses to sentences show 3 peaks at the sentential (1/1.28 Hz), phrasal (1/0.64 Hz), and syllabic rates (1/0.32 Hz), respectively. In contrast, the responses to the acoustic control only show one peak at the syllabic rate. <bold>(B)</bold> The spectrum of inter-trial phase coherence. The phase coherence spectrum is similar to the evoked power spectrum except that there is no 1/f power fall-off in the spectrum. Statistically significant inter-trial phase coherence means that the EEG responses are phase-locked to the stimulus. <bold>(C)</bold> Induced power.</p></caption>
<graphic xlink:href="fnhum-11-00481-g0002.tif"/>
</fig>
<p>To quantify if the neural response is phase-locked to the stimulus, we calculated the inter-trial phase coherence. The inter-trial phase coherence averaged over channels is shown in Figure <xref ref-type="fig" rid="F2">2B</xref>. For the sentence condition, three peaks in the phase coherence spectrum are observed at the sentential, phrasal, and syllabic rates, respectively (<italic>P</italic> &#x0003C; 0.002, see Methods). For the control condition, only one peak at the syllabic rate is observed (<italic>P</italic> &#x0003C; 0.002).</p>
<p>The induced power, i.e., non-phase-locked power, of the EEG responses is shown in Figure <xref ref-type="fig" rid="F2">2C</xref>. No spectral peak is observed at the sentential, phrasal, or syllabic rate.</p>
<p>The EEG responses in the sentence condition were further analyzed as follows. We first quantify whether the neural responses to hierarchical linguistic units can be reliably detected in single subjects. The response power from individual subjects is shown in Figure <xref ref-type="fig" rid="F3">3A</xref> for each target frequency. The power at each target frequency was normalized by the mean power in a 1-Hz neighboring frequency area (0.5 Hz on each side of the target frequency). The responses at the sentential, phrasal, and syllabic rates reached the significance level (<italic>P</italic> &#x0003C; 0.05, FDR-corrected, see Methods) in 62.5, 43.8, and 100% of the 16 participants, respectively. The inter-trial phase coherence values of individual subjects are shown in Figure <xref ref-type="fig" rid="F3">3B</xref>. Statistically significant phase coherence was observed at the sentential, phrasal, and syllabic rates in 62.5, 56.3, and 100% of the participants, respectively (<italic>P</italic> &#x0003C; 0.05, FDR-corrected, see Methods). Neural entrainment to at least one higher-level linguistic structure (i.e., phrase or sentence) is detected in 68.8% (<italic>N</italic> &#x0003D; 11) and 81.3% (<italic>N</italic> &#x0003D; 13) of the subjects for the power test and the phase test, respectively.</p>
<fig id="F3" position="float">
<label>Figure 3</label>
<caption><p>Neural responses to hierarchical linguistic structures in individual participants. The normalized evoked power <bold>(A)</bold> and inter-trial phase coherence <bold>(B)</bold> for individual subjects at each target frequency. Participants showing a statistically significant spectral peak at each target frequency are marked by a star (<italic>P</italic> &#x0003C; 0.05, FDR-corrected, see Methods).</p></caption>
<graphic xlink:href="fnhum-11-00481-g0003.tif"/>
</fig>
<p>The spatial distribution of EEG power and phase coherence over electrodes is shown in Figure <xref ref-type="fig" rid="F4">4</xref>. The syllabic response is most salient around channel Cz. The sentential and phrasal rate responses, however, are more salient near channels on the right and left sides of channel Cz. Such a distinction in spatial distribution, however, is not consistent across subjects, since a linear classifier fails to distinguish the topographic patterns between the conditions shown in Figure <xref ref-type="fig" rid="F4">4</xref> above chance level, possibly due to the low spatial resolution of EEG and large individual differences.</p>
<fig id="F4" position="float">
<label>Figure 4</label>
<caption><p>Topography of the neural responses at the sentential, phrasal, and syllabic rates. Channels Cz, T7, T8, Fz, and Pz are marked by blue dots. <bold>(A)</bold> The normalized evoked response averaged over subjects. The color bar shows the normalized power in dB. The syllabic rate response is strongest near channel Cz. In contrast, the sentential response is strongest between Cz and T8 and the phrasal response shows a bilateral pattern on both sides of Cz. <bold>(B)</bold> The inter-trial phase coherence averaged over subjects shows a pattern similar to that of the normalized evoked power.</p></caption>
<graphic xlink:href="fnhum-11-00481-g0004.tif"/>
</fig>
<p>Finally, we examine whether the EEG responses are correlated with behavior (Figure <xref ref-type="fig" rid="F5">5</xref>). The sentential-rate response is found to be significantly correlated with the performance of detecting an outlier (i.e., 3 random words) embedded in a sequence of grammatical sentences. No correlation with behavior is observed at other frequencies.</p>
<fig id="F5" position="float">
<label>Figure 5</label>
<caption><p>Correlation between neural response power and behavior for the sentence <bold>(A&#x02013;C)</bold> and control condition <bold>(D)</bold>. In the sentence condition, the sentential-rate response is positively correlated with how well each subject can detect a sequence of random words embedded in a sequence of sentences. In <bold>(D)</bold>, data from one subject are not shown since the behavioral score (33%) is much lower than those of the other subjects.</p></caption>
<graphic xlink:href="fnhum-11-00481-g0005.tif"/>
</fig>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>This study shows that ongoing EEG responses can follow the rhythmic structure of multiple linguistic levels, concurrently, during listening to connected speech. These results demonstrate that scalp EEG provides an effective tool to investigate the neural tracking of hierarchical linguistic units in individual subjects.</p>
<sec>
<title>Neural representation of hierarchical linguistic units</title>
<p>Whether sentences are represented by hierarchically embedded syntactic structures or linear Markov models during language comprehension is a central question in cognitive science (Chomsky, <xref ref-type="bibr" rid="B8">1957</xref>; Townsend and Bever, <xref ref-type="bibr" rid="B35">2001</xref>; Jackendoff, <xref ref-type="bibr" rid="B19">2002</xref>; Phillips, <xref ref-type="bibr" rid="B31">2003</xref>; Frank et al., <xref ref-type="bibr" rid="B17">2012</xref>; Everaert et al., <xref ref-type="bibr" rid="B13">2015</xref>). Recently, a number of studies have suggested that neural processing of languages cannot be fully explained by a linear Markov model and is consistent with hierarchical syntactic models. For example, using fMRI, Brennan et al. tested how well BOLD signals in each cortical area can be explained by hierarchical models or Markov models (Brennan et al., <xref ref-type="bibr" rid="B5">2016</xref>). They found that while hierarchical models predicted BOLD signals in the anterior and posterior temporal lobes, a Markov model predicted activity in a broader cortical network including the frontal lobe. Neural entrainment to linguistic structures also provides a useful tool to address how syntactic structures are represented in the brain. For example, previous MEG data show that neural activity can entrain to linguistic structures even without any statistical cues for structural boundaries, demonstrating that statistical cues are not the only cues for syntactic analysis (Ding et al., <xref ref-type="bibr" rid="B12">2016</xref>).</p>
</sec>
<sec>
<title>Neural entrainment to speech</title>
<p>When listening to speech, cortical activity is entrained to the temporal envelope of speech (Luo and Poeppel, <xref ref-type="bibr" rid="B26">2007</xref>; Kerlin et al., <xref ref-type="bibr" rid="B21">2010</xref>; Lalor and Foxe, <xref ref-type="bibr" rid="B23">2010</xref>), which carries the acoustic rhythm of speech. It has also been shown that cortical activity carries phonetic information (Di Liberto et al., <xref ref-type="bibr" rid="B11">2015</xref>). Furthermore, as shown in this study using EEG and previous studies using MEG and ECoG (Ding et al., <xref ref-type="bibr" rid="B12">2016</xref>), cortical activity is also entrained to the rhythms of higher level linguistic structures such as phrases and sentences, in the absence of acoustic cues. Therefore, during speech listening, cortical activity on different time scales is concurrently synchronized to linguistic structures of the corresponding time scales. In other words, a hierarchy of linguistic structures is converted into neural dynamics on different time scales, providing a plausible neural basis for the mental representation of hierarchical linguistic structures and the interactions between linguistic levels during speech processing (Townsend and Bever, <xref ref-type="bibr" rid="B35">2001</xref>; Poeppel et al., <xref ref-type="bibr" rid="B32">2008</xref>; Christiansen and Chater, <xref ref-type="bibr" rid="B9">2016</xref>).</p>
<p>Although a syllabic-rate response is observed in both the sentence condition and the control condition, it is weaker in the control condition. This effect may reflect better neural tracking of intelligible monosyllabic words. Alternatively, it is possible that the subjects paid more attention in the sentence condition, which enhances the syllabic/word rate response. The sentence condition may require a higher level of attention, since the behavioral task is more challenging in the sentence condition (&#x0007E;70% correct rate in the sentence condition vs. &#x0007E;80% correct rate in the control condition).</p>
<p>To dissociate syntactic from prosodic processing, the current study removes prosodic cues in speech. Natural speech, however, contains rich prosodic information which facilitates syntactic analysis. Therefore, neural tracking of phrasal and sentential structures is likely to be more prominent in natural speech. Furthermore, prosodic cues can also directly generate event-related responses tracking the structural boundaries, such as the CPS (Steinhauer et al., <xref ref-type="bibr" rid="B34">1999</xref>).</p>
</sec>
<sec>
<title>Measuring neural tracking of phrases and sentences using EEG</title>
<p>In this study, 30 trials of sentence sequences (&#x0007E;15 s each) are presented and the neural tracking of higher-level linguistic structures, i.e., phrases or sentences, can be detected in more than half of the subjects using EEG. Therefore, the EEG-based paradigm shown here provides a plausible way to measure the neural encoding of higher-level linguistic structures. The sentential and phrasal responses do not reach significance in some subjects, possibly limited by the low SNR of EEG recordings. The subjects in the current study are all young adult native speakers without any language disorders, and therefore individual differences in language ability should be small, given such elementary processing demands. Nevertheless, the performance of detecting random words embedded in a sequence of sentences shows considerable individual differences, which is likely to be driven by cognitive factors, e.g., attention, rather than language ability. Indeed, a recent study shows that neural tracking of phrasal and sentential structure is diminished during sleep (Makov et al., <xref ref-type="bibr" rid="B27">2017</xref>). Future experiments are needed to elucidate the influence of tasks and cognitive states on the neural tracking of phrasal and sentential structures.</p>
<p>It is challenging to detect low-frequency neural activity, since background neural activity generally has a 1/f spectrum. Compared with the 4-Hz syllabic-rate response and the 1-Hz sentential-rate response, however, the 2-Hz phrasal-rate response is especially difficult to detect in individual subjects. A possible reason is the following: The syllables have very clear acoustic boundaries and therefore can drive strong auditory responses. Each sentence is a syntactically and semantically coherent unit and, in this experiment, different sentences are syntactically and semantically disconnected. Therefore, the sentences also have relatively clear perceptual boundaries. The phrases within a sentence, however, are related both syntactically and semantically, which makes the boundaries between them less obvious than those between syllables and sentences.</p>
<p>Finally, since EEG is a commonly available non-invasive neural recording technique, the current paradigm has the potential of being developed into a tool to assess higher-level linguistic processing in populations less able to engage in typical laboratory research, including children and clinical patients. Applying the current paradigm to a special population, however, may require adapting the sentence materials based on the vocabulary familiar to the target population and elucidating how attention and other cognitive factors may influence the neural tracking of higher-level linguistic structures.</p>
</sec>
</sec>
<sec id="s5">
<title>Author contributions</title>
<p>ND, LM, and DP conceived the experiment. AY performed the experiments. AY, YW, WZ, and ND analyzed the data. ND, LM, and DP wrote the paper. All authors edited the paper.</p>
<sec>
<title>Conflict of interest statement</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</sec>
</body>
<back>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bastiaansen</surname> <given-names>M.</given-names></name> <name><surname>Hagoort</surname> <given-names>P.</given-names></name></person-group> (<year>2015</year>). <article-title>Frequency-based segregation of syntactic and semantic unification during online sentence level language comprehension</article-title>. <source>J. Cogn. Neurosci.</source> <volume>27</volume>, <fpage>2095</fpage>&#x02013;<lpage>2107</lpage>. <pub-id pub-id-type="doi">10.1162/jocn_a_00829</pub-id><pub-id pub-id-type="pmid">26042498</pub-id></citation></ref>
<ref id="B2">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bastiaansen</surname> <given-names>M.</given-names></name> <name><surname>Magyari</surname> <given-names>L.</given-names></name> <name><surname>Hagoort</surname> <given-names>P.</given-names></name></person-group> (<year>2010</year>). <article-title>Syntactic unification operations are reflected in oscillatory dynamics during on-line sentence comprehension</article-title>. <source>J. Cogn. Neurosci.</source> <volume>22</volume>, <fpage>1333</fpage>&#x02013;<lpage>1347</lpage>. <pub-id pub-id-type="doi">10.1162/jocn.2009.21283</pub-id><pub-id pub-id-type="pmid">19580386</pub-id></citation></ref>
<ref id="B3">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Batterink</surname> <given-names>L. J.</given-names></name> <name><surname>Paller</surname> <given-names>K. A.</given-names></name></person-group> (<year>2017</year>). <article-title>Online neural monitoring of statistical learning</article-title>. <source>Cortex</source> <volume>90</volume>, <fpage>31</fpage>&#x02013;<lpage>45</lpage>. <pub-id pub-id-type="doi">10.1016/j.cortex.2017.02.004</pub-id><pub-id pub-id-type="pmid">28324696</pub-id></citation></ref>
<ref id="B4">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Berwick</surname> <given-names>R. C.</given-names></name> <name><surname>Friederici</surname> <given-names>A. D.</given-names></name> <name><surname>Chomsky</surname> <given-names>N.</given-names></name> <name><surname>Bolhuis</surname> <given-names>J. J.</given-names></name></person-group> (<year>2013</year>). <article-title>Evolution, brain, and the nature of language</article-title>. <source>Trends Cogn. Sci.</source> <volume>17</volume>, <fpage>89</fpage>&#x02013;<lpage>98</lpage>. <pub-id pub-id-type="doi">10.1016/j.tics.2012.12.002</pub-id><pub-id pub-id-type="pmid">23313359</pub-id></citation></ref>
<ref id="B5">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Brennan</surname> <given-names>J. R.</given-names></name> <name><surname>Stabler</surname> <given-names>E. P.</given-names></name> <name><surname>Van Wagenen</surname> <given-names>S. E.</given-names></name> <name><surname>Luh</surname> <given-names>W. M.</given-names></name> <name><surname>Hale</surname> <given-names>J. T.</given-names></name></person-group> (<year>2016</year>). <article-title>Abstract linguistic structure correlates with temporal activity during naturalistic comprehension</article-title>. <source>Brain Lang.</source> <volume>157</volume>, <fpage>81</fpage>&#x02013;<lpage>94</lpage>. <pub-id pub-id-type="doi">10.1016/j.bandl.2016.04.008</pub-id><pub-id pub-id-type="pmid">27208858</pub-id></citation></ref>
<ref id="B6">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Buiatti</surname> <given-names>M.</given-names></name> <name><surname>Pe&#x000F1;a</surname> <given-names>M.</given-names></name> <name><surname>Dehaene-Lambertz</surname> <given-names>G.</given-names></name></person-group> (<year>2009</year>). <article-title>Investigating the neural correlates of continuous speech computation with frequency-tagged neuroelectric responses</article-title>. <source>Neuroimage</source> <volume>44</volume>, <fpage>509</fpage>&#x02013;<lpage>551</lpage>. <pub-id pub-id-type="doi">10.1016/j.neuroimage.2008.09.015</pub-id><pub-id pub-id-type="pmid">18929668</pub-id></citation></ref>
<ref id="B7">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Canolty</surname> <given-names>R. T.</given-names></name> <name><surname>Edwards</surname> <given-names>E.</given-names></name> <name><surname>Dalal</surname> <given-names>S. S.</given-names></name> <name><surname>Soltani</surname> <given-names>M.</given-names></name> <name><surname>Nagarajan</surname> <given-names>S. S.</given-names></name> <name><surname>Kirsch</surname> <given-names>H. E.</given-names></name> <etal/></person-group>. (<year>2006</year>). <article-title>High gamma power is phase-locked to theta oscillations in human neocortex</article-title>. <source>Science</source> <volume>313</volume>, <fpage>1626</fpage>&#x02013;<lpage>1628</lpage>. <pub-id pub-id-type="doi">10.1126/science.1128115</pub-id><pub-id pub-id-type="pmid">16973878</pub-id></citation></ref>
<ref id="B8">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Chomsky</surname> <given-names>N.</given-names></name></person-group> (<year>1957</year>). <source>Syntactic Structures</source>. <publisher-name>Mouton de Gruyter</publisher-name>.</citation></ref>
<ref id="B9">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Christiansen</surname> <given-names>M. H.</given-names></name> <name><surname>Chater</surname> <given-names>N.</given-names></name></person-group> (<year>2016</year>). <article-title>The now-or-never bottleneck: a fundamental constraint on language</article-title>. <source>Behav. Brain Sci.</source> <volume>39</volume>:<fpage>e62</fpage>. <pub-id pub-id-type="doi">10.1017/S0140525X1500031X</pub-id><pub-id pub-id-type="pmid">25869618</pub-id></citation></ref>
<ref id="B10">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Delorme</surname> <given-names>A.</given-names></name> <name><surname>Makeig</surname> <given-names>S.</given-names></name></person-group> (<year>2004</year>). <article-title>EEGLAB: an open source toolbox for analysis of single-trial EEG dynamics including independent component analysis</article-title>. <source>J. Neurosci. Methods</source> <volume>134</volume>, <fpage>9</fpage>&#x02013;<lpage>21</lpage>. <pub-id pub-id-type="doi">10.1016/j.jneumeth.2003.10.009</pub-id><pub-id pub-id-type="pmid">15102499</pub-id></citation></ref>
<ref id="B11">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Di Liberto</surname> <given-names>G. M.</given-names></name> <name><surname>O&#x00027;Sullivan</surname> <given-names>J. A.</given-names></name> <name><surname>Lalor</surname> <given-names>E. C.</given-names></name></person-group> (<year>2015</year>). <article-title>Low-frequency cortical entrainment to speech reflects phoneme-level processing</article-title>. <source>Curr. Biol.</source> <volume>25</volume>, <fpage>2457</fpage>&#x02013;<lpage>2465</lpage>. <pub-id pub-id-type="doi">10.1016/j.cub.2015.08.030</pub-id><pub-id pub-id-type="pmid">26412129</pub-id></citation></ref>
<ref id="B12">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ding</surname> <given-names>N.</given-names></name> <name><surname>Melloni</surname> <given-names>L.</given-names></name> <name><surname>Zhang</surname> <given-names>H.</given-names></name> <name><surname>Tian</surname> <given-names>X.</given-names></name> <name><surname>Poeppel</surname> <given-names>D.</given-names></name></person-group> (<year>2016</year>). <article-title>Cortical tracking of hierarchical linguistic structures in connected speech</article-title>. <source>Nat. Neurosci.</source> <volume>19</volume>, <fpage>158</fpage>&#x02013;<lpage>164</lpage>. <pub-id pub-id-type="doi">10.1038/nn.4186</pub-id><pub-id pub-id-type="pmid">26642090</pub-id></citation></ref>
<ref id="B13">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Everaert</surname> <given-names>M. B.</given-names></name> <name><surname>Huybregts</surname> <given-names>M. A.</given-names></name> <name><surname>Chomsky</surname> <given-names>N.</given-names></name> <name><surname>Berwick</surname> <given-names>R. C.</given-names></name> <name><surname>Bolhuis</surname> <given-names>J. J.</given-names></name></person-group> (<year>2015</year>). <article-title>Structures, not strings: linguistics as part of the cognitive sciences</article-title>. <source>Trends Cogn. Sci.</source> <volume>19</volume>, <fpage>729</fpage>&#x02013;<lpage>743</lpage>. <pub-id pub-id-type="doi">10.1016/j.tics.2015.09.008</pub-id><pub-id pub-id-type="pmid">26564247</pub-id></citation></ref>
<ref id="B14">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Farthouat</surname> <given-names>J.</given-names></name> <name><surname>Franco</surname> <given-names>A.</given-names></name> <name><surname>Mary</surname> <given-names>A.</given-names></name> <name><surname>Delpouve</surname> <given-names>J.</given-names></name> <name><surname>Wens</surname> <given-names>V.</given-names></name> <name><surname>Op de Beeck</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>Auditory magnetoencephalographic frequency-tagged responses mirror the ongoing segmentation processes underlying statistical learning</article-title>. <source>Brain Topogr.</source> <volume>30</volume>, <fpage>220</fpage>&#x02013;<lpage>232</lpage>. <pub-id pub-id-type="doi">10.1007/s10548-016-0518-y</pub-id><pub-id pub-id-type="pmid">27613530</pub-id></citation></ref>
<ref id="B15">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ferree</surname> <given-names>T. C.</given-names></name> <name><surname>Luu</surname> <given-names>P.</given-names></name> <name><surname>Russell</surname> <given-names>G. S.</given-names></name> <name><surname>Tucker</surname> <given-names>D. M.</given-names></name></person-group> (<year>2001</year>). <article-title>Scalp electrode impedance, infection risk, and EEG data quality</article-title>. <source>Clin. Neurophysiol.</source> <volume>112</volume>, <fpage>536</fpage>&#x02013;<lpage>544</lpage>. <pub-id pub-id-type="doi">10.1016/S1388-2457(00)00533-2</pub-id><pub-id pub-id-type="pmid">11222977</pub-id></citation></ref>
<ref id="B16">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fitch</surname> <given-names>W. T.</given-names></name> <name><surname>Friederici</surname> <given-names>A. D.</given-names></name></person-group> (<year>2012</year>). <article-title>Artificial grammar learning meets formal language theory: an overview</article-title>. <source>Philos. Trans. R. Soc. B Biol. Sci.</source> <volume>367</volume>, <fpage>1933</fpage>&#x02013;<lpage>1955</lpage>. <pub-id pub-id-type="doi">10.1098/rstb.2012.0103</pub-id><pub-id pub-id-type="pmid">22688631</pub-id></citation></ref>
<ref id="B17">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Frank</surname> <given-names>S. L.</given-names></name> <name><surname>Bod</surname> <given-names>R.</given-names></name> <name><surname>Christiansen</surname> <given-names>M. H.</given-names></name></person-group> (<year>2012</year>). <article-title>How hierarchical is language use?</article-title> <source>Proc. R. Soc. B</source> <volume>279</volume>, <fpage>4522</fpage>&#x02013;<lpage>4531</lpage>. <pub-id pub-id-type="doi">10.1098/rspb.2012.1741</pub-id><pub-id pub-id-type="pmid">22977157</pub-id></citation></ref>
<ref id="B18">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Friederici</surname> <given-names>A. D.</given-names></name> <name><surname>Meyer</surname> <given-names>M.</given-names></name> <name><surname>Cramon</surname> <given-names>D. Y.</given-names></name></person-group> (<year>2000</year>). <article-title>Auditory language comprehension: an event-related fMRI study on the processing of syntactic and lexical information</article-title>. <source>Brain Lang.</source> <volume>74</volume>, <fpage>289</fpage>&#x02013;<lpage>300</lpage>. <pub-id pub-id-type="doi">10.1006/brln.2000.2313</pub-id><pub-id pub-id-type="pmid">10950920</pub-id></citation></ref>
<ref id="B19">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Jackendoff</surname> <given-names>R.</given-names></name></person-group> (<year>2002</year>). <source>Foundations of Language: Brain, Meaning, Grammar, Evolution.</source> <publisher-name>Oxford University Press</publisher-name>. <pub-id pub-id-type="pmid">15377127</pub-id></citation></ref>
<ref id="B20">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kabdebon</surname> <given-names>C.</given-names></name> <name><surname>Pe&#x000F1;a</surname> <given-names>M.</given-names></name> <name><surname>Buiatti</surname> <given-names>M.</given-names></name> <name><surname>Dehaene-Lambertz</surname> <given-names>G.</given-names></name></person-group> (<year>2015</year>). <article-title>Electrophysiological evidence of statistical learning of long-distance dependencies in 8-month-old preterm and full-term infants</article-title>. <source>Brain Lang.</source> <volume>148</volume>, <fpage>25</fpage>&#x02013;<lpage>36</lpage>. <pub-id pub-id-type="doi">10.1016/j.bandl.2015.03.005</pub-id><pub-id pub-id-type="pmid">25865749</pub-id></citation></ref>
<ref id="B21">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kerlin</surname> <given-names>J. R.</given-names></name> <name><surname>Shahin</surname> <given-names>A. J.</given-names></name> <name><surname>Miller</surname> <given-names>L. M.</given-names></name></person-group> (<year>2010</year>). <article-title>Attentional gain control of ongoing cortical speech representations in a &#x0201C;Cocktail Party.&#x0201D;</article-title> <source>J. Neurosci.</source> <volume>30</volume>, <fpage>620</fpage>&#x02013;<lpage>628</lpage>. <pub-id pub-id-type="doi">10.1523/JNEUROSCI.3631-09.2010</pub-id><pub-id pub-id-type="pmid">20071526</pub-id></citation></ref>
<ref id="B22">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lakatos</surname> <given-names>P.</given-names></name> <name><surname>Shah</surname> <given-names>A. S.</given-names></name> <name><surname>Knuth</surname> <given-names>K. H.</given-names></name> <name><surname>Ulbert</surname> <given-names>I.</given-names></name> <name><surname>Karmos</surname> <given-names>G.</given-names></name> <name><surname>Schroeder</surname> <given-names>C. E.</given-names></name></person-group> (<year>2005</year>). <article-title>An oscillatory hierarchy controlling neuronal excitability and stimulus processing in the auditory cortex</article-title>. <source>J. Neurophysiol.</source> <volume>94</volume>, <fpage>1904</fpage>&#x02013;<lpage>1911</lpage>. <pub-id pub-id-type="doi">10.1152/jn.00263.2005</pub-id><pub-id pub-id-type="pmid">15901760</pub-id></citation></ref>
<ref id="B23">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lalor</surname> <given-names>E. C.</given-names></name> <name><surname>Foxe</surname> <given-names>J. J.</given-names></name></person-group> (<year>2010</year>). <article-title>Neural responses to uninterrupted natural speech can be extracted with precise temporal resolution</article-title>. <source>Eur. J. Neurosci.</source> <volume>31</volume>, <fpage>189</fpage>&#x02013;<lpage>193</lpage>. <pub-id pub-id-type="doi">10.1111/j.1460-9568.2009.07055.x</pub-id><pub-id pub-id-type="pmid">20092565</pub-id></citation></ref>
<ref id="B24">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lerner</surname> <given-names>Y.</given-names></name> <name><surname>Honey</surname> <given-names>C. J.</given-names></name> <name><surname>Silbert</surname> <given-names>L. J.</given-names></name> <name><surname>Hasson</surname> <given-names>U.</given-names></name></person-group> (<year>2011</year>). <article-title>Topographic mapping of a hierarchy of temporal receptive windows using a narrated story</article-title>. <source>J. Neurosci.</source> <volume>31</volume>, <fpage>2906</fpage>&#x02013;<lpage>2915</lpage>. <pub-id pub-id-type="doi">10.1523/JNEUROSCI.3684-10.2011</pub-id><pub-id pub-id-type="pmid">21414912</pub-id></citation></ref>
<ref id="B25">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>W.</given-names></name> <name><surname>Yang</surname> <given-names>Y.</given-names></name></person-group> (<year>2009</year>). <article-title>Perception of prosodic hierarchical boundaries in Mandarin Chinese sentences</article-title>. <source>Neuroscience</source> <volume>158</volume>, <fpage>1416</fpage>&#x02013;<lpage>1425</lpage>. <pub-id pub-id-type="doi">10.1016/j.neuroscience.2008.10.065</pub-id><pub-id pub-id-type="pmid">19111906</pub-id></citation></ref>
<ref id="B26">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Luo</surname> <given-names>H.</given-names></name> <name><surname>Poeppel</surname> <given-names>D.</given-names></name></person-group> (<year>2007</year>). <article-title>Phase patterns of neuronal responses reliably discriminate speech in human auditory cortex</article-title>. <source>Neuron</source> <volume>54</volume>, <fpage>1001</fpage>&#x02013;<lpage>1010</lpage>. <pub-id pub-id-type="doi">10.1016/j.neuron.2007.06.004</pub-id><pub-id pub-id-type="pmid">17582338</pub-id></citation></ref>
<ref id="B27">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Makov</surname> <given-names>S.</given-names></name> <name><surname>Sharon</surname> <given-names>O.</given-names></name> <name><surname>Ding</surname> <given-names>N.</given-names></name> <name><surname>Ben-Shachar</surname> <given-names>M.</given-names></name> <name><surname>Nir</surname> <given-names>Y.</given-names></name> <name><surname>Zion Golumbic</surname> <given-names>E.</given-names></name></person-group> (<year>2017</year>). <article-title>Sleep disrupts high-level speech parsing despite significant basic auditory processing</article-title>. <source>J. Neurosci.</source> <volume>37</volume>, <fpage>7772</fpage>&#x02013;<lpage>7781</lpage>. <pub-id pub-id-type="doi">10.1523/JNEUROSCI.0168-17.2017</pub-id><pub-id pub-id-type="pmid">28626013</pub-id></citation></ref>
<ref id="B28">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nelson</surname> <given-names>M. J.</given-names></name> <name><surname>El Karoui</surname> <given-names>I.</given-names></name> <name><surname>Giber</surname> <given-names>K.</given-names></name> <name><surname>Yang</surname> <given-names>X.</given-names></name> <name><surname>Cohen</surname> <given-names>L.</given-names></name> <name><surname>Koopman</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>2017</year>). <article-title>Neurophysiological dynamics of phrase-structure building during sentence processing</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>114</volume>, <fpage>E3669</fpage>&#x02013;<lpage>E3678</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1701590114</pub-id><pub-id pub-id-type="pmid">28416691</pub-id></citation></ref>
<ref id="B29">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pallier</surname> <given-names>C.</given-names></name> <name><surname>Devauchelle</surname> <given-names>A. D.</given-names></name> <name><surname>Dehaene</surname> <given-names>S.</given-names></name></person-group> (<year>2011</year>). <article-title>Cortical representation of the constituent structure of sentences</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>108</volume>, <fpage>2522</fpage>&#x02013;<lpage>2527</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1018711108</pub-id><pub-id pub-id-type="pmid">21224415</pub-id></citation></ref>
<ref id="B30">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pe&#x000F1;a</surname> <given-names>M.</given-names></name> <name><surname>Melloni</surname> <given-names>L.</given-names></name></person-group> (<year>2012</year>). <article-title>Brain oscillations during spoken sentence processing</article-title>. <source>J. Cogn. Neurosci.</source> <volume>24</volume>, <fpage>1149</fpage>&#x02013;<lpage>1164</lpage>. <pub-id pub-id-type="doi">10.1162/jocn_a_00144</pub-id><pub-id pub-id-type="pmid">21981666</pub-id></citation></ref>
<ref id="B31">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Phillips</surname> <given-names>C.</given-names></name></person-group> (<year>2003</year>). <article-title>Linear order and constituency</article-title>. <source>Linguist. Inq.</source> <volume>34</volume>, <fpage>37</fpage>&#x02013;<lpage>90</lpage>. <pub-id pub-id-type="doi">10.1162/002438903763255922</pub-id></citation></ref>
<ref id="B32">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Poeppel</surname> <given-names>D.</given-names></name> <name><surname>Idsardi</surname> <given-names>W. J.</given-names></name> <name><surname>van Wassenhove</surname> <given-names>V.</given-names></name></person-group> (<year>2008</year>). <article-title>Speech perception at the interface of neurobiology and linguistics</article-title>. <source>Philos. Trans. R. Soc. B Biol. Sci.</source> <volume>363</volume>, <fpage>1071</fpage>&#x02013;<lpage>1086</lpage>. <pub-id pub-id-type="doi">10.1098/rstb.2007.2160</pub-id><pub-id pub-id-type="pmid">17890189</pub-id></citation></ref>
<ref id="B33">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sanders</surname> <given-names>L. D.</given-names></name> <name><surname>Newport</surname> <given-names>E. L.</given-names></name> <name><surname>Neville</surname> <given-names>H. J.</given-names></name></person-group> (<year>2002</year>). <article-title>Segmenting nonsense: an event-related potential index of perceived onsets in continuous speech</article-title>. <source>Nat. Neurosci.</source> <volume>5</volume>, <fpage>700</fpage>&#x02013;<lpage>703</lpage>. <pub-id pub-id-type="doi">10.1038/nn873</pub-id><pub-id pub-id-type="pmid">12068301</pub-id></citation></ref>
<ref id="B34">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Steinhauer</surname> <given-names>K.</given-names></name> <name><surname>Alter</surname> <given-names>K.</given-names></name> <name><surname>Friederici</surname> <given-names>A. D.</given-names></name></person-group> (<year>1999</year>). <article-title>Brain potentials indicate immediate use of prosodic cues in natural speech processing</article-title>. <source>Nat. Neurosci.</source> <volume>2</volume>, <fpage>191</fpage>&#x02013;<lpage>196</lpage>. <pub-id pub-id-type="doi">10.1038/5757</pub-id><pub-id pub-id-type="pmid">10195205</pub-id></citation></ref>
<ref id="B35">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Townsend</surname> <given-names>D. J.</given-names></name> <name><surname>Bever</surname> <given-names>T. G.</given-names></name></person-group> (<year>2001</year>). <source>Sentence Comprehension: The Integration of Habits and Rules</source>. <publisher-loc>Cambridge, MA</publisher-loc>: <publisher-name>MIT Press</publisher-name>.</citation></ref>
<ref id="B36">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>X.</given-names></name> <name><surname>Wang</surname> <given-names>K.</given-names></name> <name><surname>Shamma</surname> <given-names>S. A.</given-names></name></person-group> (<year>1992</year>). <article-title>Auditory representations of acoustic signals</article-title>. <source>IEEE Trans. Inf. Theory</source> <volume>38</volume>, <fpage>824</fpage>&#x02013;<lpage>839</lpage>. <pub-id pub-id-type="doi">10.1109/18.119739</pub-id></citation></ref>
</ref-list>
<fn-group>
<fn fn-type="financial-disclosure"><p><bold>Funding.</bold> This work was supported by the National Natural Science Foundation of China (grant 31500873 to ND), the Zhejiang Provincial Natural Science Foundation of China (grant LR16C090002 to ND), the Fundamental Research Funds for the Central Universities (ND), and research funding from the State Key Laboratory of Industrial Control Technology, Zhejiang University (ND).</p>
</fn>
</fn-group>
</back>
</article>
