<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Psychol.</journal-id>
<journal-title>Frontiers in Psychology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Psychol.</abbrev-journal-title>
<issn pub-type="epub">1664-1078</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpsyg.2025.1528821</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Psychology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>The processing of familiar English L2 phrasal verbs in neutral and biased sentence contexts</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Yu</surname> <given-names>Jianyao</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2555401/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Siya</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2923189/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Zhang</surname> <given-names>Ping</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Chen</surname> <given-names>Tai&#x2019;an</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>School of Foreign Studies, South China Normal University</institution>, <addr-line>Guangzhou</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>Guangdong Center for Language Cognition and Assessment</institution>, <addr-line>Guangzhou</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>Cheng Yi Middle School</institution>, <addr-line>Xiamen</addr-line>, <country>China</country></aff>
<aff id="aff4"><sup>4</sup><institution>School of Foreign Languages, Soochow University</institution>, <addr-line>Suzhou</addr-line>, <country>China</country></aff>
<aff id="aff5"><sup>5</sup><institution>Maoming School Affiliated to Guangdong Experimental High School</institution>, <addr-line>Maoming</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by" id="fn0004">
<p>Edited by: Rui Li, Hunan University, Changsha, China</p>
</fn>
<fn fn-type="edited-by" id="fn0005">
<p>Reviewed by: Tingzhu Chen, Shanghai Jiao Tong University, China</p>
<p>Wenshuo Chang, Shanghai International Studies University, China</p>
</fn>
<corresp id="c001">&#x002A;Correspondence: Ping Zhang, <email>blacrose@163.com</email>;<email>blacrosezhang@suda.edu.cn</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>05</day>
<month>06</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>16</volume>
<elocation-id>1528821</elocation-id>
<history>
<date date-type="received">
<day>15</day>
<month>11</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>02</day>
<month>05</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2025 Yu, Wang, Zhang and Chen.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Yu, Wang, Zhang and Chen</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>This paper addresses an important psycholinguistic question: whether L2 learners preferentially process phrasal verbs (PVs) literally or figuratively, irrespective of context and proficiency levels. Our primary aim was twofold: first, to investigate how familiar English L2 PVs are processed&#x2014;whether literally or figuratively&#x2014;and secondly, to explore this across different contexts (neutral, literal bias, figurative bias) and proficiency levels among learners. Drawing on existing literature, we tentatively hypothesized that while learners might activate literal meanings early in processing, figurative activation could dominate later stages as far as familiar PVs are concerned. Familiarity with PVs may be critical across proficiency levels in driving PV processing. What&#x2019;s more, the preferred meaning may be bootstrapped in supporting context, but the less preferred meaning is likely suppressed even with context boost. To achieve these objectives, an eye-tracking experiment was conducted with intermediate and advanced Chinese English L2 learners. Participants read context sentences containing PVs followed by a visual word search task to assess PV meaning activation at early, late and further delayed stages. Statistic analysis revealed that no consistent interpretation of PVs as literal or figurative in the time course emerged. However, in sentence reading, we observed faster late meaning activation in both literal and figurative contexts than in the neutral context, and delayed preference for figurative interpretation in the post-PV region. Meanwhile, in visual word search task, meaning activation was context-dependent and fluctuated over time, indicating temporal dynamics in processing. Last but not least, proficiency ranging from intermediate to advanced levels did not significantly impact processing when PV familiarity was achieved. Our findings suggest that teaching strategies should focus on enhancing learners&#x2019; ability to recognize figurative meanings. This approach could improve reading comprehension by promoting learner awareness of PVs as whole lexical units. In conclusion, this study enhances our understanding the mechanisms underlying L2 PV processing dynamics and provides actionable insights for language acquisition strategies, thus contributing valuable knowledge to the field of second language processing and learning.</p>
</abstract>
<kwd-group>
<kwd>familiar phrasal verbs</kwd>
<kwd>eye-tracking</kwd>
<kwd>preferential meaning activation</kwd>
<kwd>context effect</kwd>
<kwd>proficiency effect</kwd>
</kwd-group>
<counts>
<fig-count count="5"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="77"/>
<page-count count="16"/>
<word-count count="13852"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Psychology of Language</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<title>Introduction</title>
<p>Recent decades of psycholinguistic research has underscored the importance of focusing on multiword unit processing and acquisition (<xref ref-type="bibr" rid="ref3">Arnon and Snider, 2010</xref>; <xref ref-type="bibr" rid="ref29">Jiang and Siyanova-Chanturia, 2023</xref>; <xref ref-type="bibr" rid="ref30">Jolsvai et al., 2020</xref>; <xref ref-type="bibr" rid="ref74">Wray, 2002</xref>). As one type of multiword unit, phrasal verbs (PVs) have been under-researched due to their complex nature with regard to their syntactic and semantic aspects (<xref ref-type="bibr" rid="ref72">Wisintainer and Mota, 2018</xref>).</p>
<p>PVs abound in the English language (<xref ref-type="bibr" rid="ref9002">Gardner and Davies, 2007</xref>) and challenge L2 English learners because of their complex nature (<xref ref-type="bibr" rid="ref55">Side, 1990</xref>). Previous research focused more on L2 PV learning, learner difficulty in using PVs and their avoidance behavior (e.g., <xref ref-type="bibr" rid="ref18">Dagut and Laufer, 1985</xref>; <xref ref-type="bibr" rid="ref34">Liao and Fukuya, 2004</xref>; <xref ref-type="bibr" rid="ref58">Siyanova-Chanturia and Schmitt, 2007</xref>; <xref ref-type="bibr" rid="ref79">Zhang and Chen, 2019</xref>). What remains underexplored about PVs is how L2 learners process PVs, which is important to facilitate our understanding of whether L2 learners employ similar underlying cognitive mechanism in processing PVs as in dealing with idioms (typical multiword units). Increasingly more research supports treating idioms both figuratively as holistic lexical units and literally as strings of individual words in figurative language comprehension (<xref ref-type="bibr" rid="ref77">Yi and Zhong, 2023</xref>). We join in this theoretic discussion by testing this dual approach on PVs.</p>
<p>In this study, we aim to conceptually replicate <xref ref-type="bibr" rid="ref69">Wang et al. (2016)</xref>, investigating how intermediate and advanced Chinese learners of English process familiar L2 phrasal verb (PV) constructions in neutral, literally biased, and figuratively biased sentence contexts. Our investigation is two-staged: tracking eye movements in both PV and post-PV noun phrase regions in sentence reading, and following it with a visual word search task to examine further delayed PV processing effects. The findings from this study could provide insights into improving PV comprehension by helping learners understand the importance of knowing opaque figurative meanings.</p>
</sec>
<sec id="sec2">
<title>Theoretical background</title>
<sec id="sec3">
<title>Figurative language processing models and related influencing factors</title>
<p>The study of figurative language processing has been marked by the debate surrounding how figurative and literal meanings are processed during idiom comprehension. Currently the more widely accepted approach to figurative language processing is the hybrid model. According to this view, idioms are processed as both single lexical units and phrases composed of individual words, with both figurative and literal meanings being activated simultaneously (<xref ref-type="bibr" rid="ref6">Beck and Weber, 2016</xref>; <xref ref-type="bibr" rid="ref77">Yi and Zhong, 2023</xref>). However, the activation of these meanings is not necessarily sequential, beginning with literal interpretation. The graded salience hypothesis in this approach proposes that it&#x2019;s a graded process where more salient meanings (e.g., conventional, frequent, familiar) are preferentially processed over less salient ones (<xref ref-type="bibr" rid="ref21">Giora, 1997</xref>, <xref ref-type="bibr" rid="ref22">1999</xref>, <xref ref-type="bibr" rid="ref23">2002</xref>). In accordance with graded salience hypothesis, familiar meanings - whether literal or figurative - are more accessible and salient for speakers/hearers. This means that figurative meanings can be easily accessed for familiar idioms, while literal meanings serve as the default interpretation for unfamiliar ones.</p>
<p>Building upon the graded salience hypothesis, <xref ref-type="bibr" rid="ref11">Cie&#x015B;licka (2006)</xref> put forward the literal salience resonant hypothesis which offers a unique perspective on L2 idiom processing. Specifically designed to account for comprehension of L2 idioms, it predicts that L2 learners tend to process L2 idioms literally, regardless of context and familiarity. L2 learners supposedly become familiar with individual words before encountering the idioms themselves, which affords literal meanings a more salient status. Empiracal studies from Cieslicka and colleagues supported this hypothesis by showing that L2 learners prefer literal interpretations for idioms (<xref ref-type="bibr" rid="ref12">Cieslicka, 2011</xref>; <xref ref-type="bibr" rid="ref13">Cieslicka and Heredia, 2011</xref>, <xref ref-type="bibr" rid="ref14">2019</xref>; <xref ref-type="bibr" rid="ref15">Cieslicka et al., 2014</xref>).</p>
<p>However, more recent research on the hybrid approach to idiom processing by both L1 and L2 speakers has challenged this hypothesis. For instance, studies have shown that speakers can both access/retrieve figurative meanings and analyze individual words (e.g., <xref ref-type="bibr" rid="ref24">Holsinger, 2013</xref>; <xref ref-type="bibr" rid="ref31">Kessler et al., 2020</xref>; <xref ref-type="bibr" rid="ref66">van Ginkel and Dijkstra, 2020</xref>). This raises questions about the extension of literal salience resonant hypothesis to L2 learners&#x2019; processing of idioms and phrasal verbs.</p>
<p>Other research illuminates more complexities involved in idiom processing by focusing more on the factors influencing literal or figurative interpretation. Familiarity (subjective frequency) has been deemed as the primary predictor of figurative interpretation of idioms and also an index of ease of direct retrieval of figurative meanings (<xref ref-type="bibr" rid="ref10">Carrol and Littlemore, 2020</xref>; <xref ref-type="bibr" rid="ref35">Libben and Titone, 2008</xref>; <xref ref-type="bibr" rid="ref54">Schweigert and Moates, 1988</xref>; <xref ref-type="bibr" rid="ref65">Titone and Libben, 2014</xref>). Studies by <xref ref-type="bibr" rid="ref35">Libben and Titone (2008)</xref> and <xref ref-type="bibr" rid="ref64">Titone and Connine (1999)</xref>, among others, have highlighted the impact of familiarity with idioms on meaningfulness judgments. Participants are more likely to process an idiom as figurative if they possess knowledge about its intended non-literal interpretation. One cannot expect participants to consider the figurative meaning of an expression if they do not know the said meaning (<xref ref-type="bibr" rid="ref24">Holsinger, 2013</xref>). <xref ref-type="bibr" rid="ref54">Schweigert and Moates (1988)</xref> suggest that without idiom knowledge, participants may default to literal interpretations regardless of their proficiency level. <xref ref-type="bibr" rid="ref32">Kim (2016)</xref> emphasizes that when dealing with less well-known or unfamiliar idioms, even proficient L2 learners may misconstrue such idioms as literal due to their deceptive transparency. Such findings highlight the necessity to include tasks to ascertain the actual familiarity with the figurative language in question before assessing whether literal or figurative meanings of idioms are processed preferentially.</p>
<p>In addition to familiarity, other factors such as transparency/compositionality and predictability also influence idiom processing (<xref ref-type="bibr" rid="ref35">Libben and Titone, 2008</xref>; <xref ref-type="bibr" rid="ref64">Titone and Connine, 1999</xref>). These factors may interact in modulating idiom processing at different time points. For example, transparency/decomposability only influences meaningfulness judgments if idioms are less familiar (<xref ref-type="bibr" rid="ref35">Libben and Titone, 2008</xref>). Idiom literality also plays a role in idiom processing. Idiom recognition may come earlier with greater idiom familiarity but later with higher literality of an idiom (<xref ref-type="bibr" rid="ref43">Morid et al., 2021</xref>; <xref ref-type="bibr" rid="ref65">Titone and Libben, 2014</xref>). Furthermore, context weighs in the process by either promoting or suppressing figurative interpretation. For instance, there is speedy figurative processing of high-familiarity idioms in figuratively biased contexts and literal processing of low-familiarity idioms in literally biased contexts (<xref ref-type="bibr" rid="ref70">Wang et al., 2021</xref>). There is also interaction between biasing context and idiom literality. For example, supporting literal or figurative context strengthens the biased meaning interpretation for high-literality idioms (e.g., &#x201C;<italic>at the end of the day</italic>&#x201D;), but there is a cost of incongruent meaning resolution; meanwhile, for low-literality idioms (e.g., &#x201C;<italic>in the seventh heaven</italic>&#x201D;), literal interpretation carries a cost regardless of literal or figurative context (<xref ref-type="bibr" rid="ref7">Beck and Weber, 2020</xref>). To sum up, such factors as familiarity, transparency, and context bias should all be considered in further research into L1 figurative language processing.</p>
<p>Research has shown that the above factors also influence L2 idiom processing. Familiarity plays a critical role in determining how learners process idioms (<xref ref-type="bibr" rid="ref81">Zhou and Zhang, 2011</xref>). <xref ref-type="bibr" rid="ref0040">Titone et al. (2015)</xref> study found that both direct retrieval and compositional analysis are involved in L2 idiom processing. In particular<xref ref-type="bibr" rid="ref81">Zhou and Zhang (2011)</xref> experiment demonstrated the importance of familiarity with L2 idioms. They presented Chinese learners of English with neutral or figuratively biased contexts with idioms embedded, then the participants were required to fill in literal and figurative associate words. The results showed that when processing familiar idioms, both higher-level and lower-level learners preferred figurative meaning interpretation of the idioms in both neutral and figuratively biased contexts. In contrast, when processing unknown idioms, the proficiency effect emerged: While both levels of learners favored literal meanings in neutral contexts, they differed in their interpretation of idioms in figuratively biased contexts. Higher-level learners opted for figurative meanings, whereas lower-level learners preferred literal meanings (<xref ref-type="bibr" rid="ref81">Zhou and Zhang, 2011</xref>). These findings contradict Cieslicka&#x2019;s hypothesis that L2 speakers always prefer the literal meaning and instead support Giora&#x2019;s graded salience hypothesis (<xref ref-type="bibr" rid="ref22">Giora, 1999</xref>) by evidencing familiarity effect.</p>
<p>In short, the analyses of the influencing factors on figurative language processing provide new insights for further study to uncover the underlying processes involved in PV interpretation in context across varying L2 proficiency levels.</p>
</sec>
<sec id="sec4">
<title>Previous research on phrasal verb processing</title>
<p>Phrasal verbs (PVs) are verb particle combinations syntacally (<xref ref-type="bibr" rid="ref9001">Cappelle et al., 2010</xref>; <xref ref-type="bibr" rid="ref9005">Richards and Schmidt, 2011</xref>). Semantically, PVs have been viewed as lexical units along a continuum (<xref ref-type="bibr" rid="ref18">Dagut and Laufer, 1985</xref>; <xref ref-type="bibr" rid="ref19">Darwin and Gray, 1999</xref>; <xref ref-type="bibr" rid="ref20">Dixon, 1982</xref>; <xref ref-type="bibr" rid="ref45">Palmer, 1974</xref>) with PVs like &#x201C;<italic>walk in</italic>&#x201D; (whose meaning is transparent) and &#x201C;<italic>give up</italic>&#x201D; (which has an opaque figurative sense only) at the two ends of this continuum. In terms of <xref ref-type="bibr" rid="ref9001">Cappelle et al. (2010)</xref>, the PVs at the two opposite ends are literal and figurative PVs. Many PVs along this continuum have figurative meanings and are also literally plausible (of high litreality), such as &#x201C;<italic>run into [encounter] someone</italic>&#x201D; or &#x201C;<italic>run into [enter] a room</italic>.&#x201D; To test whether L2 learners process PVs literally or figuratively, this study focuses on these PVs which are both literally and figuratively plausible (e.g., <italic>run into</italic>).</p>
<p>Researchers have considered idiom processing models applicable to L2 PV processing (e.g., <xref ref-type="bibr" rid="ref9">Carrol and Conklin, 2020</xref>; <xref ref-type="bibr" rid="ref18">Dagut and Laufer, 1985</xref>; <xref ref-type="bibr" rid="ref57">Siyanova-Chanturia and Martinez, 2014</xref>), given the formulaic similarities between idioms and PVs (<xref ref-type="bibr" rid="ref74">Wray, 2002</xref>). However, studies on PV processing are limited in number. Preference for figurative processing of PVs was found with L2 learners in several studies (<xref ref-type="bibr" rid="ref8">Blais and Gonnermn, 2013</xref>; <xref ref-type="bibr" rid="ref40">Matlock and Heredia, 2002</xref>; <xref ref-type="bibr" rid="ref47">Paulmann et al., 2015</xref>). For instance, Matlock and Heredia&#x2019;s study (2002) found that advanced early bilinguals processed figurative meanings for PVs similarly to native speakers, whereas lower-level late bilinguals relied more heavily on literal interpretations. This suggests that L2 proficiency may influence the way learners process PVs. The study by Matlock and Heredia provides valuable insights into how L2 learners process PVs, but it has several limitations that can be addressed in future research. One limitation is the reliance on self-paced reading tasks on the sentence level, which may not provide precise information about how learners engage with the PV within a sentence (<xref ref-type="bibr" rid="ref8">Blais and Gonnermn, 2013</xref>). Another limitation is the lack of control for PV familiarity among participants, as prior exposure to a PV could influence processing. Additionally, the study did not account for PV transparency levels or syntactical complexity of sentences where PVs were embedded, which may impact figurative or literal interpretations. Furthermore, contextual cues such as sentence topic and surrounding discourse were not controlled for, which could also affect learners&#x2019; preference for figurative interpretation.</p>
<p>The study by <xref ref-type="bibr" rid="ref47">Paulmann et al. (2015)</xref> also found that both upper-intermediate-to-advanced L2 learner group and native L1 speakers showed similar preference for figurative meanings when reading PVs, such as &#x201C;<italic>run over</italic>&#x201D; meaning <italic>to kill someone</italic>. This was evident from the event-related potential (ERP) data, which indicated smaller N400 component for the following noun phrase allowing for figurative meaning (e.g., <italic>the old man</italic>) than the one allowing for literal meaning (e.g., <italic>the old bridge</italic>). However, there are some limitations to this study that should be considered: Firstly, the study only included one group of L2 learners compared to a native speaker group, leaving it unclear whether these findings would generalize to lower-proficiency L2 learners. Future research could benefit from including different proficiency levels to examine potential differences in idiomatic interpretation. Secondly, the study only examined the ERP components for paired nouns after reading the same PV. Future research could benefit from examining the effect of prior literally or figuratively biasing context on the same PV plus the same noun phrase (e.g., <italic>Peter was looking around for Black Friday deals. So Peter ran into Zara on Oxford Street</italic> vs. <italic>Peter had not seen Zara for years. Then Peter ran into Zara on Oxford Street</italic> in which Zara is likely to be interpreted as a chain store in one situation or a friend in the other situation). This would allow researchers to better isolate the effect of prior biasing context and gain insights into how L2 learners process PVs in different contexts.</p>
<p>Evidence from <xref ref-type="bibr" rid="ref8">Blais and Gonnermn (2013)</xref> suggests that advanced L2 speakers may process phrasal verbs in a manner similar to native speakers. In their study, researchers used a masked priming task to explore automatic activation patterns for figurative meanings in L2 speakers&#x2019; mental lexicon. The results showed that high-proficiency L2 speakers exhibited response latencies similar to those of native speakers when processing transparent and opaque phrasal verbs. Specifically, the study found that transparent PVs (e.g., &#x201C;finish up&#x201D;) produced greater priming on their component verbs (e.g., &#x201C;finish&#x201D;) than opaque PVs (e.g., &#x201C;chew out&#x201D;) did on theirs (e.g., &#x201C;chew&#x201D;). This suggests that L2 speakers with higher proficiency are sensitive to the figurative phrasal verbs, which can cause a delay in processing. In contrast, lower-proficiency L2 learners showed no response difference between transparent and opaque PVs. The study&#x2019;s findings suggest that L2 proficiency plays a role in phrasal verb processing. However, it is essential to note that this experiment only tapped into the priming effect of different types of PVs on their component verbs out of context. Additionally, similar to <xref ref-type="bibr" rid="ref47">Paulmann et al. (2015)</xref> research, the study did not assess learners&#x2019; familiarity with PVs&#x2019; opaque meanings at either proficiency level.</p>
<p>In contrast to the studies in favor of preferential figurative processing, other PV processing studies support opposite primary literal activation in both L1 and L2. <xref ref-type="bibr" rid="ref25">Holsinger and Kaiser (2013)</xref> found that native speakers tend toward default literal processing of phrasal verbs. In their self-paced reading task, participants were presented with ambiguous PVs that could be interpreted in either a literal or idiomatic sense (e.g., <italic>dig into the tomb/sandwich</italic>). The study&#x2019;s design relied on creating semantic contradictions between the prior biasing context and the disambiguation context following the PV (e.g., <italic>The daring archaeologist/hungry waitress who had been working all day dug into the sandwich/tomb just after noon on Sunday.</italic>). The findings suggest that native speakers may prioritize literal meanings over figurative ones, which could be more attributed to the complex contextual semantic contradiction. It is unclear whether this tendency would also apply to L2 learners, who might have uneven level of familiarity with idiomatic senses of PVs. Additionally, it&#x2019;s worth noting that <xref ref-type="bibr" rid="ref25">Holsinger and Kaiser (2013)</xref> did not control for PV transparency, which could have impacted their findings.</p>
<p><xref ref-type="bibr" rid="ref69">Wang et al. (2016)</xref> study with L2 learners further supports the idea that phrasal verbs may be processed primarily literally. In their visual word search eye-tracking experiment, intermediate and advanced English L2 learner groups were presented with either literally or figuratively biased context sentences containing a PV in each sentence, and then had to choose one of the four probe words (literally or figuratively related words, and two unrelated control words). The results from the eye fixation data on the probe words showed an overall reliance on literal meaning activation at both proficiency levels in the task. Besides, L2 learners spent more time considering context-biased literal or figurative meanings, and there was also an L2 proficiency effect in the activation of figurative meanings in the literally biased context, with only the advanced group showing figurative activation in spite of the literal bias. The strength of this study is its control for familiarity with both literal and figurative meanings, which was lacking in previous PV studies. However, the use of visual word search eye-tracking measures only allowed the researchers to examine L2 learners&#x2019; delayed cognitive processes of PV interpretation, which they confused for online PV processing. Besides, it&#x2019;s also worth noting that there was no neutral baseline context for comparison and the total fixation time proportion analysis used in Wang <italic>et al.</italic>&#x2019;s study may not have captured finer-grained temporal dynamics as demonstrated in <xref ref-type="bibr" rid="ref24">Holsinger (2013)</xref>. This limitation highlights the importance of updating statistical analytical approaches when examining language processing patterns (see the next Section below).</p>
<p>To sum up, the current status quo of phrasal verb (PV) processing research presents several unanswered questions. For instance, do all non-native English speakers process PVs literally? Do they tend to interpret PVs figuratively or literally in contexts that are biased toward literal or figurative meanings? Additionally, is there a consistent pattern in the time course of meaning processing? The discrepancies between studies such as <xref ref-type="bibr" rid="ref69">Wang et al. (2016)</xref> and <xref ref-type="bibr" rid="ref47">Paulmann et al. (2015)</xref> highlight the complexity of how non-native English speakers process PVs figuratively versus literally. While the different studies have examined individual factors like transparency, context biasing, level of familiarity or language proficiency in isolation, future research should aim to consider these variables simultaneously within a single experimental framework in light of the findings about the complexities involved in idiomatic/figurative language processing (See the previous Section). To achieve this multifaceted understanding, researchers could manipulate contextual biases and examine how prior contexts influence subsequent PV interpretations. Moreover, it is essential to control for the figurative meaning familiarity of target PVs, as previous studies have shown that non-native speakers tend to misconstrue less well-known idiomatic expressions as literal due to their deceptive transparency (<xref ref-type="bibr" rid="ref32">Kim, 2016</xref>). Furthermore, given the intertwined nature of familiarity and proficiency effects in idiom comprehension (<xref ref-type="bibr" rid="ref81">Zhou and Zhang, 2011</xref>), future research should strive to disentangle these joint effects on non-native speakers&#x2019; processing of PVs. By addressing these gaps in our understanding, we can contribute to developing models of phrasal verb processing across L2 proficiency levels.</p>
</sec>
<sec id="sec5">
<title>Related research using visual word search eye-tracking paradigm</title>
<p>Eye-tracking allows us to gain insights into the real-time consideration of literal and idiomatic interpretations over the time course of sentence comprehension without the need for predetermined time-point selections. The visual word search (VWS) paradigm in particular has been adapted to investigate the processing of figurative language, such as idioms and phrasal verbs. By measuring gaze patterns across different regions of interest on the display, this method captures the temporal dynamics of comprehension through changes in eye movement focus. Operationally, participants&#x2019; consideration of literal or figurative meaning in VWS is assessed by analyzing the proportion of eye fixations directed toward literal versus figurative related probe words compared to their respective distractor words. Higher proportions of looks indicate a greater degree of attention to and consideration of that particular meaning.</p>
<p>The listen-and-look visual word search paradigm involves listening to spoken information while viewing visual probe words on display (<xref ref-type="bibr" rid="ref41">McQueen and Viebahn, 2007</xref>). A read-only variant of the paradigm is to read a sentence before viewing the visual probe words (<xref ref-type="bibr" rid="ref24">Holsinger, 2013</xref>). By examining how participants&#x2019; eyes move between semantically related words, and unrelated control words in the same grid, we can gain insights into whether individuals are relying more heavily on lexical recognition of PVs or performing word-by-word syntactic analysis.</p>
<p>Observable eye movements in response to a target word are often within the 1,000-ms time window from the target word onset (<xref ref-type="bibr" rid="ref1">Allopenna et al., 1998</xref>; <xref ref-type="bibr" rid="ref76">Yee and Sedivy, 2006</xref>). Moreover, according to <xref ref-type="bibr" rid="ref28">Ito and Knoeferle (2023)</xref>, a more rigorous approach to statistical analysis is to count fixations in very fine time bins (e.g., 20-, 50- or 100-ms interest period), then partition the bins into wider time windows (e.g., 400&#x202F;ms) and observe the looks proportion in each time window. Moreover, for interest period (time bins) shorter than 100&#x202F;ms, eye fixation &#x201C;yes/no&#x201D; data are binomially distributed and can be transformed into binary (1, 0) data. Analyzing binary gaze data at multiple time points (for example in 20-ms bins), rather than relying on single measures such as fixation durations or total numbers of fixations helps to account for heteroscedasticity (variation in the variance of fixation durations), improve the sensitivity of statistical analysis and reduce Type II errors. However potential problems with multiple testing in 20-ms bins could lead to an increase in false significant results. To reduce the likelihood of spurious significance, eye movement data should be averaged over larger time windows (e.g., of 400&#x202F;ms) (<xref ref-type="bibr" rid="ref28">Ito and Knoeferle, 2023</xref>).</p>
<p>It was along these lines that <xref ref-type="bibr" rid="ref24">Holsinger (2013)</xref> converted gaze sampling data in his listen-and-look visual word search eye tracking task into binary data and divided them between early and late time windows (180&#x2013;580&#x202F;ms,<xref ref-type="fn" rid="fn0001"><sup>1</sup></xref> 580&#x2013;980&#x202F;ms). He investigated how native speakers process idioms in neutral, literally-biased, and figuratively-biased contexts (e.g., <italic>kicked the bucket</italic>), obtaining the fixation count proportions and the order in which the native speaker participants fixated on a set of four visual probe words presented simultaneously with the onset of the auditory idiom embedded in sentence. His findings showed that, in unbiased conditions, participants initially preferred looking at literal associates before experiencing attention competition between figurative and literal associate words later on. In literally biased contexts, looks to literal associates were significantly higher than looks to unrelated control words in both time windows, while in figuratively biased contexts there was only early consideration of literal meanings as measured by higher looks proportions. The time-course statistical analysis of L1 idiomatic processing mechanisms provides a useful frame of reference for our study of L2 PV processing.</p>
<p>In contrast to <xref ref-type="bibr" rid="ref24">Holsinger (2013)</xref> study, the experimental paradigm adopted by <xref ref-type="bibr" rid="ref69">Wang et al. (2016)</xref> was a read-only visual word search variant (see the previous section), but relied only on the proportions of total interest area reading/dwell time for the probe words (e.g., 4,000&#x202F;ms, much longer than the usual 1,000-ms observation window) to make statistical analysis, and were unable to account for the heteroscedasticity of the total reading time. Another limitation is that they did not provide information on early online processing of phrasal verbs but instead relied solely on total reading time analysis for probe words. In this approach they quickly drew an unsupported conclusion about early activation of literal meanings for the phrasal verbs at the earlier stage of sentence reading. Therefore, to further examine the time-course changes in meaning activation, it is necessary to observe not only the participants&#x2019; fixations to probe words, but also fixation data during earlier sentence reading.</p>
<p>Further research should aim to improve upon these limitations by focusing on the timing and order of literal and figurative meaning consideration while employing more robust statistical analyses. By doing so, researchers can gain a better understanding of nuanced temporal patterns in PV processing by L2 learners of different proficiency levels.</p>
</sec>
</sec>
<sec id="sec6">
<title>The present study</title>
<p>The present study replicates <xref ref-type="bibr" rid="ref69">Wang et al. (2016)</xref> by employing the same read-only visual word search paradigm but followed the statistical analysis approach in <xref ref-type="bibr" rid="ref24">Holsinger (2013)</xref>. Specifically, this study investigates how Chinese learners of English at intermediate and advanced proficiency levels process familiar PVs with similarly high literal and figurative meaning familiarity ratings but significantly different literal and figurative transparency ratings. The goal is to examine whether distinct proficiency groups of L2 learners give PVs a literal interpretation in preference to a figurative interpretation in literally biased, figuratively biased, and neutral unbiasing prior contexts.</p>
<sec id="sec7">
<title>Research questions</title>
<p>Based on our review of previous studies, we address two research questions as follows:</p>
<list list-type="order">
<list-item>
<p>Do learners show continuous preference for activating either literal or figurative meanings across different contexts at both early sentence reading stage and late visual probe word search stage when PVs have equivalent familiarity ratings?</p>
</list-item>
<list-item>
<p>Does L2 English proficiency affect the processing order or activation strength in interpreting PV meanings at both early sentence reading stage and late visual probe word search stage when PVs have equivalent familiarity ratings?</p>
</list-item>
</list>
<p>Competing meaning activation models present us a challenging task to predict either literal or figurative meaning activation in figurative language processing. Giora&#x2019;s graded salience hypothesis, when applied to L2 learners who are familiar with figurative language, suggests that they should activate meanings figuratively regardless of context. However, context itself, as a driving factor in achieving salience effect, is known to influence whether interpretations lean toward literal or figurative meanings based on the context provided. Empirical studies indicate that even highly competent L1 speakers may find themselves activating literal meanings for familiar figurative language in figuratively biased contexts during early stages of online processing.</p>
<p>According to the literal salience resonant model, which applies specifically to L2 learners, literal meaning should be superior and preferred over figurative meaning when processing a familiar PV regardless of context. This implies that literal interpretations should take precedence irrespective of how a PV is presented or used. For bilinguals with a less proficicent L2 at least, literal meanings are more salient and therefore literal activation should be obligatory throughout the time-course of processing as shown in lexical decision tasks immediately at sentence offset, 300&#x202F;ms, or 800&#x202F;ms after sentence offset (<xref ref-type="bibr" rid="ref13">Cieslicka and Heredia, 2011</xref>). Nonetheless, research by <xref ref-type="bibr" rid="ref47">Paulmann et al. (2015)</xref>, along with other studies, reveals that proficient L2 learners may exhibit similarities to native speakers in their default preference for early figurative processing. These findings suggest a more nuanced understanding instead of an absolute either/or choice between literal and figurative meanings during activation.</p>
<p>Therefore, we tentatively suggest that L2 learners, in dealing with familiar PVs, may initially activate the literal meaning like L1 speakers before preferred figurative interpretations become dominant as online processing continues. Additionally, we also expect that context may bootstrap the preferred meaning earlier and more strongly than the less preferred meaning.</p>
<p>The role of L2 proficiency in processing figurative vocabulary (PVs) is less straightforward than previously thought. Previous studies suggest that only advanced learners exhibit a figurative advantage when interpreting PVs. However, when item familiarity is controlled for, even lower-proficiency learners tend to activate figurative meanings of highly familiar idioms during explicit tasks like blank-filling semantically related words. These findings challenge the literal salience resonant hypothesis by revealing that lower proficiency learners still prefer figurative interpretations of familiar idioms. This suggests that intermediate and advanced L2 learners may exhibit similar tendencies when processing such idioms, even if their proficiency levels vary. Further research is needed to determine whether this figurative preference holds for PVs over time during real-time interpretation in sentence-level reading and succeeding probe word reading.</p>
<p>The previous research pointed to two opposite directions. Therefore, we did not have a definitive hypothesis. We explored whether it would happen as we tentatively suggested. Statistically, Hypothesis<sub>0</sub> was: there would be no meaning activation preference for target items (PVs, post-PV noun phrases, or probe words) across contexts and proficiency levels. The alternative hypothesis was: there would be meaning activation preference across contexts and proficiency levels.</p>
</sec>
</sec>
<sec id="sec8">
<title>Experiment method</title>
<sec id="sec9">
<title>Participants</title>
<p>A statistical power analysis based on a pilot test with 27 participants homogeneous to students in the main experiment and the same materials as in the main experiment showed that to obtain the sufficient statistical power of 0.8, we should have a sample size of 80 participants.</p>
<p>Participants were recruited from South China Normal University, with all being native Chinese speakers who had no prior experience studying or living in English-speaking countries. A total of 99 students participated in the main experiment, receiving a payment of 40 RMB each as an incentive for their involvement.</p>
<p>The intermediate group comprised 51 sophomore students majoring in English (who were pre-TEM-4 but all passed TEM-4<xref ref-type="fn" rid="fn0002"><sup>2</sup></xref> the next semester). The advanced group consisted of 48 English graduate students who had already passed TEM-8. A significant age difference was found between proficiency groups (<italic>M</italic><sub><italic>intermediat</italic>e</sub>&#x202F;=&#x202F;19.44, <italic>SD</italic>&#x202F;=&#x202F;0.87, <italic>M<sub>advanced</sub></italic>&#x202F;=&#x202F;23.17, <italic>SD</italic>&#x202F;=&#x202F;1.19; <italic>t</italic>&#x202F;=&#x202F;17.13, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001, <italic>Cohen&#x2019;s d</italic>&#x202F;=&#x202F;3.56).</p>
<p>To ensure a clear distinction between intermediate and advanced levels, we excluded students who had exceptionally high scores on TEM-4 (above 90 out of 100). Participants&#x2019; vocabulary sizes were measured using the Vocabulary Size Test (VST) (<xref ref-type="bibr" rid="ref44">Nation and Beglar, 2007</xref>) as vocabulary knowledge has often been used to indicate proficiency in studies on L2 formulaic language processing (e.g., <xref ref-type="bibr" rid="ref42">Milton, 2010</xref>; <xref ref-type="bibr" rid="ref59">Sonbul et al., 2020</xref>; <xref ref-type="bibr" rid="ref73">Wolter and Yamashita, 2018</xref>). The results showed a significant difference between groups in terms of vocabulary size (<italic>M<sub>intermediate</sub></italic>&#x202F;=&#x202F;56.29, <italic>SD</italic>&#x202F;=&#x202F;8.59, <italic>M<sub>advanced</sub></italic>&#x202F;=&#x202F;88.13, <italic>SD</italic>&#x202F;=&#x202F;14.12; <italic>t</italic>&#x202F;=&#x202F;13.29, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001, <italic>Cohen&#x2019;s d</italic>&#x202F;=&#x202F;2.70).</p>
</sec>
<sec id="sec10">
<title>Research materials</title>
<p>The research materials included PVs embedded in context sentences and probe words for visual display.</p>
</sec>
<sec id="sec11">
<title>Item selection</title>
<p>To ensure that even the intermediate participants would be familiar with the PVs used in this study, we started by identifying potential PVs from the TEM-4 syllabus and then screened them based on semantic transparency, transitivity, and COCA frequency. This process eliminated PVs that were not suitable for our purposes.</p>
<p>To confirm the idiomatic/figurative meanings of these PVs, we consulted the Longman Phrasal Verbs Dictionary (<xref ref-type="bibr" rid="ref0050">Pearson Education, 2000</xref>) and checked their literal plausibility in COCA. We also used a stratified sampling method to examine the percentages of selected literal and figurative meanings in a sample of 100 lines for each PV. This process allowed us to exclude two PVs with minimal frequency.</p>
<p>We then invited 24 Chinese sophomore English majors (at the intermediate level) to write out in Chinese the first two meanings that came to mind when they saw each PV. Based on their responses, six PVs whose figurative meanings did not come up for more than half of the participants were removed.</p>
<p>We also asked the same 24 sophomore English majors to rate the familiarity of both literal and figurative meanings on a five-point Likert scale (see <xref ref-type="bibr" rid="ref68">Wang and Koda, 2005</xref>; <xref ref-type="bibr" rid="ref80">Zhang and Wen, 2019</xref>). Six PVs with average familiarity scores below three for their figurative meanings were excluded. The remaining final 13 PVs showed no significant difference in literal and figurative meaning familiarity ratings (<italic>M<sub>literal meaning</sub></italic>&#x202F;=&#x202F;4.06, <italic>SD</italic>&#x202F;=&#x202F;0.58 and <italic>M<sub>figurative meaning</sub></italic>&#x202F;=&#x202F;4.06, <italic>SD</italic>&#x202F;=&#x202F;0.48, <italic>t</italic> (12)&#x202F;=&#x202F;0.03, <italic>p</italic>&#x202F;=&#x202F;0.97, <italic>Cohen&#x2019;s d</italic>&#x202F;=&#x202F;0.01).</p>
<p>To prevent paired items like &#x201C;dig into the tomb/sandwich&#x201D; from contaminating the phrases pool, we carefully selected PVs that did not have obvious metaphoric extensions of their literal meanings. For example, we avoided using verb particles with close meaning similarities between the PV wholes and the component verbs (like &#x201C;dig into&#x201D;), which could blur the boundary between literal and figurative meanings.</p>
<p>To assess the semantic transparency of these PVs, we asked 24 advanced learners to rate the predictability of their literal and figurative meanings on a five-point scale (from completely unpredictable to completely predictable) (refer to <xref ref-type="bibr" rid="ref80">Zhang and Wen, 2019</xref>). The results showed that the figurative meanings were significantly less predictable than the plausible literal meanings for each PV (<italic>M<sub>literal meaning</sub></italic>&#x202F;=&#x202F;4.48, <italic>SD</italic>&#x202F;=&#x202F;0.28 and <italic>M<sub>figurative meaning</sub></italic>&#x202F;=&#x202F;3.21, <italic>SD</italic>&#x202F;=&#x202F;0.37, <italic>t</italic> (12)&#x202F;=&#x202F;11.45, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001, <italic>Cohen&#x2019;s d</italic>&#x202F;=&#x202F;3.18). (refer to <xref ref-type="supplementary-material" rid="SM1">Supplementary material A</xref> for the selected PVs).</p>
</sec>
<sec id="sec12">
<title>Context sentences with literal or figurative bias</title>
<p>To ensure that the PVs were embedded in contexts that would bias interpretations, we designed three types of context sentences: literal, figurative, and neutral. We avoided separable PV structures (e.g., <italic>put the picture up</italic>) to minimize cognitive effort. Besides, we used the same noun phrase after the literal and figurative uses of the same PV [<italic>ran into Zara</italic> (a person) vs. <italic>ran into Zara</italic> (a shop)] so that we would see how the preceding context and the meaning salience of the PV itself would act on the same noun phrase and ensure that the processing difference would not come from the difference between the two noun phrases behind the same PV.</p>
<p>All target sentences (refer to <xref ref-type="supplementary-material" rid="SM2">Supplementary material B</xref>) followed a consistent pattern: &#x201C;subject + PV&#x202F;+&#x202F;noun phrase + adverbial.&#x201D; To ensure that our contexts were adequate for participants&#x2019; intended interpretations of the PVs, we pilot-tested five homogeneous advanced English learners who translated the biased sentences into Chinese. Sentences with 80% or more translations revealing the context-biased interpretation were retained. Neutral contexts were designed to be ambiguous and not to provide cues for either literal or figurative interpretations. Operationally, the same five people were first required to write down possible anticipanted meaning of the prior sentence and then compare the meaning with literal and figurative meanings of the target PV before deciding if the prior context cued neither meanings.</p>
<p>One example of embedding the same PV in different sentence contexts is shown below.</p>
<list list-type="alpha-upper">
<list-item>
<p>Literal context: When Eva saw the fire burning on the bed, she ran across the house for water.</p>
</list-item>
<list-item>
<p>Figurative context: When Eva was watching birds with a telescope, she ran across the house with big windows.</p>
</list-item>
<list-item>
<p>Neutral context: Who knew what would happen to Eva next. She ran across the house in excitement.</p>
</list-item>
</list>
<p>In this example, we see the PV <italic>ran across</italic> used literally in one context [A] and figuratively in another [B], while the neutral context [C] does not provide cues for either interpretation.</p>
<p>To prevent participants from identifying specific PVs or contexts, we rotated the sentences into three lists. Each list had all 13 PVs in sentences, but each participant read only one list with a unique combination of context conditions. Each list had all the three context conditions in rotation (four PVs in one condition, another four in another condition and the remaining five in the last condition).</p>
<p>To prevent the participants from identifying the purpose of this study, 26 filler sentences were used to mix with the target sentences. We had 13 sentences with idioms, e.g.<italic>, Anna had a cold, so she was feeling under the weather these days</italic>, and 13 sentences with fixed collocations, e.g.<italic>, After Ella had lived in the country, she could not get used to the city life</italic>, as in the study by <xref ref-type="bibr" rid="ref47">Paulmann et al. (2015)</xref>. The filler sentences and experiment sentences were randomized to eliminate trial order effect.</p>
</sec>
<sec id="sec13">
<title>Probe words for visual display</title>
<p>To assess participants&#x2019; interpretation of PVs in the target sentences, we designed a set of four words for each PV to appear in each trial: one literal associate, one figurative associate, and two semantically unrelated control words. The positions of these probe words were fully counterbalanced across trials (<xref ref-type="bibr" rid="ref24">Holsinger, 2013</xref>; <xref ref-type="bibr" rid="ref69">Wang et al., 2016</xref>).</p>
<p>To ensure that the probe words did not influence participants&#x2019; responses through their frequency, orthographic complexity, or length, we matched the two associate words with the two control words on these characteristics (<xref ref-type="bibr" rid="ref11">Cie&#x015B;licka, 2006</xref>). There was only a small difference in word frequency between the four types of probes (<italic>M<sub>lit_related</sub></italic>&#x202F;=&#x202F;249,023, <italic>M<sub>fig_related</sub></italic>&#x202F;=&#x202F;143072.08, <italic>M<sub>lit_ctrl</sub></italic>&#x202F;=&#x202F;120767.69, <italic>M<sub>fig_ctrl</sub></italic>&#x202F;=&#x202F;116226.69; <italic>p</italic>&#x202F;=&#x202F;0.73, <italic>Partial &#x03B7;<sup>2</sup></italic>&#x202F;=&#x202F;0.03, <italic>Cohen&#x2019;s f</italic>&#x202F;=&#x202F;0.16).</p>
<p>However, we noted a significant length difference among the probe words (<italic>M<sub>lit_related</sub></italic>&#x202F;=&#x202F;4.69, <italic>M<sub>fig_related</sub></italic>&#x202F;=&#x202F;6.46, <italic>M<sub>lit_ctrl</sub></italic>&#x202F;=&#x202F;4.62, <italic>M<sub>fig_ctrl</sub></italic>&#x202F;=&#x202F;6.15; <italic>p</italic>&#x202F;=&#x202F;0.002, <italic>Partial &#x03B7;<sup>2</sup></italic>&#x202F;=&#x202F;0.27, <italic>Cohen&#x2019;s f</italic>&#x202F;=&#x202F;0.61). To account for this potential confound, we included word frequency and length as fixed-effect covariate factors in initial R modeling to ensure that these variables did not influence our results. (refer to <xref ref-type="supplementary-material" rid="SM1">Supplementary material A</xref> for the probe word sets).</p>
<p>Here is an example of the visual display for the PV <italic>run after</italic> (<xref ref-type="fig" rid="fig1">Figure 1</xref>).</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Sample visual display for the probe words of <italic>run after</italic>: The above left word <italic>chase</italic> is literally related, the above right word <italic>court</italic> is figuratively related, the below left word <italic>cheat</italic> is literal control word and the below right word <italic>chill</italic> is figurative control word. The positions of the four types of probe words are rotated in the visual word search task.</p>
</caption>
<graphic xlink:href="fpsyg-16-1528821-g001.tif"/>
</fig>
</sec>
</sec>
<sec id="sec14">
<title>Experiment procedure</title>
<p>The experiment stimuli were presented on a computer screen using Experiment Builder software (<xref ref-type="bibr" rid="ref60">SR, 2021</xref>). The screen had a resolution of 1,024&#x202F;&#x00D7;&#x202F;768 pixels, with each region of interest in the four corners occupying approximately 369&#x202F;&#x00D7;&#x202F;248 pixels. Eye movements were tracked using an Eyelink 1,000 Plus tracker at a sampling rate of 1,000&#x202F;Hz. Participants sat 65&#x202F;cm from the screen and rested their chins on a chinrest to minimize head movement.</p>
<p>Before commencing the formal experiment, participants read instructions to ensure they understood the requirements. Eye movements were calibrated and validated to guarantee accurate data recording using a 9-point star calibration followed by five practice trials. If any participant&#x2019;s eye movement deviated during the experiment, it was paused for recalibration and revalidation.</p>
<p>To minimize fatigue effects, participants had the option to request breaks before the next trial, which would be preceded by recalibration and revalidation of their eye tracker. The experiment began with a drift correction at the start of each trial when they focused on the fixation cross to the left of the sentence. Participants then read a context sentence presented in one line on the screen, which should reveal to us potential early and late meaning activation in PV processing. After completing the sentence, they clicked the mouse to proceed, followed by a 500-ms display of a red &#x201C;?&#x201D; question mark at the center of the screen. This was succeeded by the presentation of four probe words in the visual word search task. The visual word search task was designed to explore whether literal activation is also obligatory during two consecutive time windows at the delayed stage of processing after sentence offset as indicated in <xref ref-type="bibr" rid="ref13">Cieslicka and Heredia (2011)</xref>.</p>
<p>Participants were instructed to make meaning-relatedness judgments as quickly and accurately as possible upon seeing the probes. They then clicked on their chosen word with the mouse. After each judgment, the screen went blank for 1,000&#x202F;ms before the next trial began (see <xref ref-type="fig" rid="fig2">Figure 2</xref>). After the experiment, participants were surveyed to confirm their related PV meanings. Each participant rated each PV&#x2019;s figurative meaning using their Chinese translation on a 5-point Likert scale from 1 (totally unfamiliar) to 5 (completely familiar). For example, the PV &#x201C;<italic>run after</italic>&#x201D; was presented together with its Chinese translation &#x8FFD;&#x6C42; (&#x201C;court (girls)&#x201D;). Participants were asked to rate how familiar they felt with the figurative meaning of each PV. The survey results indicated that all data points were relevant and therefore were retained because they demonstrated sufficient familiarity with the figurative meanings of PVs. Ratings ranged from 4 to 5, with an average score of <italic>M</italic>&#x202F;=&#x202F;4.48 and a standard deviation of <italic>SD</italic>&#x202F;=&#x202F;0.37.</p>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>Eye movements experiment procedure.</p>
</caption>
<graphic xlink:href="fpsyg-16-1528821-g002.tif"/>
</fig>
<sec id="sec15">
<title>Data preparation and analysis</title>
<p>Among the 99 participants, six finished the experiment task with the sampling rate accidentally set at 500&#x202F;Hz, different from the normal 1,000&#x202F;Hz. Data of another student was lost due to a computer hardware memory problem. Data from the other 92 students were valid for statistical analysis.</p>
<p>Regarding sentence reading, we concentrated early-measure and late-measure analyses on both PVs and the following noun phrases. Phrase-level effects may reflect how a construct is processed as a whole unit, while post-PV regions tend to show delayed processing effects (<xref ref-type="bibr" rid="ref9">Carrol and Conklin, 2020</xref>). For early measures, we used <italic>first fixation duration</italic> (the duration of the first fixation on the focused phrase within a specific interest area) and <italic>first pass reading time</italic> (the duration of all the fixations on the phrase the first time it is encountered in the sentence before gaze exits to the left or right). These metrics capture initial processes like familiarity checks, access to orthographical/phonological information and lexical meaning, and early information integration. For late measures we adopted <italic>total reading time</italic> (also called total dwell time, the duration of all fixations on the phrase during the trial including time for rereading the same phrase) and <italic>second pass reading time</italic> (lookback fixation time) which refers to all the returning fixations within the interest area following the initial fixation (<xref ref-type="bibr" rid="ref27">Hy&#x00F6;n&#x00E4; et al., 2003</xref>). We chose those measures based on past literature (<xref ref-type="bibr" rid="ref51">Reichle et al., 1998</xref>; <xref ref-type="bibr" rid="ref52">Roberts and Siyanova-Chanturia, 2013</xref>). These two measures are believed to be sensitive to later processes associated with comprehension of a text, such as information re-analysis, recovery from processing difficulties and integration of information in discourse (<xref ref-type="bibr" rid="ref50">Rayner et al., 1989</xref>; <xref ref-type="bibr" rid="ref46">Paterson et al., 1999</xref>). Research indicates that significant late-measure effects without corresponding significant effects from early-measure indicators imply that the examined effects develop relatively late in the online processing (<xref ref-type="bibr" rid="ref75">Yan et al., 2013</xref>).</p>
<p>To trim probe word reading data, we converted the looks to probes words in every 20-ms bin starting from 180&#x202F;ms after the probe display onset into binary data and sorted them into two consecutive 400-ms time windows to prepare for inferential analysis. To do this, we aligned the eye-tracking data to the onset of the visual display for each set of probe words and counted the fixations on the probe words (looks) in each 20-ms time bin (interest time period). Since the Eyelink 1,000 Plus tracker samples at 1,000&#x202F;Hz, there will be 1,000 samples of fixation on an area of interest if one focuses on the area for 1,000&#x202F;ms. If there were more than ten samples out of 20 ones in a 20-ms time bin, it was coded one, otherwise it was zero. We converted the samples into binary data since for an interest period shorter than 100&#x202F;ms, it is not likely that eyes move from one interest area to another. Fixation data within such a short time bin are likely to be binomially distributed and can be coded one for <italic>fixated</italic> or zero for <italic>not fixated</italic> (<xref ref-type="bibr" rid="ref28">Ito and Knoeferle, 2023</xref>). The data was then sorted into two analysis windows: T1 window (180&#x2013;580&#x202F;ms) and T2 window (580&#x2013;980) following the practice of <xref ref-type="bibr" rid="ref24">Holsinger (2013)</xref>. All probe word reading analyses were conducted on the binary data from the two windows.</p>
<p>We conducted our statistical analysis using R software (<xref ref-type="bibr" rid="ref48">R Core Team, 2023</xref>), employing linear mixed-effects models from the lme4 package for analyzing PV and post-PV NP reading time data. For probe word reading responses&#x2014;binary (fixation/no fixation) outcomes&#x2014;we utilized generalized linear mixed-effects logistic regression models, following the methodology outlined by <xref ref-type="bibr" rid="ref5">Bates et al. (2015)</xref>. Our modeling approach (following <xref ref-type="bibr" rid="ref4">Barr et al., 2013</xref>) included random intercepts for subject and item to account for variability across subjects and items (PV or NP in sentence reading tasks; probe words). The maximal random effects structures incorporated in preliminary models were:</p>
<disp-quote>
<p>For PV or NP analysis: (1&#x202F;+&#x202F;context + log(phraselength)&#x202F;+&#x202F;log(trialorder) | subject)&#x202F;+&#x202F;(1&#x202F;+&#x202F;context &#x002A; log(VST) | PV or NP item).</p>
</disp-quote>
<disp-quote>
<p>For probe word analysis: (1&#x202F;+&#x202F;log(VST)&#x202F;+&#x202F;log(probelength)&#x202F;+&#x202F;log(probefrequency)&#x202F;+&#x202F;log(trialorder) | subject)&#x202F;+&#x202F;(1&#x202F;+&#x202F;context &#x002A; log(VST) | probe word item).</p>
</disp-quote>
<p>By-subject random slopes allow for differences among subjects in terms of their degree of sensitivity to phrase or word properties and treatment contexts; in contrast by-item random slope allows each experimental item to function differently depending on participant proficiency difference, treatment contexts and their interaction.</p>
<p>Linear mixed-effects models thus built analyzed the early and late sentence reading measures for both the PV and post-post noun phrase regions: first fixation duration, first-pass reading time, total reading time and second pass reading time data were examined. Independent variables of interest included context and proficiency indicated in term of VST. Phrase length and trial order were treated as covariates. The categorical variable &#x2018;context&#x2019; was dummy-coded using neutral condition as the reference level. We were interested to look at context contrasts between neutral vs. figurative, neutral vs. literal, figurative vs. literal, and whether VST (proficiency) would interact with context in affecting eye fixation duration (log transformed). Instead of removing data prematurely, we kept all data points. For normality, all continuous variables were log-transformed to reduce skewing (expontentiating will convert the log values back to their original values). We used the <italic>vif.mer</italic> function to inspect multilinearity, <italic>scale</italic> to reduce collinearity and have all continuous predicting factors centered at their means.</p>
<p>Then we stepwise reduced the complexity of the random effects by removing from the maximal random structure the interactions (one at a time), random correlations (one at a time), random slopes (one at time) and/or random correlations until the models converges. Finally the most parsimonious models were selected using backward model selection based on anova () to compare models [see <xref ref-type="bibr" rid="ref38">Ma et al. (2022)</xref>]. Since we kept all data points, the final models were refined through model-based residual analysis for outlier elimination (using <italic>filter</italic> (dataframe, abs (<italic>scale</italic> (resid (final. Model))&#x202F;&#x003C;&#x202F;2.5 which means that any standardized residue with an absolute value greater than 2.5 is considered an outlier) (see <xref ref-type="bibr" rid="ref9004">Wu, 2019</xref> for rationale). For fixed effects and interaction effects we relied on <italic>mixed</italic> in the <italic>afex</italic> package, and <italic>emmeans</italic> (<xref ref-type="bibr" rid="ref9003">Lenth et al., 2018</xref>) for the <italic>post hoc</italic> paired <italic>t</italic>-tests.</p>
<p>In the <italic>glmer</italic> mixed-effects models analyzing looks proportions of probe words, we initially included as fixed effects: visual probe word type (with figurative-unrelated control word as the reference level), context (with neutral condition as the reference level), VST indicating proficiency, and the covariates such as probe word frequency and length, and trial order. The categorical variables (context and probe word type) were dummy-coded. We were interested to look at context contrasts between neutral vs. figurative, neutral vs. literal, figurative vs. literal, and also probe type contrasts between figurative control vs. figurative related, literal control vs. literal related, figurative related vs. literal related, and whether VST (proficiency) interact with context and probe word type in affecting looks to the interest regions.</p>
<p>Since logistic regression is a statistical method to model the linear relationship between the predictor variables and log odds of a binary outcome such fixation and non-fixation (yes/no) events, the coefficient estimate (<italic>&#x03B2;</italic>) represents the change in log odds of the outcome per unit change in a predictor (between one categorical level and a reference level). Consequently, exponentiating these coefficiencts provides odds ratios which are easier to interpret as they translate log odds into probabilities or relative likelihood of fixation. An odds ratio greater than 1 suggests higher likelihood of fixation for one category over another of the predicator. With a log odds ratio of 0.21 for instance, exponentiating gives approximately 1.23, indicating that fixation to one categorical level is about 1.23 times (23% higher) the likelihood of fixating the reference level. Once one is no longer puzzled at the small log odds values of the coefficient estimate (<italic>&#x03B2;</italic>), it is suffice to rely on the log odds and the significant value to judge whether the outcome of fixation (looks) proportion change is significant as per change between a predictor level and its reference level.</p>
<p>We also abided by the <italic>Keep it maximal</italic> principle to build the random effect structure models, then stepwise reduced models until they converged, and selected the most parsimonious models (<xref ref-type="bibr" rid="ref4">Barr et al., 2013</xref>). Results of the final best-fitting models for both sentence and probe reading were reported in the following section (alpha-levels were set at 0.05). Likewise, for normality, all continuous variables were log-transformed to reduce skewing. We used the <italic>vif.mer</italic> function to inspect multilinearity, <italic>scale</italic> to reduce collinearity and have all continuous predicting factors centered at their means. For fixed effects and interaction effects we utilized <italic>mixed</italic> in the <italic>afex</italic> package, and <italic>emmeans</italic> for the <italic>post hoc</italic> paired <italic>t</italic>-tests.</p>
</sec>
</sec>
<sec sec-type="results" id="sec16">
<title>Results</title>
<sec id="sec17">
<title>Results from early and late measures at the sentence-reading stage</title>
<p>The table below provides descriptive statistics for early measures (first fixation duration and first pass reading time), as well as late measures (total reading time and second pass reading time) in the PV region and post-PV region across three context conditions (<xref ref-type="table" rid="tab1">Table 1</xref>).</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Mean phrase-level early and late measures for PVs and post-PV NPs in context.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top" rowspan="2">Interest region</th>
<th align="left" valign="top" rowspan="2">Context</th>
<th align="center" valign="top" colspan="2">Early measures</th>
<th align="center" valign="top" colspan="2">Late measures</th>
</tr>
<tr>
<th align="center" valign="top">First fixation duration</th>
<th align="center" valign="top">First pass reading time</th>
<th align="center" valign="top">Total reading time</th>
<th align="center" valign="top">Second pass reading time</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle" rowspan="3">PV</td>
<td align="left" valign="top">Neutral</td>
<td align="center" valign="top">237.(123.)</td>
<td align="center" valign="top">399.(232.)</td>
<td align="center" valign="top">1,206.(700.)</td>
<td align="center" valign="top">806.(675.)</td>
</tr>
<tr>
<td align="left" valign="top">Figurative</td>
<td align="center" valign="top">234.(92.8)</td>
<td align="center" valign="top">407.(227.)</td>
<td align="center" valign="top">1,029.(639.)&#x002A;&#x002A;&#x002A;</td>
<td align="center" valign="top">622.(604.)&#x002A;&#x002A;&#x002A;</td>
</tr>
<tr>
<td align="left" valign="top">Literal</td>
<td align="center" valign="top">228.(91.6)</td>
<td align="center" valign="top">388.(223.)</td>
<td align="center" valign="top">1,056.(663.)&#x002A;&#x002A;&#x002A;</td>
<td align="center" valign="top">669.(624.)&#x002A;&#x002A;&#x002A;</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">Post-PV<break/>NP</td>
<td align="left" valign="top">Neutral</td>
<td align="center" valign="top">244.(96.4)</td>
<td align="center" valign="top">397.(206.)</td>
<td align="center" valign="top">1,115.(707.)</td>
<td align="center" valign="top">717.(667.)</td>
</tr>
<tr>
<td align="left" valign="top">Figurative</td>
<td align="center" valign="top">238.(94.2)</td>
<td align="center" valign="top">415.(244.)</td>
<td align="center" valign="top">915.(586.)&#x002A;&#x002A;&#x002A;</td>
<td align="center" valign="top">500.(546.)&#x002A;&#x002A;&#x002A;</td>
</tr>
<tr>
<td align="left" valign="top">Literal</td>
<td align="center" valign="top">248.(95.3)</td>
<td align="center" valign="top">413.(221.)</td>
<td align="center" valign="top">1,031.(637.)</td>
<td align="center" valign="top">619.(591.)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Duration measures are reported in milliseconds. Values in parentheses are SDs (standard deviations). Total reading time by definition excludes regressive fixations to preceding words, so second pass reading time&#x202F;=&#x202F;Total reading time - First pass reading time. In case of zero difference between total reading time and first pass reading time, 0 was converted to 1 so as not to affect log-transformation [see <xref ref-type="bibr" rid="ref73">Wolter and Yamashita (2018)</xref>]. Significant differences between neutral baseline and treatment conditions (based on the models reported in <xref ref-type="supplementary-material" rid="SM3">Supplementary material C</xref>) are indicated with the convention of &#x002A;<italic>p</italic>&#x202F;&#x003C;&#x202F;0.05, &#x002A;&#x002A;<italic>p</italic>&#x202F;&#x003C;&#x202F;0.01, &#x002A;&#x002A;&#x002A;<italic>p</italic>&#x202F;&#x003C;&#x202F;0.001.</p>
</table-wrap-foot>
</table-wrap>
<p>In the best fit models<xref ref-type="fn" rid="fn0003"><sup>3</sup></xref> (see <xref ref-type="supplementary-material" rid="SM3">Supplementary material C</xref>), the early measures on first fixation duration and first pass reading time showed no significant context main effects in both the PV region [<italic>&#x03C7;</italic><sup>2</sup> (2)&#x202F;=&#x202F;1.71, <italic>p&#x202F;=</italic> 0.424; &#x03C7;<sup>2</sup> (2)&#x202F;=&#x202F;1.50, <italic>p&#x202F;=</italic> 0.473] and post-PV region [<italic>&#x03C7;</italic><sup>2</sup> (2)&#x202F;=&#x202F;2.71, <italic>p&#x202F;=</italic> 0.258; &#x03C7;<sup>2</sup> (2)&#x202F;=&#x202F;1.42, <italic>p&#x202F;=</italic> 0.490], neither were there main effects of proficiency-indicating logged VST for the PV region [<italic>&#x03C7;</italic><sup>2</sup> (1)&#x202F;=&#x202F;0.77, <italic>p&#x202F;=</italic> 0.381; <italic>&#x03C7;</italic><sup>2</sup> (1)&#x202F;=&#x202F;0.66, <italic>p&#x202F;=</italic> 0.417] and for the post-PV region [&#x03C7;<sup>2</sup> (1)&#x202F;=&#x202F;0.45, <italic>p&#x202F;=</italic> 0.500; &#x03C7;<sup>2</sup> (1)&#x202F;=&#x202F;1.15, <italic>p&#x202F;=</italic> 0.284], or any interaction between the two factors. The late measures of total reading time and second pass reading time (<xref ref-type="fig" rid="fig3">Figure 3</xref>) showed no proficiency main effect in the two regions either [for the PV region: <italic>&#x03C7;</italic><sup>2</sup> (1)&#x202F;=&#x202F;0.66, <italic>p&#x202F;=</italic> 0.417; <italic>&#x03C7;</italic><sup>2</sup> (1)&#x202F;=&#x202F;0.32, <italic>p&#x202F;=</italic> 0.572; for the post-PV region: <italic>&#x03C7;</italic><sup>2</sup> (1)&#x202F;=&#x202F;0.30, <italic>p&#x202F;=</italic> 0.582; <italic>&#x03C7;</italic><sup>2</sup> (1)&#x202F;=&#x202F;0.61, <italic>p&#x202F;=</italic> 0.437]. However, more interestingly, in both regions the two late measures of log transformed fixation durations showed significant context main effect. In the PV region the main context effects for the total reading time and second pass reading time are as shown in the bracket [<italic>&#x03C7;</italic><sup>2</sup> (2)&#x202F;=&#x202F;23.90, <italic>p&#x202F;&#x003C;</italic> 0.001; <italic>&#x03C7;</italic><sup>2</sup> (2)&#x202F;=&#x202F;15.29, <italic>p&#x202F;&#x003C;</italic> 0.001]. Total reading time in the PV region was longer in the neutral context than in both figurative and literal contexts (neutral vs. Figurative: <italic>&#x03B2;&#x202F;=</italic> 0.1645, <italic>t&#x202F;=</italic> 4.83, <italic>p&#x202F;=</italic> 0.0002; neutral vs. Literal: <italic>&#x03B2;&#x202F;=</italic> 0.11, <italic>t&#x202F;=</italic> 3.17, <italic>p&#x202F;=</italic> 0.0002). Second pass reading time in the same region manifested the same pattern [neutral vs. Figurative: <italic>&#x03B2;&#x202F;=</italic> 0.18, <italic>t&#x202F;=</italic> 3.78, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001; neutral vs. Literal: <italic>&#x03B2;&#x202F;=</italic> 0.13, <italic>t&#x202F;=</italic> 2.75, <italic>p&#x202F;=</italic> 0.006]. In the post-PV noun phrase region, the main context effects for total reading time [<italic>&#x03C7;</italic><sup>2</sup> (2)&#x202F;=&#x202F;35.23, <italic>p&#x202F;&#x003C;</italic> 0.001] and second pass reading time [<italic>&#x03C7;</italic><sup>2</sup> (2)&#x202F;=&#x202F;26.69, <italic>p&#x202F;&#x003C;</italic> 0.001] exhibited a different context contrast pattern (<xref ref-type="fig" rid="fig3">Figure 3</xref>). The figurative context resulted in shorter duration than neutral and literal contexts (for total reading time, neutral vs. figurative: <italic>&#x03B2;&#x202F;=</italic> 0.21, <italic>t&#x202F;=</italic> 5.78, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001; figurative vs. literal: <italic>&#x03B2;&#x202F;=</italic>&#x202F;&#x2212;0.15, <italic>t&#x202F;=</italic>&#x202F;&#x2212;4.22, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001; for second pass reading time, neutral vs. figurative: <italic>&#x03B2;&#x202F;=</italic> 0.27, <italic>t&#x202F;=</italic> 5.09, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001; figurative vs. literal: <italic>&#x03B2;&#x202F;=</italic>&#x202F;&#x2212;0.20, <italic>t&#x202F;=</italic>&#x202F;&#x2212;3.64, <italic>p&#x202F;=</italic> 0.0003).</p>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>Late measures of durations (untransformed) for PV and post-PV noun phrase at sentence reading stage: <italic>above left figure</italic> shows total reading time for PV region in contexts; <italic>above right figure</italic> shows second pass reading time for PV region in contexts; <italic>below left figure</italic> shows total reading time for post-PV region in contexts; <italic>below right figure</italic> shows second pass reading time for post-PV region in contexts. In the <italic>above</italic> figures for the PV region, both total reading time and second pass reading measures have higher median lines and greater variability in the neutral context than in the figurative and literal contexts as indicated by the jittered points depicting individual participant averages. In the <italic>below</italic> figures for the post-PV region, both total reading time and second pass reading measures however have lower median lines and less variability in the figurative context than in the neutral and literal contexts. Besides, the red asterisks in the figures represent means values in each context for each measure. Significance levels in means comparison are indicated as follows: <italic>p</italic> &#x003C;&#x202F;0.05&#x002A;, <italic>p</italic> &#x003C;&#x202F;0.01&#x002A;&#x002A;, <italic>p</italic> &#x003C;&#x202F;0.001&#x002A;&#x002A;&#x002A;, with &#x201C;ns&#x201D; denoting non-significant results. Refer to <xref ref-type="supplementary-material" rid="SM4">Supplementary material D</xref> for the 1st quartile, median, 3rd quartile for each of the four measures across contexts, and also relevant means values and standard deviations (SDs) as derived from model-based residual analysis to eliminate outliers.</p>
</caption>
<graphic xlink:href="fpsyg-16-1528821-g003.tif"/>
</fig>
<p>To sum up, early measures did not reveal difference in meaning activation between conditions along the proficiency range but late measures indicate more information reanalysis in neutral context than in literal and figurative contexts for the PV region. In the post-PV noun phrase region, for delayed PV processing, figurative meaning processing required less total reading time and second pass reading time, indicating the need of less information reanalysis in figurative context than in neutral and literal contexts.</p>
</sec>
<sec id="sec18">
<title>Results from further delayed visual word search task</title>
<p>The results below demonstrate further delayed PV processing effects after sentence reading. The looks proportions in neutral, literal, and figurative contexts across two proficiency levels are illustrated in <xref ref-type="fig" rid="fig4">Figure 4</xref>. The activation patterns within an initial 1,000-ms window were similar between intermediate and advanced groups.</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>Probing word looks over a 1,000&#x202F;ms time course in both proficiency groups: The figure displays curves showing proportions of looks to figurative control, figurative related, literal control, and literal related probe words within neutral, figurative, and literal contexts for intermediate and advanced participants.</p>
</caption>
<graphic xlink:href="fpsyg-16-1528821-g004.tif"/>
</fig>
</sec>
<sec id="sec19">
<title>180-580-ms&#x202F;T1 time window analysis</title>
<p>For the T1 window (<xref ref-type="fig" rid="fig5">Figure 5</xref> <italic>above</italic>), the best fit model was Model: looks proportion ~ probe type in focus &#x002A; context + log(VST)&#x202F;+&#x202F;log(order)&#x202F;+&#x202F;log(probe word length)&#x202F;+&#x202F;(1 | subject)&#x202F;+&#x202F;(1 | probe word item). Context and order showed main effects [<italic>&#x03C7;</italic><sup>2</sup> (2)&#x202F;=&#x202F;20.63, <italic>p&#x202F;&#x003C;</italic> 0.001; &#x03C7;<sup>2</sup> (1)&#x202F;=&#x202F;8.82, <italic>p&#x202F;=</italic> 0.003]. There was also interaction between probe word type and context [<italic>&#x03C7;</italic><sup>2</sup> (6)&#x202F;=&#x202F;3018.74, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.001] <italic>Post hoc</italic> pairwise (literal related vs. literal control; figurative related vs. figurative control; literal related vs. figurative related) comparison confirmed that looks to the types of probe words focused varied depending on context.</p>
<fig position="float" id="fig5">
<label>Figure 5</label>
<caption>
<p>Probing word looks proportions across two time windows (180&#x2013;580&#x202F;ms and 580&#x2013;980&#x202F;ms): Significance levels of <italic>post hoc</italic> emmeans comparisons were determined using linear mixed effect models (<italic>p</italic> &#x003C;&#x202F;0.05&#x002A;, <italic>p</italic> &#x003C;&#x202F;0.01&#x002A;&#x002A;, <italic>p</italic> &#x003C;&#x202F;0.001&#x002A;&#x002A;&#x002A;), with &#x201C;ns&#x201D; indicating non-significant results. Refer to <xref ref-type="supplementary-material" rid="SM4">Supplementary material D</xref> for detailed emmeans comparison data.</p>
</caption>
<graphic xlink:href="fpsyg-16-1528821-g005.tif"/>
</fig>
<p>In the neutral context there was significantly more looks to (consideration of) the figurative related probe (&#x03B2;<sub>figurative related vs.literal related</sub> <italic>=</italic> 1.97, <italic>z&#x202F;=</italic> 4.59, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.0001; &#x03B2;<sub>figurative related vs. figurative control</sub> <italic>=</italic> 1.09, <italic>z&#x202F;=</italic> 2.68, <italic>p&#x202F;=</italic> 0.007) and the literal probe was less fixated and considered than its control word (&#x03B2;<sub>literal related vs. literal control</sub> <italic>=&#x202F;&#x2212;</italic>1.00, <italic>z&#x202F;=&#x202F;&#x2212;</italic>2.60, <italic>p&#x202F;=</italic> 0.009).</p>
<p>In the figurative context, proportions of looks to the figurative probe were significantly higher than looks to the semantically unrelated control probes (&#x03B2;<sub>figurative related vs. figurative control</sub> <italic>=</italic> 1.50, <italic>z&#x202F;=</italic> 3.67, <italic>p&#x202F;=</italic> 0.0002); the difference of looks to the literal and literal control probe was also at significance level (&#x03B2;<sub>literal related vs. literal control</sub> <italic>=</italic> 0.80, <italic>z&#x202F;=</italic> 2.06, <italic>p&#x202F;=</italic> 0.040). But looks to the figurative and literal probes were comparable (&#x03B2;<sub>figurative related vs. literal related</sub> <italic>=</italic> 0.40, <italic>z&#x202F;=</italic> 0.93, <italic>p&#x202F;=</italic> 0.353).</p>
<p>In the literal context, the most attention was given to the figurative control probe (&#x03B2;<sub>figurative control vs. figurative related</sub> <italic>=</italic> 0.70, <italic>z&#x202F;=</italic> 1.72, <italic>p&#x202F;=</italic> 0.086). Looks to the literal probe were not much different from the figurative probe and the literal control probe (&#x03B2;<sub>literal related vs. figurative related</sub> <italic>=&#x202F;&#x2212;</italic>0.03, <italic>z&#x202F;=&#x202F;&#x2212;</italic>0.06, <italic>p&#x202F;=</italic> 0.95; &#x03B2;<sub>literal related vs. literal control</sub> <italic>=</italic> 0.43, <italic>z&#x202F;=</italic> 1.11, <italic>p&#x202F;=</italic> 0.269).</p>
</sec>
<sec id="sec20">
<title>580-980-ms&#x202F;T2 time window analysis</title>
<p>For the T2 window (<xref ref-type="fig" rid="fig5">Figure 5</xref> <italic>below</italic>), the best fit model was looks proportion ~ probe type in focus &#x002A; context + log(VST)&#x202F;+&#x202F;log(order)&#x202F;+&#x202F;log(probe word length)&#x202F;+&#x202F;(1 | subject)&#x202F;+&#x202F;(1 | probe word item). There was main effect only with probe word length [<italic>&#x03C7;</italic><sup>2</sup> (1)&#x202F;=&#x202F;9.12, <italic>p&#x202F;=</italic> 0.003]. However there was an interaction between probe word type and context condition [<italic>&#x03C7;</italic><sup>2</sup> (6)&#x202F;=&#x202F;437.55, <italic>p</italic>&#x202F;&#x003C;&#x202F;0.001].</p>
<p>Post hoc comparison revealed that in the neutral context in the T2 window, proportions of looks to the figurative probe numerically remained higher (&#x03B2;<sub>figurative related vs. literal related</sub> <italic>=</italic> 0.15, <italic>z&#x202F;=</italic> 0.78, <italic>p&#x202F;=</italic> 0.436). But the figurative control probe and literal related probe both competed for attention and consideration so that significance-level differences that had existed in the T1 window disappeared (&#x03B2;<sub>figurative related vs. figurative control</sub> <italic>=&#x202F;&#x2212;</italic>0.14, <italic>z&#x202F;=&#x202F;&#x2212;</italic>0.75, <italic>p&#x202F;=</italic> 0.45; &#x03B2;<sub>literal related vs. literal control</sub> <italic>=</italic> 0.12, <italic>z&#x202F;=</italic> 0.65, <italic>p&#x202F;=</italic> 0.516).</p>
<p>In the figurative context, more looks were now given to the control probe (&#x03B2;<sub>figurative control vs. figurative related</sub> <italic>=</italic> 0.35, <italic>z&#x202F;=</italic> 1.91, <italic>p&#x202F;=</italic> 0.056; &#x03B2;<sub>literal control vs. literal related</sub> <italic>=</italic> 0.52, <italic>z&#x202F;=</italic> 2.93, <italic>p&#x202F;=</italic> 0.003) while proportions of looks to the literal probe and figurative probe were both at a low (&#x03B2;<sub>literal related vs. figurative related</sub> <italic>=&#x202F;&#x2212;</italic>0.12, <italic>z&#x202F;=&#x202F;&#x2212;</italic>0.59, <italic>p&#x202F;=</italic> 0.556).</p>
<p>In the literal context, the overall looks pattern remained similar to that in the T1 window, with least consideration of the literal control probe. Looks to the figurative control probe remained the highest but not significantly more than the figurative related probe (&#x03B2;<sub>figurative control vs. figurative related</sub> <italic>=</italic> 0.32, <italic>z&#x202F;=</italic> 1.71, <italic>p&#x202F;=</italic> 0.088) but proportion of looks to the literal related probe increased to a significance level compared to the literal control probe and figurative related probe (&#x03B2;<sub>literal related vs. literal control</sub> <italic>=</italic> 0.36, <italic>z&#x202F;=</italic> 2.03, <italic>p&#x202F;=</italic> 0.043; &#x03B2;<sub>literal related vs. figurative related</sub> <italic>=</italic> 0.51, <italic>z&#x202F;=</italic> 2.60, <italic>p&#x202F;=</italic> 0.010).</p>
</sec>
</sec>
<sec sec-type="discussion" id="sec21">
<title>Discussion</title>
<p>The results do not support a simple &#x2018;yes&#x2019; answer regarding whether figurative or literal meanings are preferentially activated across all contexts, nor does proficiency level necessarily modulate meaning activation patterns for familiar PVs.</p>
<p>Eye movements in sentence reading revealed no difference in early meaning activation across contexts. However, late meaning activation was observed in supporting literal and figurative contexts, along with delayed post-PV figurative meaning activation preference. There was no main effect from proficiency or any interaction effects.</p>
<p>The results from sentence reading indicate that early processes such as familiarity checks, access to orthographical/phonological information, lexical meaning retrieval, and early integration of information demand comparable cognitive effort in both neutral and biased contexts. As measured by first fixation duration and first pass reading time in both PV and post-PV regions, the preference for meaning activation was not discernible at this stage.</p>
<p>The late measure of total reading time for the PV region indicates that contextually biased meanings are more accessible in figurative and literal contexts compared to neutral ones. The other late measure&#x2014;second pass reading time analysis&#x2014;confirms that significantly more cognitive effort is required to perform information reanalysis in unbiased, neutral context than in the biased contexts. Thus learners can access familiar figurative and literal meanings with equal ease as indicated by the late measures, similar to what <xref ref-type="bibr" rid="ref56">Siyanova-Chanturia et al. (2011)</xref> find about idiom processing by native speakers.</p>
<p>Further examination of post-PV spilloff region data shows that delayed information reanalysis may be less demanding in figurative contexts compared to other conditions. Since activation of preferred meaning is more likely to occur in supporting prior contexts, while activation of less expected meanings are likely to be suppressed despite boost from their supporting prior contexts (<xref ref-type="bibr" rid="ref25">Holsinger and Kaiser, 2013</xref>), figurative meaning preference in figurative context together with no literal meaning activation in literal context may mean more salience of the figurative meanings for familiar PVs, though this preference emerges late in the post-PV spilloff region. Moreover, since no significant interaction effect was observed between proficiency and context on meaning activation across all models, this late figurative preference may be consistent across different proficiency groups.</p>
<p>The early measures used in sentence reading did not distinguish meaning activation preference across different contexts. However, since these early measures involve accessing word information and lexical meaning, the observation of no context effect at the early PV processing stage does not preclude the activation of literal or figurative meaning per se. Evidence for early literal or figurative activation was found in other studies (<xref ref-type="bibr" rid="ref24">Holsinger, 2013</xref>; <xref ref-type="bibr" rid="ref31">Kessler et al., 2020</xref>; <xref ref-type="bibr" rid="ref47">Paulmann et al., 2015</xref>). For instance, <xref ref-type="bibr" rid="ref24">Holsinger (2013)</xref> reported early literal activation during L1 idiom processing in a neutral context. Similarly, <xref ref-type="bibr" rid="ref31">Kessler et al.'s (2020)</xref> empirical research confirmed early literal activation for idioms among L1 speakers within a neutral context; however, this effect disappeared shortly after the auditory cue stimulus offset. In contrast, <xref ref-type="bibr" rid="ref47">Paulmann et al. (2015)</xref> found that even non-native English L2 speakers interpret PVs figuratively in neutral contexts like native English speakers, as evidenced by their ERP N400 measures. Future research remains necessary to determine if L2 literal activation is obligatory at an early stage.</p>
<p>In our read-only visual word search task at the further delayed stage, participants did not show explicit advantage or significant preference for literal meaning activation in neutral contexts. Additionally, they displayed no notable preference for activated literal meanings in figuratively biased contexts. However, there was a very late T2-time-window-specific preference for the literal meaning observed in literally biased contexts. These findings only partially support the literal salience hypothesis, which suggests that literal processing is obligatory even 800&#x202F;ms after sentence offset. Instead, our results imply that context plays a crucial role in determining whether literal or figurative activation preference occurs at such further delayed stages of processing. In neutral contexts, participants preferred figurative meanings over literals during T1 time window. For comparison, the figurative context not only boosted figurative activation previously in the post-PV region when reading sentence, but also maintained figurative activation now in the T1 time window; meanwhile competing control words received more attention in T2 window and literal activation in the same context decreased from T1 to T2 time windows. In contrast, even within a literal context, delayed literal meaning activation occurred primarily in T2 window, suggesting that despite literal contextual boosts, literals were activated at the latest time.</p>
<p>Given our read-only visual word search task, which examined activation patterns 500&#x202F;ms after sentence reading ceased, it&#x2019;s plausible that any transient literal activation may have already subsided at this point. This aligns with <xref ref-type="bibr" rid="ref31">Kessler et al.'s (2020)</xref> findings from their contrast of listen-and-look and read-only tasks in neutral contexts. Their experiments revealed no evidence of literal activation in the read-only visual word search task, suggesting that brief literal activation may not persist beyond the sentence reading stage. This finding supports our observation in the neutral context at this deferred stage in visual word search task.</p>
<p>Our results challenge Wang <italic>et al</italic>.&#x2019;s (2016) finding that familiar PVs&#x2019; literal meanings were activated consistently regardless of whether the context was literal or figurative in the visual word search task 500&#x202F;ms after sentence reading. Additionally, only advanced learners in their study exhibited activation for figurative meaning in literally biased contexts. Their interpretation suggested that learners at intermediate and advanced levels primarily relied on literal meanings in online PV processing. Their finding can be attributed to two limitations: their use of inappropriate statistical analysis and misinterpretation of results from their look-only visual word search task for early preference of literal meanings as clarified in the review section.</p>
<p>Wang et al.&#x2019;s methodology involved proportions analysis of reading times for probe words over a longer trial duration (4,000&#x202F;ms), whereas our study focused on shorter time frames within 1,000&#x202F;ms typical for visual word search experiments. To further explore the processes, we also analyzed earlier-stage sentence reading as suggested by Reviewer One. These additional analyses provide complementary insights into early stages of PV meaning activation in our experimental tasks.</p>
<p>Notably, there was no observed proficiency effect for intermediate and advanced learners of English as a foreign language, suggesting that even lower-proficiency participants could activate familiar opaque PV meanings. Learner familiarity with PVs is likely to be more responsible for the facilitated access and retrieval of their figurative meanings. This finding aligns with <xref ref-type="bibr" rid="ref81">Zhou and Zhang's (2011)</xref> research on idiom processing in neutral and figuratively biased contexts with two different levels of learners, which we now extend to PVs. To move one step further, by analyzing learners&#x2019; eye movements in PV and post-PV regions when they read context sentences as well as looks proportions on probe words in visual word search task, we pinpointed when literal and figurative activation may occur in context by both intermediate and advanced learners of English.</p>
<p>Our findings suggest that familiarity plays an important role in driving meaning activation, potentially outweighing proficiency levels among learners of English as a foreign language. When there is controll for the learner&#x2019;s familiarity with both literal and figurative meanings of target PVs, differences in intermediate versus advanced L2 proficiency may not emerge. However, since this study focused solely on familiar PVs, conclusions about proficiency derived from these findings may not necessarily apply to unfamiliar ones.</p>
<p>This observation contrasts with previous studies where proficiency effects were observed: <xref ref-type="bibr" rid="ref40">Matlock and Heredia (2002)</xref>, <xref ref-type="bibr" rid="ref8">Blais and Gonnermn (2013)</xref>, <xref ref-type="bibr" rid="ref47">Paulmann et al. (2015)</xref>, and <xref ref-type="bibr" rid="ref69">Wang et al. (2016)</xref>. The findings from such studies might have been influenced by the unknown status of figurative language among lower-proficiency groups, as those previous studies did not assess learners&#x2019; familiarity with figurative meanings. For instance, in <xref ref-type="bibr" rid="ref40">Matlock and Heredia's (2002)</xref> study on late bilinguals processing PVs literally rather than figuratively potentially due to their lack of awareness about figurative meanings. Similarly, <xref ref-type="bibr" rid="ref8">Blais and Gonnermn (2013)</xref> and <xref ref-type="bibr" rid="ref47">Paulmann et al. (2015)</xref> studies may have relied on higher-proficiency speakers&#x2019; knowledge of PVs&#x2019; figurative meanings, whereas lower-proficiency learners processed PVs literally because they were unfamiliar with the figurative meanings&#x2014;no translation or paraphrasing tasks ensured such knowledge.</p>
<sec id="sec22">
<title>Limitations</title>
<p>Sample size and generalizability: While the sample of 92 valid participants together with the current PV item sample provided sufficient statistical power of 0.8 calculated by G&#x002A;Power, increasing the number of PVs tested could further enhance generalizability.</p>
<p>Focus on familiar PVs: Our investigation was limited to familiar PVs with equivalent familiarity ratings for both literal and figurative meanings. It remains uncertain how unfamiliar PVs are processed in context, as previous studies have preliminarily shown that familiar and unfamiliar idioms are processed differently across proficiency levels in biased contexts (<xref ref-type="bibr" rid="ref22">Giora, 1999</xref>; <xref ref-type="bibr" rid="ref81">Zhou and Zhang, 2011</xref>). Future research should explore the processing of unfamiliar PVs.</p>
<p>Literal activation patterns: Our findings regarding limited literal activation were observed within a specific 1,000-ms time frame&#x2014;500&#x202F;ms after sentence reading&#x2014;and in earlier sentence reading there was no evidence to draw definitive conclusions about whether early literal or figurative activation was stronger in the current design. We would like to suggest a listen-and-look visual word search task to tap into early meaning activation directly for future research. Alternatively the parafoveal processing paradigm, as suggested by Reviewer One, may also provide direct evidence of real-time PV processing (<xref ref-type="bibr" rid="ref49">Rayner, 1975</xref>; <xref ref-type="bibr" rid="ref53">Schotter et al., 2015</xref>).</p>
<p>To advance our understanding of PV processing in L2 learners, we recommend the following: (1) increasing the sample size of experimental items; (2) investigating both familiar and unfamiliar PVs; and (3) observing patterns of meaning activation at different time points in the above-suggested paradigms.</p>
</sec>
</sec>
<sec sec-type="conclusions" id="sec23">
<title>Conclusion</title>
<p>Though <xref ref-type="bibr" rid="ref12">Cieslicka (2011)</xref> literal salience resonant hypothesis cannot be rejected based on current evidence with PVs, there is good evidence against claiming an obligatory preference for literal meanings regardless of context. Early measures from our study did not support either early literal or figurative meaning activation preference, suggesting that preference for literal versus figurative meanings may not emerge until later stages of processing. Late measures on the PV region indicate that both familiar literal and figurative meaning PVs enjoy similar ease of handling across contexts and late measures on the post-PV noun phrase region suggest that there is delay before figurative activation preference develops. In the visual word search task, no stable reliance on literal meaning was evident over time windows or contexts, further supporting the nuanced nature of PV processing beyond mere preference for literal meanings alone.</p>
<p>The findings also suggest that <xref ref-type="bibr" rid="ref23">Giora (2002)</xref> graded salience hypothesis does not fully apply to this type of PVs with similar familiarity ratings for their literal and figurative meanings. Figurative activation is context-specific and time-sensitive, even among familiar PVs.</p>
<p>Last but not least, the findings underscore the importance of controlling for PV familiarity when investigating L2 learners&#x2019; comprehension across different proficiency levels. To further clarify early literal activation preference and proficiency effect in L2 learners&#x2019; PV processing mechanisms, additional research into both familiar and unfamiliar PVs in one framework among L2 learners across a broader range of proficiency using even more sensitive research paradigms would be beneficial.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec24">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref rid="sec31" ref-type="sec">Supplementary material</xref>, further inquiries can be directed to the first author (<email>yujianyao@scnu.edu.cn</email>) or corresponding author (<email>blacrose@163.com</email>; <email>blacrosezhang@suda.edu.cn</email>).</p>
</sec>
<sec sec-type="ethics-statement" id="sec25">
<title>Ethics statement</title>
<p>The studies involving humans were approved by the Academic Ethics Committee of School of Foreign Studies, South China Normal University. The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study.</p>
</sec>
<sec sec-type="author-contributions" id="sec26">
<title>Author contributions</title>
<p>JY: Conceptualization, Data curation, Formal analysis, Methodology, Project administration, Validation, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. SW: Data curation, Investigation, Software, Writing &#x2013; original draft. PZ: Formal analysis, Funding acquisition, Project administration, Resources, Supervision, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. TC: Data curation, Investigation, Software, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec sec-type="funding-information" id="sec27">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This work was supported by the National Social Science Fund of China (grant no.23BYY178) and the Major Program Fund of Jiangsu Education Department [Grant NO. 2022SJZD126].</p>
</sec>
<ack>
<p>We owe special thanks to the anonymous reviewers for their constructive suggestions, to Dr. LI, Nan for generously sharing R codes, and to Dr. WANG, Yongqing for careful proofreading.</p>
</ack>
<sec sec-type="COI-statement" id="sec28">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec29">
<title>Generative AI statement</title>
<p>The authors declare that no Gen AI was used in the creation of this manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="sec30">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="sec31">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/fpsyg.2025.1528821/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/fpsyg.2025.1528821/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Supplementary_file_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Supplementary_file_2.doc" id="SM2" mimetype="application/vnd.ms-word" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Supplementary_file_3.docx" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Supplementary_file_4.docx" id="SM4" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<fn-group>
<fn id="fn0001"><p><sup>1</sup>Launching eye movement usually takes about 180&#x202F;ms, and therefore the first 180-ms sampling data cannot be considered as valid data (<xref ref-type="bibr" rid="ref39">Matin et al., 1993</xref>; <xref ref-type="bibr" rid="ref2">Altmann and Kamide, 1999</xref>).</p></fn>
<fn id="fn0002"><p><sup>2</sup>TEM 4 and 8 are national proficiency tests for English Majors in China, and international proficiency level alignment research from China Ministry of Education shows that students who pass the tests are at intermediate and advanced English levels (<xref ref-type="bibr" rid="ref36">Liu and Yang, 2021</xref>).</p></fn>
<fn id="fn0003"><p><sup>3</sup>The most parsimonious best-fitting models retained by-subject and by-item random intercepts for all outcomes except the first fixation duration model in the PV region. Due to issues related to near-zero variance associated with including a term for PV item-level random effect, its final model (Model: log(first fixation duration)&#x202F;~&#x202F;1&#x202F;+&#x202F;Context + log(PV length)&#x202F;+&#x202F;log(order)&#x202F;+&#x202F;log(VST)&#x202F;+&#x202F;(1 | subject)) only includes by-subject intercept.</p></fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="ref1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Allopenna</surname> <given-names>P. D.</given-names></name> <name><surname>Magnuson</surname> <given-names>J. S.</given-names></name> <name><surname>Tanenhaus</surname> <given-names>M. K.</given-names></name></person-group> (<year>1998</year>). <article-title>Tracking the time course of spoken word recognition using eye movements: evidence for continuous mapping models</article-title>. <source>J. Mem. Lang.</source> <volume>38</volume>, <fpage>419</fpage>&#x2013;<lpage>439</lpage>. doi: <pub-id pub-id-type="doi">10.1006/jmla.1997.2558</pub-id></citation></ref>
<ref id="ref2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Altmann</surname> <given-names>G. T. M.</given-names></name> <name><surname>Kamide</surname> <given-names>Y.</given-names></name></person-group> (<year>1999</year>). <article-title>Incremental interpretation at verbs: restricting the domain of subsequent reference</article-title>. <source>Cognition</source> <volume>73</volume>, <fpage>247</fpage>&#x2013;<lpage>264</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0010-0277(99)00059-1</pub-id>, PMID: <pub-id pub-id-type="pmid">10585516</pub-id></citation></ref>
<ref id="ref3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Arnon</surname> <given-names>I.</given-names></name> <name><surname>Snider</surname> <given-names>N.</given-names></name></person-group> (<year>2010</year>). <article-title>More than words: frequency effects for multi-word phrases</article-title>. <source>J. Mem. Lang.</source> <volume>62</volume>, <fpage>67</fpage>&#x2013;<lpage>82</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jml.2009.09.005</pub-id></citation></ref>
<ref id="ref4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Barr</surname> <given-names>D. J.</given-names></name> <name><surname>Levy</surname> <given-names>R.</given-names></name> <name><surname>Scheepers</surname> <given-names>C.</given-names></name> <name><surname>Tily</surname> <given-names>H. J.</given-names></name></person-group> (<year>2013</year>). <article-title>Random effects structure for confirmatory hypothesis testing: keep it maximal</article-title>. <source>J. Mem. Lang.</source> <volume>68</volume>, <fpage>255</fpage>&#x2013;<lpage>278</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jml.2012.11.001</pub-id>, PMID: <pub-id pub-id-type="pmid">24403724</pub-id></citation></ref>
<ref id="ref5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bates</surname> <given-names>D.</given-names></name> <name><surname>M&#x00E4;chler</surname> <given-names>M.</given-names></name> <name><surname>Bolker</surname> <given-names>B.</given-names></name> <name><surname>Walker</surname> <given-names>S.</given-names></name></person-group> (<year>2015</year>). <article-title>Fitting linear mixed-effects models using lme4</article-title>. <source>J. Stat. Softw.</source> <volume>67</volume>, <fpage>1</fpage>&#x2013;<lpage>48</lpage>. doi: <pub-id pub-id-type="doi">10.18637/jss.v067.i01</pub-id></citation></ref>
<ref id="ref6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Beck</surname> <given-names>S. D.</given-names></name> <name><surname>Weber</surname> <given-names>A.</given-names></name></person-group> (<year>2016</year>). <article-title>Bilingual and monolingual idiom processing is cut from the same cloth: the role of the L1 in literal and figurative meaning activation</article-title>. <source>Front. Psychol.</source> <volume>7</volume>:<fpage>1350</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpsyg.2016.01350</pub-id>, PMID: <pub-id pub-id-type="pmid">27667979</pub-id></citation></ref>
<ref id="ref7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Beck</surname> <given-names>S. D.</given-names></name> <name><surname>Weber</surname> <given-names>A.</given-names></name></person-group> (<year>2020</year>). <article-title>Context and literality in idiom processing: evidence from self-paced reading</article-title>. <source>J. Psycholinguist. Res.</source> <volume>49</volume>, <fpage>837</fpage>&#x2013;<lpage>863</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s10936-020-09719-2</pub-id>, PMID: <pub-id pub-id-type="pmid">32666211</pub-id></citation></ref>
<ref id="ref8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Blais</surname> <given-names>M.-J.</given-names></name> <name><surname>Gonnermn</surname> <given-names>L.</given-names></name></person-group> (<year>2013</year>). <article-title>Explicit and implicit semantic processing of verb&#x2013;particle constructions by French&#x2013;English bilinguals</article-title>. <source>Biling. Lang. Congn.</source> <volume>16</volume>, <fpage>829</fpage>&#x2013;<lpage>846</lpage>. doi: <pub-id pub-id-type="doi">10.1017/S1366728912000673</pub-id></citation></ref>
<ref id="ref9001"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cappelle</surname> <given-names>B.</given-names></name> <name><surname>Shtyrov</surname> <given-names>Y.</given-names></name> <name><surname>Pulverm&#x00FC;ller</surname> <given-names>F.</given-names></name></person-group> (<year>2010</year>). <article-title>Heating up or cooling up the brain? MEG evidence that phrasal verbs are lexical units</article-title>. <source>Brain Lang.</source> <volume>115</volume>, <fpage>189</fpage>&#x2013;<lpage>201</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.bandl.2010.09.004</pub-id></citation></ref>
<ref id="ref9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carrol</surname> <given-names>G.</given-names></name> <name><surname>Conklin</surname> <given-names>K.</given-names></name></person-group> (<year>2020</year>). <article-title>Is all formulaic language created equal? Unpacking the processing advantage for different types of formulaic sequences</article-title>. <source>Lang. Speech</source> <volume>63</volume>, <fpage>95</fpage>&#x2013;<lpage>122</lpage>. doi: <pub-id pub-id-type="doi">10.1177/0023830918823230</pub-id>, PMID: <pub-id pub-id-type="pmid">30693821</pub-id></citation></ref>
<ref id="ref10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carrol</surname> <given-names>G.</given-names></name> <name><surname>Littlemore</surname> <given-names>J.</given-names></name></person-group> (<year>2020</year>). <article-title>Resolving figurative expressions during reading: the role of familiarity, transparency, and context</article-title>. <source>Discourse Process.</source> <volume>57</volume>, <fpage>609</fpage>&#x2013;<lpage>626</lpage>. doi: <pub-id pub-id-type="doi">10.1080/0163853X.2020.1729041</pub-id></citation></ref>
<ref id="ref11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cie&#x015B;licka</surname> <given-names>A.</given-names></name></person-group> (<year>2006</year>). <article-title>Literal salience in on-line processing of idiomatic expressions by second language learners</article-title>. <source>Second. Lang. Res.</source> <volume>22</volume>, <fpage>115</fpage>&#x2013;<lpage>144</lpage>. doi: <pub-id pub-id-type="doi">10.1191/0267658306sr263oa</pub-id></citation></ref>
<ref id="ref12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cieslicka</surname> <given-names>A.</given-names></name></person-group> (<year>2011</year>). <article-title>Suppression of literal meanings in L2 idiom processing: does context help?</article-title> <source>Studies Second Language Learning Teach.</source> <volume>1</volume>, <fpage>13</fpage>&#x2013;<lpage>36</lpage>. doi: <pub-id pub-id-type="doi">10.14746/ssllt.2011.1.1.2</pub-id></citation></ref>
<ref id="ref13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cieslicka</surname> <given-names>A.</given-names></name> <name><surname>Heredia</surname> <given-names>R.</given-names></name></person-group> (<year>2011</year>). <article-title>Hemispheric asymmetries in processing L1 and L2 idioms: effects of salience and context</article-title>. <source>Brain Lang.</source> <volume>116</volume>, <fpage>136</fpage>&#x2013;<lpage>150</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.bandl.2010.09.007</pub-id>, PMID: <pub-id pub-id-type="pmid">20947154</pub-id></citation></ref>
<ref id="ref14"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Cieslicka</surname> <given-names>A.</given-names></name> <name><surname>Heredia</surname> <given-names>R.</given-names></name></person-group> (<year>2019</year>). &#x201C;<article-title>ERP correlates of figurative language processing</article-title>&#x201D; in <source>Approaches to the study of sound structure and speech</source>. eds. <person-group person-group-type="editor"><name><surname>Wrembel</surname> <given-names>M.</given-names></name> <name><surname>Kie&#x0142;kiewicz-Janowiak</surname> <given-names>A.</given-names></name> <name><surname>G&#x0105;siorowski</surname> <given-names>P.</given-names></name></person-group> (<publisher-loc>New York</publisher-loc>: <publisher-name>Routledge</publisher-name>), <fpage>244</fpage>&#x2013;<lpage>257</lpage>.</citation></ref>
<ref id="ref15"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Cieslicka</surname> <given-names>A.</given-names></name> <name><surname>Heredia</surname> <given-names>R.</given-names></name> <name><surname>Olivares</surname> <given-names>M.</given-names></name></person-group> (<year>2014</year>). &#x201C;<article-title>It&#x2019;s all in the eyes: how language dominance, salience, and context affect eye movements during idiomatic language processing</article-title>&#x201D; in <source>Essential topics in applied linguistics and multilingualism</source>. eds. <person-group person-group-type="editor"><name><surname>Pawlak</surname> <given-names>M.</given-names></name> <name><surname>Aronin</surname> <given-names>L.</given-names></name></person-group> (<publisher-loc>Switzerland</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>21</fpage>&#x2013;<lpage>41</lpage>.</citation></ref>
<ref id="ref18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dagut</surname> <given-names>M.</given-names></name> <name><surname>Laufer</surname> <given-names>B.</given-names></name></person-group> (<year>1985</year>). <article-title>Avoidance of phrasal verbs: a case for contrastive analyses</article-title>. <source>Stud. Second. Lang. Acquis.</source> <volume>7</volume>, <fpage>73</fpage>&#x2013;<lpage>79</lpage>. doi: <pub-id pub-id-type="doi">10.1017/S0272263100005167</pub-id></citation></ref>
<ref id="ref19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Darwin</surname> <given-names>C. M.</given-names></name> <name><surname>Gray</surname> <given-names>L. S.</given-names></name></person-group> (<year>1999</year>). <article-title>Going after the phrasal verbs: an alternative approach to classification</article-title>. <source>TESOL Q.</source> <volume>33</volume>, <fpage>65</fpage>&#x2013;<lpage>83</lpage>. doi: <pub-id pub-id-type="doi">10.2307/3588191</pub-id></citation></ref>
<ref id="ref20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dixon</surname> <given-names>R. M. W.</given-names></name></person-group> (<year>1982</year>). <article-title>The grammar of English phrasal verbs</article-title>. <source>Austr. J Linguistics</source> <volume>2</volume>, <fpage>1</fpage>&#x2013;<lpage>42</lpage>. doi: <pub-id pub-id-type="doi">10.1080/07268608208599280</pub-id></citation></ref>
<ref id="ref9002"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gardner</surname> <given-names>D.</given-names></name> <name><surname>Davies</surname> <given-names>M.</given-names></name></person-group> (<year>2007</year>). <article-title>Pointing out frequent phrasal verbs: A corpus-based analysis</article-title>. <source>TESOL Q.</source> <volume>41</volume>, <fpage>339</fpage>&#x2013;<lpage>359</lpage>. doi: <pub-id pub-id-type="doi">10.1002/j.1545-7249.2007.tb00062.x</pub-id></citation></ref>
<ref id="ref21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Giora</surname> <given-names>R.</given-names></name></person-group> (<year>1997</year>). <article-title>Understanding figurative and literal language: the graded salience hypothesis</article-title>. <source>Cognitive Linguistics</source> <volume>8</volume>, <fpage>183</fpage>&#x2013;<lpage>206</lpage>. doi: <pub-id pub-id-type="doi">10.1515/cogl.1997.8.3.183</pub-id></citation></ref>
<ref id="ref22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Giora</surname> <given-names>R.</given-names></name></person-group> (<year>1999</year>). <article-title>On the priority of salient meanings: studies of literal and figurative language</article-title>. <source>J. Pragmat.</source> <volume>31</volume>, <fpage>919</fpage>&#x2013;<lpage>929</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0378-2166(98)00100-3</pub-id></citation></ref>
<ref id="ref23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Giora</surname> <given-names>R.</given-names></name></person-group> (<year>2002</year>). <article-title>Literal vs. figurative meaning: different or equal?</article-title> <source>J. Pragmat.</source> <volume>34</volume>, <fpage>487</fpage>&#x2013;<lpage>506</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0378-2166(01)00045-5</pub-id></citation></ref>
<ref id="ref24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Holsinger</surname> <given-names>E.</given-names></name></person-group> (<year>2013</year>). <article-title>Representing idioms: syntactic and contextual effects on idiom processing</article-title>. <source>Lang. Speech</source> <volume>56</volume>, <fpage>373</fpage>&#x2013;<lpage>394</lpage>. doi: <pub-id pub-id-type="doi">10.1177/0023830913484899</pub-id>, PMID: <pub-id pub-id-type="pmid">24416962</pub-id></citation></ref>
<ref id="ref25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Holsinger</surname> <given-names>E.</given-names></name> <name><surname>Kaiser</surname> <given-names>E.</given-names></name></person-group> (<year>2013</year>). <article-title>Processing (non)compositional expressions: mistakes and recovery</article-title>. <source>J. Exp. Psychol. Learn. Mem. Cogn.</source> <volume>39</volume>, <fpage>866</fpage>&#x2013;<lpage>878</lpage>. doi: <pub-id pub-id-type="doi">10.1037/a0030410</pub-id>, PMID: <pub-id pub-id-type="pmid">23088547</pub-id></citation></ref>
<ref id="ref27"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Hy&#x00F6;n&#x00E4;</surname> <given-names>J.</given-names></name> <name><surname>Lorch</surname> <given-names>R. F.</given-names><suffix>Jr.</suffix></name> <name><surname>Rinck</surname> <given-names>M.</given-names></name></person-group> (<year>2003</year>). &#x201C;<article-title>Eye movement measures to study global text processing</article-title>&#x201D; in <source>The mind's eye: Cognitive and applied aspects of eye movement research</source>. eds. <person-group person-group-type="editor"><name><surname>Hy&#x00F6;n&#x00E4;</surname> <given-names>J.</given-names></name> <name><surname>Radach</surname> <given-names>R.</given-names></name> <name><surname>Deubel</surname> <given-names>H.</given-names></name></person-group> (<publisher-loc>Oxford, UK</publisher-loc>: <publisher-name>Elsevier</publisher-name>), <fpage>159</fpage>&#x2013;<lpage>176</lpage>.</citation></ref>
<ref id="ref28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ito</surname> <given-names>A.</given-names></name> <name><surname>Knoeferle</surname> <given-names>P.</given-names></name></person-group> (<year>2023</year>). <article-title>Analysing data from the psycholinguistic visual world paradigm: comparison of different analysis methods</article-title>. <source>Behav. Res. Methods</source> <volume>55</volume>, <fpage>3461</fpage>&#x2013;<lpage>3493</lpage>. doi: <pub-id pub-id-type="doi">10.3758/s13428-022-01969-3</pub-id>, PMID: <pub-id pub-id-type="pmid">36396835</pub-id></citation></ref>
<ref id="ref29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jiang</surname> <given-names>S.</given-names></name> <name><surname>Siyanova-Chanturia</surname> <given-names>A.</given-names></name></person-group> (<year>2023</year>). <article-title>The processing of multiword expressions in L1 andL2 Chinese: evidence from reaction times and eye movements</article-title>. <source>Mod. Lang. J.</source> <volume>107</volume>, <fpage>565</fpage>&#x2013;<lpage>605</lpage>. doi: <pub-id pub-id-type="doi">10.1111/modl.12846</pub-id></citation></ref>
<ref id="ref30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jolsvai</surname> <given-names>H.</given-names></name> <name><surname>McCauley</surname> <given-names>S. M.</given-names></name> <name><surname>Christiansen</surname> <given-names>M. H.</given-names></name></person-group> (<year>2020</year>). <article-title>Meaningfulness beats frequency in multiword chunk processing</article-title>. <source>Cogn. Sci.</source> <volume>44</volume>:<fpage>e12885</fpage>. doi: <pub-id pub-id-type="doi">10.1111/cogs.12885</pub-id>, PMID: <pub-id pub-id-type="pmid">32996628</pub-id></citation></ref>
<ref id="ref31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kessler</surname> <given-names>R.</given-names></name> <name><surname>Weber</surname> <given-names>A.</given-names></name> <name><surname>Friedrich</surname> <given-names>C. K.</given-names></name></person-group> (<year>2020</year>). <article-title>Activation of literal word meanings in idioms: evidence from eye-tracking and ERP experiments</article-title>. <source>Lang. Speech</source> <volume>64</volume>, <fpage>594</fpage>&#x2013;<lpage>624</lpage>. doi: <pub-id pub-id-type="doi">10.1177/0023830920943625</pub-id>, PMID: <pub-id pub-id-type="pmid">32715872</pub-id></citation></ref>
<ref id="ref32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>C.</given-names></name></person-group> (<year>2016</year>). <article-title>L2 learners&#x2019; recognition of unfamiliar idioms composed of familiar words</article-title>. <source>Lang. Aware.</source> <volume>25</volume>, <fpage>89</fpage>&#x2013;<lpage>109</lpage>. doi: <pub-id pub-id-type="doi">10.1080/09658416.2015.1122025</pub-id></citation></ref>
<ref id="ref9003"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lenth</surname> <given-names>R.</given-names></name> <name><surname>Singmann</surname> <given-names>H.</given-names></name> <name><surname>Love</surname> <given-names>J.</given-names></name> <name><surname>Buerkner</surname> <given-names>P.</given-names></name> <name><surname>Herve</surname> <given-names>M</given-names></name></person-group>. (<year>2018</year>). <article-title>Package &#x201C;Emmeans&#x201D;</article-title>. <source>R Package Version 4.0-3</source>. Available at: <ext-link xlink:href="http://cran.r-project.org/package=emmeans" ext-link-type="uri">http://cran.r-project.org/package=emmeans</ext-link></citation></ref>
<ref id="ref34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liao</surname> <given-names>Y.</given-names></name> <name><surname>Fukuya</surname> <given-names>Y. J.</given-names></name></person-group> (<year>2004</year>). <article-title>Avoidance of phrasal verbs: the case of Chinese learners of English</article-title>. <source>Lang. Learn.</source> <volume>54</volume>, <fpage>193</fpage>&#x2013;<lpage>226</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1467-9922.2004.00254.x</pub-id></citation></ref>
<ref id="ref35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Libben</surname> <given-names>M. R.</given-names></name> <name><surname>Titone</surname> <given-names>D. A.</given-names></name></person-group> (<year>2008</year>). <article-title>The multidetermined nature of idiom processing</article-title>. <source>Mem. Cogn.</source> <volume>36</volume>, <fpage>1103</fpage>&#x2013;<lpage>1121</lpage>. doi: <pub-id pub-id-type="doi">10.3758/mc.36.6.1103</pub-id></citation></ref>
<ref id="ref36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>J.</given-names></name> <name><surname>Yang</surname> <given-names>M.</given-names></name></person-group> (<year>2021</year>). <article-title>Applying China&#x2019;s standards of English language ability in language testing and assessment</article-title>. <source>Foreign Language Testing Teaching</source> <volume>2</volume>, <fpage>1</fpage>&#x2013;<lpage>11</lpage>.</citation></ref>
<ref id="ref39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Matin</surname> <given-names>E.</given-names></name> <name><surname>Shao</surname> <given-names>K. C.</given-names></name> <name><surname>Boff</surname> <given-names>K. R.</given-names></name></person-group> (<year>1993</year>). <article-title>Saccadic overhead: information-processing time with and without saccades</article-title>. <source>Percept. Psychophys.</source> <volume>53</volume>, <fpage>372</fpage>&#x2013;<lpage>380</lpage>. doi: <pub-id pub-id-type="doi">10.3758/BF03206780</pub-id>, PMID: <pub-id pub-id-type="pmid">8483701</pub-id></citation></ref>
<ref id="ref40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Matlock</surname> <given-names>T.</given-names></name> <name><surname>Heredia</surname> <given-names>R. R.</given-names></name></person-group> (<year>2002</year>). <article-title>Understanding phrasal verbs in monolinguals and bilinguals</article-title>. <source>Adv. Psychol.</source> <volume>134</volume>, <fpage>251</fpage>&#x2013;<lpage>274</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0166-4115(02)80014-0</pub-id></citation></ref>
<ref id="ref38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ma</surname> <given-names>Z.</given-names></name> <name><surname>Jia</surname> <given-names>J.-X.</given-names></name> <name><surname>Wu</surname> <given-names>S.-Y.</given-names></name></person-group> (<year>2022</year>). <article-title>On the analysis of reaction time data through the use of mixed-effects models: principles and practices</article-title>. <source>Foreign Language Learning Theory Practice.</source> <volume>1</volume>, <fpage>35</fpage>&#x2013;<lpage>46</lpage>.</citation></ref>
<ref id="ref41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>McQueen</surname> <given-names>J. M.</given-names></name> <name><surname>Viebahn</surname> <given-names>M. C.</given-names></name></person-group> (<year>2007</year>). <article-title>Tracking recognition of spoken words by tracking looks to printed words</article-title>. <source>Q. J. Exp. Psychol.</source> <volume>60</volume>, <fpage>661</fpage>&#x2013;<lpage>671</lpage>. doi: <pub-id pub-id-type="doi">10.1080/17470210601183890</pub-id>, PMID: <pub-id pub-id-type="pmid">17455074</pub-id></citation></ref>
<ref id="ref42"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Milton</surname> <given-names>J.</given-names></name></person-group> (<year>2010</year>). &#x201C;<article-title>The development of vocabulary breadth across the CEFR levels: a common basis for the elaboration of language syllabuses, curriculum guidelines, examinations, and textbooks across Europe</article-title>,&#x201D; in <source>Communicative proficiency and linguistic development: Intersections between SLA and language testing research</source>. eds. <person-group person-group-type="editor"><name><surname>Bartning</surname> <given-names>I.</given-names></name> <name><surname>Martin</surname> <given-names>M.</given-names></name> <name><surname>Vedder</surname> <given-names>I.</given-names></name></person-group> (<publisher-loc>Eurosla Monograph Series I. Rome</publisher-loc>: <publisher-name>Eurosla</publisher-name>), <fpage>211</fpage>&#x2013;<lpage>232</lpage>.</citation></ref>
<ref id="ref43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Morid</surname> <given-names>M.</given-names></name> <name><surname>Bachar</surname> <given-names>N.</given-names></name> <name><surname>Sabourin</surname> <given-names>L.</given-names></name></person-group> (<year>2021</year>). <article-title>Capturing the multi-determined nature of idiom processing using ERPs</article-title>. <source>Can. J. Exp. Psychol.</source> <volume>75</volume>, <fpage>155</fpage>&#x2013;<lpage>161</lpage>. doi: <pub-id pub-id-type="doi">10.1037/cep0000252</pub-id>, PMID: <pub-id pub-id-type="pmid">34043370</pub-id></citation></ref>
<ref id="ref44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nation</surname> <given-names>P.</given-names></name> <name><surname>Beglar</surname> <given-names>D.</given-names></name></person-group> (<year>2007</year>). <article-title>A vocabulary size test</article-title>. <source>Lang. Teach.</source> <volume>31</volume>, <fpage>9</fpage>&#x2013;<lpage>13</lpage>.</citation></ref>
<ref id="ref45"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Palmer</surname> <given-names>F. R.</given-names></name></person-group> (<year>1974</year>). <source>The English verb</source>. <edition>2nd</edition> Edn. <publisher-loc>London</publisher-loc>: <publisher-name>Longman Group Ltd.</publisher-name></citation></ref>
<ref id="ref46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Paterson</surname> <given-names>K.</given-names></name> <name><surname>Liversedge</surname> <given-names>S.</given-names></name> <name><surname>Underwood</surname> <given-names>G.</given-names></name></person-group> (<year>1999</year>). <article-title>The influence of focus operators on syntactic processing of short relative clause sentences</article-title>. <source>Q. J. Exp. Psychol.</source> <volume>52</volume>, <fpage>717</fpage>&#x2013;<lpage>737</lpage>. doi: <pub-id pub-id-type="doi">10.1080/027249899391025</pub-id></citation></ref>
<ref id="ref47"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Paulmann</surname> <given-names>S.</given-names></name> <name><surname>Ghareeb-Ali</surname> <given-names>Z.</given-names></name> <name><surname>Felser</surname> <given-names>C.</given-names></name></person-group> (<year>2015</year>). &#x201C;<article-title>Neurophysiological markers of phrasal verb processing: evidence from L1 and L2 speakers</article-title>&#x201D; in <source>Bilingual figurative language processing</source>. eds. <person-group person-group-type="editor"><name><surname>Heredia</surname> <given-names>R. R.</given-names></name> <name><surname>Cie&#x015B;licka</surname> <given-names>A. B.</given-names></name></person-group> (<publisher-loc>Cambridge</publisher-loc>: <publisher-name>Cambridge University Press</publisher-name>), <fpage>245</fpage>&#x2013;<lpage>267</lpage>.</citation></ref>
<ref id="ref0050"><citation citation-type="other"><person-group person-group-type="author"><collab id="coll201">Pearson Education</collab></person-group>. (<year>2000</year>). <source>Longman phrasal verbs dictionary (2nd edition)</source>. <publisher-loc>New York</publisher-loc>: <publisher-name>Longman</publisher-name>.</citation></ref>
<ref id="ref48"><citation citation-type="other"><person-group person-group-type="author"><collab id="coll2">R Core Team</collab></person-group>. (<year>2023</year>). <source>R: a language and environment for statistical computing</source>. Available online at: <ext-link xlink:href="https://www.r-project.org/" ext-link-type="uri">https://www.r-project.org/</ext-link> (Accessed August 7, 2023).</citation></ref>
<ref id="ref49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rayner</surname> <given-names>K.</given-names></name></person-group> (<year>1975</year>). <article-title>The perceptual span and peripheral cues in reading</article-title>. <source>Cogn. Psychol.</source> <volume>7</volume>, <fpage>65</fpage>&#x2013;<lpage>81</lpage>. doi: <pub-id pub-id-type="doi">10.1016/0010-0285(75)90005-5</pub-id></citation></ref>
<ref id="ref50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rayner</surname> <given-names>K.</given-names></name> <name><surname>Sereno</surname> <given-names>S. C.</given-names></name> <name><surname>Morris</surname> <given-names>R. K.</given-names></name> <name><surname>Schmauder</surname> <given-names>A. R.</given-names></name> <name><surname>Clifton</surname> <given-names>C.</given-names></name></person-group> (<year>1989</year>). <article-title>Eye movements and online comprehension processes</article-title>. <source>Lang. Cognitive Processes</source> <volume>4</volume>, <fpage>SI21</fpage>&#x2013;<lpage>SI49</lpage>. doi: <pub-id pub-id-type="doi">10.1080/01690968908406362</pub-id>, PMID: <pub-id pub-id-type="pmid">40101104</pub-id></citation></ref>
<ref id="ref51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Reichle</surname> <given-names>E. D.</given-names></name> <name><surname>Pollatsek</surname> <given-names>A.</given-names></name> <name><surname>Fisher</surname> <given-names>D. L.</given-names></name> <name><surname>Rayner</surname> <given-names>K.</given-names></name></person-group> (<year>1998</year>). <article-title>Toward a model of eye movement control in reading</article-title>. <source>Psychol. Rev.</source> <volume>105</volume>, <fpage>125</fpage>&#x2013;<lpage>157</lpage>. doi: <pub-id pub-id-type="doi">10.1037/0033-295x.105.1.125</pub-id>, PMID: <pub-id pub-id-type="pmid">9450374</pub-id></citation></ref>
<ref id="ref9005"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Richards</surname> <given-names>J. C.</given-names></name> <name><surname>Schmidt</surname> <given-names>R. W</given-names></name></person-group>. (<year>2011</year>). <source>Longman dictionary of language teaching and applied linguistics (4th ed.)</source>. <publisher-name>Routledge</publisher-name>. Available at: <ext-link xlink:href="https://doi.org/10.4324/9781315833835" ext-link-type="uri">https://doi.org/10.4324/9781315833835</ext-link></citation></ref>
<ref id="ref52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Roberts</surname> <given-names>L.</given-names></name> <name><surname>Siyanova-Chanturia</surname> <given-names>A.</given-names></name></person-group> (<year>2013</year>). <article-title>Using eye-tracking to investigate topics in L2 acquisition and L2 sentence and discourse processing</article-title>. <source>Stud. Second. Lang. Acquis.</source> <volume>35</volume>, <fpage>213</fpage>&#x2013;<lpage>235</lpage>. doi: <pub-id pub-id-type="doi">10.1017/S0272263112000861</pub-id></citation></ref>
<ref id="ref53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schotter</surname> <given-names>E. R.</given-names></name> <name><surname>Lee</surname> <given-names>M.</given-names></name> <name><surname>Reiderman</surname> <given-names>M.</given-names></name> <name><surname>Rayner</surname> <given-names>K.</given-names></name></person-group> (<year>2015</year>). <article-title>The effect of contextual constraint on parafoveal processing in reading</article-title>. <source>J. Mem. Lang.</source> <volume>83</volume>, <fpage>118</fpage>&#x2013;<lpage>139</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jml.2015.04.005</pub-id>, PMID: <pub-id pub-id-type="pmid">26257469</pub-id></citation></ref>
<ref id="ref54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schweigert</surname> <given-names>W.</given-names></name> <name><surname>Moates</surname> <given-names>D.</given-names></name></person-group> (<year>1988</year>). <article-title>Familiar idiom comprehension</article-title>. <source>J. Psycholinguist. Res.</source> <volume>17</volume>, <fpage>281</fpage>&#x2013;<lpage>296</lpage>. doi: <pub-id pub-id-type="doi">10.1007/BF01067198</pub-id></citation></ref>
<ref id="ref55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Side</surname> <given-names>R.</given-names></name></person-group> (<year>1990</year>). <article-title>Phrasal verbs: sorting them out</article-title>. <source>ELT J.</source> <volume>44</volume>, <fpage>144</fpage>&#x2013;<lpage>152</lpage>. doi: <pub-id pub-id-type="doi">10.1093/elt/44.2.144</pub-id></citation></ref>
<ref id="ref56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Siyanova-Chanturia</surname> <given-names>A.</given-names></name> <name><surname>Conklin</surname> <given-names>K.</given-names></name> <name><surname>Schmitt</surname> <given-names>N.</given-names></name></person-group> (<year>2011</year>). <article-title>Adding more fuel to the fire: an eye-tracking study of idiom processing by native and non-native speakers</article-title>. <source>Second. Lang. Res.</source> <volume>27</volume>, <fpage>251</fpage>&#x2013;<lpage>272</lpage>. doi: <pub-id pub-id-type="doi">10.1177/0267658310382068</pub-id></citation></ref>
<ref id="ref57"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Siyanova-Chanturia</surname> <given-names>A.</given-names></name> <name><surname>Martinez</surname> <given-names>R.</given-names></name></person-group> (<year>2014</year>). <article-title>The idiom principle revisited</article-title>. <source>Appl. Linguis.</source> <volume>35</volume>, <fpage>amt054</fpage>&#x2013;<lpage>amt569</lpage>. doi: <pub-id pub-id-type="doi">10.1093/applin/amt054</pub-id></citation></ref>
<ref id="ref58"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Siyanova-Chanturia</surname> <given-names>A.</given-names></name> <name><surname>Schmitt</surname> <given-names>N.</given-names></name></person-group> (<year>2007</year>). <article-title>Native and nonnative use of multi-word vs. one-word verbs</article-title>. <source>Int. Rev. Applied Linguist. Lang. Teach.</source> <volume>45</volume>, <fpage>119</fpage>&#x2013;<lpage>139</lpage>. doi: <pub-id pub-id-type="doi">10.1515/IRAL.2007.005</pub-id>, PMID: <pub-id pub-id-type="pmid">40292255</pub-id></citation></ref>
<ref id="ref59"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sonbul</surname> <given-names>S.</given-names></name> <name><surname>El-Dakhs</surname> <given-names>D. A. S.</given-names></name> <name><surname>Al-Otaibi</surname> <given-names>H.</given-names></name></person-group> (<year>2020</year>). <article-title>Productive versus receptive L2 knowledge of polysemous phrasal verbs: a comparison of determining factors</article-title>. <source>System</source> <volume>95</volume>:<fpage>102361</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.system.2020.102361</pub-id></citation></ref>
<ref id="ref60"><citation citation-type="book"><person-group person-group-type="author"><collab id="coll3">SR</collab></person-group> (<year>2021</year>). <source>Mississauga</source>. <publisher-loc>Ontario, Canada</publisher-loc>: <publisher-name>SR Research Ltd.</publisher-name></citation></ref>
<ref id="ref0040"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Titone</surname> <given-names>D.</given-names></name> <name><surname>Columbus</surname> <given-names>G.</given-names></name> <name><surname>Whitford</surname> <given-names>V.</given-names></name> <name><surname>Mercier</surname> <given-names>J.</given-names></name> <name><surname>Libben</surname> <given-names>M.</given-names></name></person-group> (<year>2015</year>). &#x201C;<article-title>Contrasting bilingual and monolingual idiom processing,</article-title>&#x201D; in <source>Bilingual figurative language processing</source>. eds. <person-group person-group-type="editor"><name><surname>Heredia</surname> <given-names>R. R.</given-names></name> <name><surname>Cieslicka</surname> <given-names>A. B.</given-names></name></person-group> (<publisher-loc>Cambridge</publisher-loc>: <publisher-name>Cambridge University Press</publisher-name>), <fpage>171</fpage>&#x2013;<lpage>207</lpage>.</citation></ref>
<ref id="ref64"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Titone</surname> <given-names>D. A.</given-names></name> <name><surname>Connine</surname> <given-names>C. M.</given-names></name></person-group> (<year>1999</year>). <article-title>On the compositional and non-compositional nature of idiomatic expressions</article-title>. <source>J. Pragmat.</source> <volume>31</volume>, <fpage>1655</fpage>&#x2013;<lpage>1674</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0378-2166(99)00008-9</pub-id></citation></ref>
<ref id="ref65"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Titone</surname> <given-names>D. A.</given-names></name> <name><surname>Libben</surname> <given-names>M.</given-names></name></person-group> (<year>2014</year>). <article-title>Time-dependent effects of decomposability, familiarity and literal plausibility on idiom priming: a cross-modal priming investigation</article-title>. <source>Mental Lexicon</source> <volume>9</volume>, <fpage>473</fpage>&#x2013;<lpage>496</lpage>. doi: <pub-id pub-id-type="doi">10.1075/ml.9.3.05tit</pub-id></citation></ref>
<ref id="ref66"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>van Ginkel</surname> <given-names>W.</given-names></name> <name><surname>Dijkstra</surname> <given-names>T.</given-names></name></person-group> (<year>2020</year>). <article-title>The tug of war between an idiom's figurative and literal meanings: evidence from native and bilingual speakers</article-title>. <source>Biling. Lang. Congn.</source> <volume>23</volume>, <fpage>131</fpage>&#x2013;<lpage>147</lpage>. doi: <pub-id pub-id-type="doi">10.1017/S1366728918001219</pub-id></citation></ref>
<ref id="ref68"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>M.</given-names></name> <name><surname>Koda</surname> <given-names>K.</given-names></name></person-group> (<year>2005</year>). <article-title>Commonalities and differences in word identification skills among learners of English as a second language</article-title>. <source>Lang. Learn.</source> <volume>55</volume>, <fpage>71</fpage>&#x2013;<lpage>98</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.0023-8333.2005.00290.x</pub-id></citation></ref>
<ref id="ref70"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>X.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Tian</surname> <given-names>W.</given-names></name> <name><surname>Zheng</surname> <given-names>W.</given-names></name> <name><surname>Chen</surname> <given-names>X.</given-names></name></person-group> (<year>2021</year>). <article-title>The roles of familiarity and context in processing Chinese xiehouyu: an ERP study</article-title>. <source>J. Psycholinguist. Res.</source> <volume>50</volume>, <fpage>901</fpage>&#x2013;<lpage>921</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s10936-020-09753-0</pub-id>, PMID: <pub-id pub-id-type="pmid">33389396</pub-id></citation></ref>
<ref id="ref69"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Sun</surname> <given-names>E.-H.</given-names></name> <name><surname>Zhang</surname> <given-names>J.-J.</given-names></name></person-group> (<year>2016</year>). <article-title>Sentence contexts affect Chinese-English bilinguals&#x2019; semantic processing of English phrasal verbs: evidence from eye movement research</article-title>. <source>Foreign Lang. Teach. Res.</source> <volume>48</volume>, <fpage>249</fpage>&#x2013;<lpage>321</lpage>.</citation></ref>
<ref id="ref72"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wisintainer</surname> <given-names>S.</given-names></name> <name><surname>Mota</surname> <given-names>B.</given-names></name></person-group> (<year>2018</year>). <article-title>Processing of literal phrasal verbs by non-native and native speakers of English: an eye movement study</article-title>. <source>Letr&#x00F4;nica</source> <volume>10</volume>, <fpage>717</fpage>&#x2013;<lpage>729</lpage>. doi: <pub-id pub-id-type="doi">10.15448/1984-4301.2017.2.26451</pub-id></citation></ref>
<ref id="ref73"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wolter</surname> <given-names>B.</given-names></name> <name><surname>Yamashita</surname> <given-names>J.</given-names></name></person-group> (<year>2018</year>). <article-title>Word frequency, collocational frequency, L1 congruency, and proficiency in L2 collocational processing: what accounts for L2 performance?</article-title> <source>Studies Second Lang. Acquisition</source> <volume>40</volume>, <fpage>395</fpage>&#x2013;<lpage>416</lpage>. doi: <pub-id pub-id-type="doi">10.1017/S0272263117000237</pub-id></citation></ref>
<ref id="ref74"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Wray</surname> <given-names>A.</given-names></name></person-group> (<year>2002</year>). <source>Formulaic language and the lexicon</source>. <publisher-loc>Cambridge</publisher-loc>: <publisher-name>Cambridge University Press</publisher-name>.</citation></ref>
<ref id="ref9004"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Wu</surname> <given-names>Shiyu</given-names></name></person-group>. (<year>2019</year>). <source>Second Language Processing and R in Application</source>. <publisher-loc>Beijing</publisher-loc>: <publisher-name>Foreign Language Teaching and Research Press</publisher-name>.</citation></ref>
<ref id="ref75"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yan</surname> <given-names>G.</given-names></name> <name><surname>Xiong</surname> <given-names>J.</given-names></name> <name><surname>Zang</surname> <given-names>C.</given-names></name> <name><surname>Yu</surname> <given-names>L.</given-names></name> <name><surname>Cui</surname> <given-names>U.</given-names></name> <name><surname>Bai</surname> <given-names>X.</given-names></name></person-group> (<year>2013</year>). <article-title>Review of eye-movement measures in Reading research</article-title>. <source>Adv. Psychol. Sci.</source> <volume>21</volume>, <fpage>589</fpage>&#x2013;<lpage>605</lpage>. doi: <pub-id pub-id-type="doi">10.3724/SP.J.1042.2013.00589</pub-id></citation></ref>
<ref id="ref76"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yee</surname> <given-names>E.</given-names></name> <name><surname>Sedivy</surname> <given-names>J. C.</given-names></name></person-group> (<year>2006</year>). <article-title>Eye movements to pictures reveal transient semantic activation during spoken word recognition</article-title>. <source>J. Exp. Psychol. Learn. Mem. Cogn.</source> <volume>32</volume>, <fpage>1</fpage>&#x2013;<lpage>14</lpage>. doi: <pub-id pub-id-type="doi">10.1037/0278-7393.32.1.1</pub-id>, PMID: <pub-id pub-id-type="pmid">16478336</pub-id></citation></ref>
<ref id="ref77"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yi</surname> <given-names>W.</given-names></name> <name><surname>Zhong</surname> <given-names>Y.</given-names></name></person-group> (<year>2023</year>). <article-title>The processing advantage of multiword sequences: a meta-analysis</article-title>. <source>Stud. Second. Lang. Acquis.</source> <volume>46</volume>, <fpage>427</fpage>&#x2013;<lpage>452</lpage>. doi: <pub-id pub-id-type="doi">10.1017/S0272263123000542</pub-id>, PMID: <pub-id pub-id-type="pmid">40247472</pub-id></citation></ref>
<ref id="ref79"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>P.</given-names></name> <name><surname>Chen</surname> <given-names>H.</given-names></name></person-group> (<year>2019</year>). <article-title>How input frequency and input interval affect the acquisition of English phrasal verbs</article-title>. <source>J. PLA Univ. Foreign Lang.</source> <volume>42</volume>, <fpage>1</fpage>&#x2013;<lpage>9</lpage>.</citation></ref>
<ref id="ref80"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>X.</given-names></name> <name><surname>Wen</surname> <given-names>J.</given-names></name></person-group> (<year>2019</year>). <article-title>Exploring multiple constraints on second language development of English polysemous phrasal verbs</article-title>. <source>Appl. Psycholinguist.</source> <volume>40</volume>, <fpage>1073</fpage>&#x2013;<lpage>1101</lpage>. doi: <pub-id pub-id-type="doi">10.1017/S0142716419000146</pub-id></citation></ref>
<ref id="ref81"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhou</surname> <given-names>Y.</given-names></name> <name><surname>Zhang</surname> <given-names>S.</given-names></name></person-group> (<year>2011</year>). <article-title>A study of English majors&#x2019; processing of English idioms</article-title>. <source>J. PLA Univ. Foreign Lang.</source> <volume>34</volume>, <fpage>46</fpage>&#x2013;<lpage>127</lpage>.</citation></ref>
</ref-list>
</back>
</article>