<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE root>
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" article-type="research-article" dtd-version="1.2" xml:lang="en"><front><journal-meta><journal-id journal-id-type="publisher-id">Russian Journal of Linguistics</journal-id><journal-title-group><journal-title xml:lang="en">Russian Journal of Linguistics</journal-title><trans-title-group xml:lang="ru"><trans-title>Russian Journal of Linguistics</trans-title></trans-title-group></journal-title-group><issn publication-format="print">2687-0088</issn><issn publication-format="electronic">2686-8024</issn><publisher><publisher-name xml:lang="en">Peoples’ Friendship University of Russia named after Patrice Lumumba (RUDN University)</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">31334</article-id><article-id pub-id-type="doi">10.22363/2687-0088-31187</article-id><article-categories><subj-group subj-group-type="toc-heading" xml:lang="en"><subject>Articles</subject></subj-group><subj-group subj-group-type="toc-heading" xml:lang="ru"><subject>Статьи</subject></subj-group><subj-group subj-group-type="toc-heading" xml:lang="zh"><subject>Articles</subject></subj-group><subj-group subj-group-type="article-type"><subject>Research Article</subject></subj-group></article-categories><title-group><article-title xml:lang="en">Word-formation complexity: a learner corpus-based study</article-title><trans-title-group xml:lang="ru"><trans-title>Словообразовательная сложность и ошибки учащихся в экзаменационных эссе</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-8374-423X</contrib-id><name-alternatives><name xml:lang="en"><surname>Lyashevskaya</surname><given-names>Olga Nikolaevna</given-names></name><name xml:lang="ru"><surname>Ляшевская</surname><given-names>Ольга Николаевна</given-names></name></name-alternatives><bio xml:lang="en"><p>Professor at the School of Linguistics, National Research University “Higher School of Economics” and a Senior Research Fellow at the Vinogradov Russian Language Institute, RAS</p></bio><bio xml:lang="ru"><p>профессор Школы лингвистики Национального исследовательского университета «Высшая школа экономики», старший научный сотрудник Института русского языка имени В. В. Виноградова РАН</p></bio><email>olesar@yandex.ru</email><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff2"/></contrib><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0003-3439-9788</contrib-id><name-alternatives><name xml:lang="en"><surname>Pyzhak</surname><given-names>Julia Vyacheslavovna</given-names></name><name xml:lang="ru"><surname>Пыжак</surname><given-names>Юлия Вячеславовна</given-names></name></name-alternatives><bio xml:lang="en"><p>student at the Department of Humanities</p></bio><bio xml:lang="ru"><p>студентка факультета гуманитарных наук</p></bio><email>jeneavas41@yandex.ru</email><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-5928-1482</contrib-id><name-alternatives><name xml:lang="en"><surname>Vinogradova</surname><given-names>Olga Il'inichna</given-names></name><name xml:lang="ru"><surname>Виноградова</surname><given-names>Ольга Ильинична</given-names></name></name-alternatives><bio xml:lang="en"><p>Associate Professor at the School of Linguistics</p></bio><bio xml:lang="ru"><p>доцент Школы лингвистики, научный сотрудник научно-учебной лаборатории учебных корпусов факультета гуманитарных наук</p></bio><email>olgavinogr@gmail.com</email><xref ref-type="aff" rid="aff1"/></contrib></contrib-group><aff-alternatives id="aff1"><aff><institution xml:lang="en">National Research University Higher School of Economics</institution></aff><aff><institution xml:lang="ru">Национальный исследовательский университет «Высшая школа экономики»</institution></aff></aff-alternatives><aff-alternatives id="aff2"><aff><institution xml:lang="en">Vinogradov Russian Language Institute of the Russian Academy of Sciences</institution></aff><aff><institution xml:lang="ru">Институт русского языка им. В. В. Виноградова РАН</institution></aff></aff-alternatives><pub-date date-type="pub" iso-8601-date="2022-06-29" publication-format="electronic"><day>29</day><month>06</month><year>2022</year></pub-date><volume>26</volume><issue>2</issue><issue-title xml:lang="en">Computational Linguistics and Discourse Complexology</issue-title><issue-title xml:lang="ru">Компьютерная лингвистика и дискурсивная комплексология</issue-title><fpage>471</fpage><lpage>492</lpage><history><date date-type="received" iso-8601-date="2022-06-29"><day>29</day><month>06</month><year>2022</year></date></history><permissions><copyright-statement xml:lang="en">Copyright ©; 2022, Lyashevskaya O.N., Pyzhak J.V., Vinogradova O.I.</copyright-statement><copyright-statement xml:lang="ru">Copyright ©; 2022, Ляшевская О.Н., Пыжак Ю.В., Виноградова О.И.</copyright-statement><copyright-statement xml:lang="zh">Copyright ©; 2022, Lyashevskaya O., Pyzhak J., Vinogradova O.</copyright-statement><copyright-year>2022</copyright-year><copyright-holder xml:lang="en">Lyashevskaya O.N., Pyzhak J.V., Vinogradova O.I.</copyright-holder><copyright-holder xml:lang="ru">Ляшевская О.Н., Пыжак Ю.В., Виноградова О.И.</copyright-holder><copyright-holder xml:lang="zh">Lyashevskaya O., Pyzhak J., Vinogradova O.</copyright-holder><ali:free_to_read xmlns:ali="http://www.niso.org/schemas/ali/1.0/"/><license><ali:license_ref xmlns:ali="http://www.niso.org/schemas/ali/1.0/">https://creativecommons.org/licenses/by-nc/4.0</ali:license_ref></license></permissions><self-uri xlink:href="https://journals.rudn.ru/linguistics/article/view/31334">https://journals.rudn.ru/linguistics/article/view/31334</self-uri><abstract xml:lang="en"><p style="text-align: justify;">This article explores the word-formation dimension of learner text complexity which indicates how skilful the non-native speakers are in using more and less complex - and varied - derivational constructions. In order to analyse the association between complexity and writing accuracy in word formation as well as interactive effects of task type, text register, and native language background, we examine the materials of the REALEC corpus of English essays written by university students with Russian L1. We present an approach to measure derivational complexity based on the classification of suffixes offered in Bauer and Nation (1993) and then compare the complexity results and the number of word formation errors annotated in the texts. Starting with the hypothesis that with increasing complexity the number of errors will decrease, we apply statistical analysis to examine the association between complexity and accuracy. We found, first, that the use of more advanced word-formation suffixes affects the number of errors in texts. Second, different levels of suffixes in the hierarchy affect derivation accuracy in different ways. In particular, the use of irregular derivational models is positively associated with the number of errors. Third, the type of examination task and expected format and register of writing should be taken into consideration. The hypothesis holds true for regular but infrequent advanced suffixal models used in more formal descriptive essays associated with an academic register. However, for less formal texts with lower academic register requirements, the hypothesis needs to be amended.</p></abstract><trans-abstract xml:lang="ru"><p style="text-align: justify;">В статье рассматривается словообразовательная сложность учебных текстов, которая трактуется как система измерений, показывающих разнообразие приемов словообразования разного уровня, от простых до продвинутых, используемых учащимся. Анализируется взаимосвязь между сложностью и ошибками, которые учащиеся допускают в словообразовании. Исследование основано на материалах REALEC - корпуса английских экзаменационных эссе, написанных студентами университета с родным русским языком. Предлагается подход к измерению словообразовательной сложности, основанный на классификации суффиксов Бауэра и Нейшена (Bauer &amp; Nation 1993), и анализируется соответствие между показателями индексов сложности и количеством ошибок словообразования, размеченных в текстах корпуса, с учетом типа экзаменационного задания. Постулируется гипотеза о том, что с увеличением сложности количество ошибок должно уменьшаться, и проводится статистический анализ параметров сложности и безошибочности. В работе показано, во-первых, что использование словообразовательных суффиксов более высокой сложности связано с количеством ошибок в текстах. Во-вторых, разные уровни иерархии сложности оказывают разнонаправленное влияние на точность: в частности, использование нерегулярных словообразовательных моделей положительно связано с количеством ошибок. В-третьих, следует учитывать тип экзаменационного задания, в том числе ожидаемые формально-регистровые особенности текста. Гипотеза была подтверждена для регулярных, но нечастотных суффиксальных моделей при их использовании в описаниях рисунков и графиков - текстах, следующих определенному формату и включающих элементы академического письма. Однако в случае аргументативных эссе выдвинутая гипотеза требует уточнения.</p></trans-abstract><kwd-group xml:lang="en"><kwd>linguistic complexity</kwd><kwd>morphological complexity</kwd><kwd>writing accuracy</kwd><kwd>word formation</kwd><kwd>English</kwd><kwd>learner corpora</kwd></kwd-group><kwd-group xml:lang="ru"><kwd>лингвистическая сложность</kwd><kwd>морфологическая сложность</kwd><kwd>безошибочность письма</kwd><kwd>словообразование</kwd><kwd>английский язык как иностранный</kwd><kwd>учебные корпуса</kwd></kwd-group><funding-group/></article-meta></front><body></body><back><ref-list><ref id="B1"><label>1.</label><mixed-citation>Abrahamsson, Niclas. 2013. U-shaped learning and overgeneralization. In Peter Robinson (ed.), The routledge encyclopedia of second language acquisition, 663-664. London: Routledge. https://doi.org/10.4324/9780203135945</mixed-citation></ref><ref id="B2"><label>2.</label><mixed-citation>Baayen, R. Harald. 2009. Corpus linguistics in morphology: Morphological productivity. In Anke Lüdeling &amp; Merja Kytö (eds.), Corpus linguistics: An international handbook, 899-919. Berlin, New York: De Gruyter Mouton. https://doi.org/10.1515/9783110213881.2.899</mixed-citation></ref><ref id="B3"><label>3.</label><mixed-citation>Baerman, Matthew, Dunstan Brown &amp; Greville G. Corbett (eds.). 2015. Understanding and Measuring Morphological Complexity. Oxford: Oxford University Press. https://doi.org/10.1093/acprof:oso/9780198723769.001.0001</mixed-citation></ref><ref id="B4"><label>4.</label><mixed-citation>Bardovi-Harlig, Kathleen &amp; Theodora Bofman. 1989. Attainment of syntactic and morphological accuracy by advanced language learners. Studies in Second Language Acquisition 11(1). 17-34.</mixed-citation></ref><ref id="B5"><label>5.</label><mixed-citation>Bauer, Laurie &amp; Paul Nation 1993. Word families. International Journal of Lexicography 6(4). 253-279.</mixed-citation></ref><ref id="B6"><label>6.</label><mixed-citation>Biber, Douglas. 1988. Variation Across Speech and Writing. Cambridge: Cambridge University Press.</mixed-citation></ref><ref id="B7"><label>7.</label><mixed-citation>Brezina, Vaclav &amp; Gabriele Pallotti. 2019. Morphological complexity in written L2 texts. Second Language Research 35(1). 99-119. https://doi.org/10.1177/0267658316643125</mixed-citation></ref><ref id="B8"><label>8.</label><mixed-citation>Brezina, Vaclav, Pierre Weill-Tessier &amp; Antony McEnery. 2020. #LancsBox v. 5.x. URL: http://corpora.lancs.ac.uk/lancsbox (accessed 25.05.2021).</mixed-citation></ref><ref id="B9"><label>9.</label><mixed-citation>Brown, Dale, Tim Stoeckel, Stuart Mclean &amp; Jeff Stewart. 2020. The most appropriate lexical unit for L2 vocabulary research and pedagogy: A brief review of the evidence. Applied Linguistics, amaa061. https://doi.org/10.1093/applin/amaa061</mixed-citation></ref><ref id="B10"><label>10.</label><mixed-citation>Bulté, Bram &amp; Alex Housen. 2012. Defining and operationalising L2 complexity. In Alex Housen, Folkert Kuiken &amp; Ineke Vedder (eds.), Dimensions of L2 performance and proficiency: Complexity, accuracy and fluency in SLA, 21-46. Amsterdam: John Benjamins. https://doi.org/10.1075/lllt.32.02bul</mixed-citation></ref><ref id="B11"><label>11.</label><mixed-citation>Bulté, Bram &amp; Alex Housen. 2014. Conceptualizing and measuring short-term changes in L2 writing complexity. Journal of Second Language Writing 26. 42-65. https://doi.org/10.1016/j.jslw.2014.09.005</mixed-citation></ref><ref id="B12"><label>12.</label><mixed-citation>Capel, Annette. 2010. A1-B2 vocabulary: Insights and issues arising from the English Profile Wordlists project. English Profile Journal 1(1). 2-7. https://doi.org/10.1017/S2041536210000048</mixed-citation></ref><ref id="B13"><label>13.</label><mixed-citation>Crossley, Scott. 2020. Linguistic features in writing quality and development: An overview. Journal of Writing Research 11(3). 415-443. https://doi.org/10.17239/jowr-2020.11.03.01</mixed-citation></ref><ref id="B14"><label>14.</label><mixed-citation>de la Torre García, Nuria, María Cecilia Ainciburu &amp; Kris Buyse. 2021. Morphological complexity and rated writing proficiency: The case of verbal inflectional diversity in L2 Spanish. ITL - International Journal of Applied Linguistics 172(2). 290-318. https://doi.org/10.1075/itl.20009.del</mixed-citation></ref><ref id="B15"><label>15.</label><mixed-citation>Dobson, Annette J. 1990. An Introduction to Generalized Linear Models. London: Chapman and Hall.</mixed-citation></ref><ref id="B16"><label>16.</label><mixed-citation>Ehret, Katharina &amp; Benedikt Szmrecsanyi. 2019. Compressing learner language: An information-theoretic measure of complexity in SLA production data. Second Language Research 35(1). 23-45. https://doi.org/10.1177/0267658316669559</mixed-citation></ref><ref id="B17"><label>17.</label><mixed-citation>Hassanzadeh, Fatemeh &amp; Iraj Kazemi. 2017. Regression modeling of one-inflated positive count data. Statistical Papers 58(3). 791-809. https://doi.org/10.1007/s00362-015-0726-7</mixed-citation></ref><ref id="B18"><label>18.</label><mixed-citation>Hay, Jennifer &amp; R. Harald Baayen. 2002. Parsing and productivity. In Geert E. Booij &amp; Jaap Van Marle (eds.), Yearbook of morphology 2001, 203-235. Dordrecht: Kluwer Academic. https://doi.org/10.1007/978-94-017-3726-5_8.</mixed-citation></ref><ref id="B19"><label>19.</label><mixed-citation>Hollander, Myles &amp; Douglas A. Wolfe. 1973. Nonparametric Statistical Methods. New York: John Wiley &amp; Sons.</mixed-citation></ref><ref id="B20"><label>20.</label><mixed-citation>Horst, Marlise &amp; Laura Collins. 2006. From faible to strong: How does their vocabulary grow? Canadian Modern Language Review 63(1). 83-106.  https://doi.org/10.1353/cml.2006.0046</mixed-citation></ref><ref id="B21"><label>21.</label><mixed-citation>Kimppa, Lilli , Yury Shtyrov, Suzanne C.A. Hut, Laura Hedlund, Miika Leminen &amp; Alina Leminen. 2019. Acquisition of L2 morphology by adult language learners. Cortex 116. 74-90. https://doi.org/10.1016/j.cortex.2019.01.012</mixed-citation></ref><ref id="B22"><label>22.</label><mixed-citation>Lahuerta, Ana Cristina. 2018. Study of accuracy and grammatical complexity in EFL writing. International Journal of English Studies 18(1). 71-89. https://doi.org/10.6018/ijes/2018/1/258971</mixed-citation></ref><ref id="B23"><label>23.</label><mixed-citation>Laufer, Batia, Stuart Webb, Su Kyung Kim &amp; Beverley Yohanan. 2021. How well do learners know derived words in a second language? The effect of proficiency, word frequency and type of affix. ITL - International Journal of Applied Linguistics 172(2). 229-258. https://doi.org/10.1075/itl.20020.lau</mixed-citation></ref><ref id="B24"><label>24.</label><mixed-citation>Laws, Jacqueline &amp; Chris Ryder. 2014. Getting the measure of derivational morphology in adult speech a corpus analysis using MorphoQuantics. University of Reading Language Studies Working Papers 6. 3-17. http://morphoquantics.co.uk/Resources/Laws%20&amp;%20Ryder%20(2014).pdf (accessed 25.06.2021)</mixed-citation></ref><ref id="B25"><label>25.</label><mixed-citation>Leontjev, Dmitri. 2016. L2 English derivational knowledge: Which affixes are learners more likely to recognise? Studies in Second Language Learning and Teaching 6(2). 225-248. https://doi.org/10.14746/ssllt.2016.6.2.3</mixed-citation></ref><ref id="B26"><label>26.</label><mixed-citation>Lyashevskaya, Olga, Irina Panteleev &amp; Olga Vinogradova. 2021. Automated assessment of learner text complexity. Assessing Writing 49, article 100529. https://doi.org/10.1016/j.asw.2021.100529</mixed-citation></ref><ref id="B27"><label>27.</label><mixed-citation>Lyashevskaya, Olga, Olga Vinogradova &amp; Anna Scherbakova. (forthc.) Accuracy, syntactic complexity, and task type at play in examination writing: A corpus-based study. In Agnieszka Leńko-Szymańska &amp; Sandra Götz (eds.), Complexity, accuracy, and fluency in learner corpus research.</mixed-citation></ref><ref id="B28"><label>28.</label><mixed-citation>Marchand, Hans. 1969. The Categories and Types of Present-Day English Word-Formation. 2nd ed. Munich: C. H. Beck.</mixed-citation></ref><ref id="B29"><label>29.</label><mixed-citation>Nation, Paul. 2021. Thoughts on word families. Studies in Second Language Acquisition 43(5). 969-972. https://doi.org/10.1017/S027226312100067X</mixed-citation></ref><ref id="B30"><label>30.</label><mixed-citation>Norris, John &amp; Lourdes Ortega. 2009. Measurement for understanding: An organic approach to investigating complexity, accuracy, and fluency in SLA. Applied Linguistics 30(4). 555-578. https://doi.org/10.1093/applin/amp044</mixed-citation></ref><ref id="B31"><label>31.</label><mixed-citation>Plakans, Lia, Atta Gebril &amp; Zeynep Bilki. 2019. Shaping a score: Complexity, accuracy, and fluency in integrated writing performances. Language Testing 36(2). 161-179. https://doi.org/10.1177/0265532216669537</mixed-citation></ref><ref id="B32"><label>32.</label><mixed-citation>Plag, Ingo, Christiane Dalton-Puffer &amp; Harald Baayen. 1999. Morphological productivity across speech and writing. English Language &amp; Linguistics 3(2). 209-228.</mixed-citation></ref><ref id="B33"><label>33.</label><mixed-citation>R Core Team. 2019. R: A language and environment for statistical computing. R Foundation for Statistical Computing, Vienna, Austria. https://www.r-project.org (accessed 25.06.2021).</mixed-citation></ref><ref id="B34"><label>34.</label><mixed-citation>Robinson, Peter. 2001. Task complexity, task difficulty, and task production: Exploring interactions in a componential framework. Applied Linguistics 22(1). 27-57. https://doi-org.proxylibrary.hse.ru/10.1093/applin/22.1.27</mixed-citation></ref><ref id="B35"><label>35.</label><mixed-citation>Robinson, Peter. 2011. Second language task complexity, the Cognition Hypothesis, language learning, and performance. In Peter Robinson (ed.), Second language task complexity: Researching the Cognition Hypothesis of language learning and performance, 3-39. Amsterdam: John Benjamins. https://doi.org/10.1075/tblt.2.05ch1</mixed-citation></ref><ref id="B36"><label>36.</label><mixed-citation>Skehan, Peter. 1998. A Cognitive Approach to Language Learning. Oxford: Oxford University Press.</mixed-citation></ref><ref id="B37"><label>37.</label><mixed-citation>Skehan, Peter. 2009. Modelling second language performance: Integrating complexity, accuracy, fluency, and lexis. Applied Linguistics 30(4). 510-532. https://doi.org/10.1093/applin/amp047</mixed-citation></ref><ref id="B38"><label>38.</label><mixed-citation>Stein, Gabriele. 2007. A Dictionary of English Affixes: Their Function and Meaning. Munich: Lincom Europa.</mixed-citation></ref><ref id="B39"><label>39.</label><mixed-citation>Tywoniw, Rurik &amp; Scott Crossley. 2020. Morphological complexity of L2 discourse. In Eric Friginal &amp; Jack A. Hardy (eds.), The Routledge handbook of corpus approaches to discourse analysis, 269-297. London: Routledge. https://doi.org/10.4324/9780429259982-17</mixed-citation></ref><ref id="B40"><label>40.</label><mixed-citation>van der Slik, Frans, Roeland van Hout &amp; Job Schepens. 2019. The role of morphological complexity in predicting the learnability of an additional language: The case of La (additional language) Dutch. Second Language Research 35(1). 47-70. https://doi.org/10.1177/0267658317691322</mixed-citation></ref><ref id="B41"><label>41.</label><mixed-citation>Vasylets, Olena, Roger Gilabert &amp; Rosa M. Manchón. 2017. The effects of mode and task complexity on second language production. Language Learning 67(2). 394-430 https://doi.org/10.1111/lang.1222</mixed-citation></ref><ref id="B42"><label>42.</label><mixed-citation>Vinogradova, Olga, Olga Lyashevskaya &amp; Irina Panteleeva. 2017. Multi-level student essay feedback in a learner corpus. In Computational Linguistics and Intellectual Technologies. Proceedings of the International Conference Dialogue 2017. 373-387. Moscow.</mixed-citation></ref><ref id="B43"><label>43.</label><mixed-citation>Yee, Thomas W. 2015. Vector Generalized Linear and Additive Models. Springer. https://doi.org/10.1007/978-1-4939-2818-7</mixed-citation></ref><ref id="B44"><label>44.</label><mixed-citation>Yoon, Hyung-Jo. 2017. Linguistic complexity in L2 writing revisited: Issues of topic, proficiency, and construct multidimensionality. System 66. 130-141. https://doi.org/10.1016/j.system.2017.03.007</mixed-citation></ref></ref-list></back></article>
