% Paper on automatic classification of Russian texts into difficulty levels,
% published in the "Korpusnaja lingvistika - 2017" conference proceedings
% (Sankt-Peterburg, pp. 9--15). The proceedings title is held in booktitle,
% which this entry type requires.
% NOTE(review): the citation key contains the non-ASCII letter "ć"; it is kept
% as-is so existing citations keep resolving, but classic 8-bit BibTeX
% toolchains may not accept it -- confirm the target toolchain is Biber/UTF-8.
@incollection{BatinićBirzerZinsmeister2017,
  author    = {Batinić, Dolores and Birzer, Sandra and Zinsmeister, Heike},
  title     = {Automatic classification of {Russian} texts for didactic purposes},
  booktitle = {Trudy meždunarodnoj konferencii „Korpusnaja lingvistika - 2017“. 27-30 ijunja 2017 g., Sankt-Peterburg},
  publisher = {Izdatel´stvo Sankt-Peterburgskogo gosudarstvennogo universiteta},
  address   = {Sankt-Peterburg},
  year      = {2017},
  pages     = {9--15},
  issn      = {2412-9623},
  url       = {https://nbn-resolving.org/urn:nbn:de:bsz:mh39-66003},
  abstract  = {In this paper we present the results of an automatic classification of Russian texts into three levels of difficulty. Our aim is to build a study corpus of Russian, in which a L2 student is able to select texts of a desired complexity. We are building on a pilot study, in which we classified Russian texts into two levels of difficulty. In the current paper, we apply the classification to an extended corpus of 577 labelled texts. The best-performing combination of features achieves an accuracy of 0,74 within at most one level difference.},
  language  = {en},
}