% Conference paper introducing the International Comparable Corpus (ICC).
% NOTE(review): the citation key below contains non-ASCII characters, braces
% and a backslash; classic BibTeX is unlikely to parse it correctly. It is kept
% unchanged so existing citations still resolve -- consider renaming it to an
% ASCII-only key such as KirkCermakova2017 once citing documents can be updated.
@inproceedings{KirkČerm{\´a}kov{\´a}2017,
  author    = {Kirk, John and {\v{C}}erm{\'a}kov{\'a}, Anna},
  title     = {From {ICE} to {ICC}: The new {International Comparable Corpus}},
  booktitle = {Proceedings of the Workshop on Challenges in the Management of Large Corpora and Big Data and Natural Language Processing ({CMLC-5+BigNLP}) 2017 including the papers from the Web-as-Corpus ({WAC-XI}) guest section. Birmingham, 24 July 2017},
  editor    = {Ba{\'n}ski, Piotr and Kupietz, Marc and L{\"u}ngen, Harald and Rayson, Paul and Biber, Hanno and Breiteneder, Evelyn and Clematide, Simon and Mariani, John and Stevenson, Mark and Sick, Theresa},
  pages     = {7--12},
  year      = {2017},
  abstract  = {This paper outlines the broad research context and rationale for a new international comparable corpus (ICC). The ICC is to be largely modelled on the text categories and their quantities the International Corpus of English with only a few changes. The corpus will initially begin with nine European languages but others may join in due course. The paper reports on those and other agreements made at the inaugural planning meeting in Prague on 22-23 June 2017. It also sets out the project's goals for its first two years.},
  subject   = {Korpus},
  language  = {en},
}