% LREC 2020 conference paper proposing unified Universal Dependencies
% annotation guidelines for user-generated content (web and social media).
% The proceedings title lives in booktitle (required for inproceedings);
% address is the publisher's city, the conference venue is part of booktitle.
@inproceedings{SanguinettiBoscoCassidyetal.2020,
  author    = {Sanguinetti, Manuela and Bosco, Cristina and Cassidy, Lauren and {\c{C}}etino{\u{g}}lu, {\"O}zlem and Cignarella, Alessandra Teresa and Lynn, Teresa and Rehbein, Ines and Ruppenhofer, Josef and Seddah, Djam{\'e} and Zeldes, Amir},
  title     = {Treebanking User-Generated Content: A Proposal for a Unified Representation in {Universal Dependencies}},
  booktitle = {Proceedings of the 12th International Conference on Language Resources and Evaluation ({LREC}), May 11--16, 2020, Palais du Pharo, Marseille, France},
  editor    = {Calzolari, Nicoletta and B{\'e}chet, Fr{\'e}d{\'e}ric and Blache, Philippe and Choukri, Khalid and Cieri, Christopher and Declerck, Thierry and Goggi, Sara and Isahara, Hitoshi and Maegaard, Bente and Mariani, Joseph and Mazo, H{\'e}l{\`e}ne and Moreno, Asuncion and Odijk, Jan and Piperidis, Stelios},
  publisher = {European Language Resources Association},
  address   = {Paris},
  pages     = {5240--5250},
  year      = {2020},
  isbn      = {979-10-95546-34-4},
  url       = {https://nbn-resolving.org/urn:nbn:de:bsz:mh39-98686},
  abstract  = {The paper presents a discussion on the main linguistic phenomena of user-generated texts found in web and social media, and proposes a set of annotation guidelines for their treatment within the Universal Dependencies (UD) framework. Given on the one hand the increasing number of treebanks featuring user-generated content, and its somewhat inconsistent treatment in these resources on the other, the aim of this paper is twofold: (1) to provide a short, though comprehensive, overview of such treebanks - based on available literature - along with their main features and a comparative analysis of their annotation criteria, and (2) to propose a set of tentative UD-based annotation guidelines, to promote consistent treatment of the particular phenomena found in these types of texts. 
The main goal of this paper is to provide a common framework for those teams interested in developing similar resources in UD, thus enabling cross-linguistic consistency, which is a principle that has always been in the spirit of UD.},
  language  = {en},
}