% Conference paper from the TLT13 workshop proceedings.
% The proceedings title lives in booktitle (required for inproceedings entries);
% publisher/address describe the publisher, not the venue.
% NOTE(review): year is 2018 while the workshop date in booktitle is 2014;
% presumably the repository deposit year -- confirm against the source record.
@inproceedings{RehbeinHirschmann2018,
  author    = {Rehbein, Ines and Hirschmann, Hagen},
  title     = {{POS} tagset refinement for linguistic analysis and the impact on statistical parsing},
  booktitle = {Proceedings of the Thirteenth International Workshop on Treebanks and Linguistic Theories ({TLT13}). December 12--13, 2014, T{\"u}bingen, Germany},
  editor    = {Henrich, Verena and Hinrichs, Erhard and de Kok, Dani{\"e}l and Osenova, Petya and Przepi{\'o}rkowski, Adam},
  publisher = {University of T{\"u}bingen},
  address   = {T{\"u}bingen},
  pages     = {172--183},
  year      = {2018},
  isbn      = {978-3-9809183-9-8},
  url       = {https://nbn-resolving.org/urn:nbn:de:bsz:mh39-80368},
  abstract  = {The annotation of parts of speech (POS) in linguistically annotated corpora is a fundamental annotation layer which provides the basis for further syntactic analyses, and many NLP tools rely on POS information as input. However, most POS annotation schemes have been developed with written (newspaper) text in mind and thus do not carry over well to text from other domains and genres. Recent discussions have concentrated on the shortcomings of present POS annotation schemes with regard to their applicability to data from domains other than newspaper text.},
  language  = {en},
}