@inproceedings{RehbeinScholmanDemberg2016, author = {Ines Rehbein and Merel Scholman and Vera Demberg}, title = {Annotating Discourse Relations in Spoken Language: A Comparison of the PDTB and CCR Frameworks}, series = {Proceedings of the 10th International Conference on Language Resources and Evaluation (LREC 2016). May 23-28, 2016. Portorož, Slovenia}, editor = {Nicoletta Calzolari and Khalid Choukri and Thierry Declerck and Sara Goggi and Marko Grobelnik and Bente Maegaard and Joseph Mariani and H{\´e}l{\`e}ne Mazo and Asunci{\´o}n Moreno and Jan Odijk and Stelios Piperidis}, publisher = {European Language Resources Association}, address = {Paris}, isbn = {978-2-9517408-9-1}, url = {https://nbn-resolving.org/urn:nbn:de:bsz:mh39-56068}, pages = {23 -- 28}, year = {2016}, abstract = {In discourse relation annotation, there is currently a variety of different frameworks being used, and most of them have been developed and employed mostly on written data. This raises a number of questions regarding interoperability of discourse relation annotation schemes, as well as regarding differences in discourse annotation for written vs. spoken domains. In this paper, we describe ouron annotating two spoken domains from the SPICE Ireland corpus (telephone conversations and broadcast interviews) according todifferent discourse annotation schemes, PDTB 3.0 and CCR. We show that annotations in the two schemes can largely be mappedone another, and discuss differences in operationalisations of discourse relation schemes which present a challenge to automatic mapping. We also observe systematic differences in the prevalence of implicit discourse relations in spoken data compared to written texts,find that there are also differences in the types of causal relations between the domains. Finally, we find that PDTB 3.0 addresses many shortcomings of PDTB 2.0 wrt. the annotation of spoken discourse, and suggest further extensions. The new corpus has roughly theof the CoNLL 2015 Shared Task test set, and we hence hope that it will be a valuable resource for the evaluation of automatic discourse relation labellers.}, language = {en} }