% Mueller and Strube, LREC 2002 conference paper on a Java API for annotated corpora.
% The citation key is plain ASCII: braces or accent macros inside a key break BibTeX key parsing.
% The year follows the conference named in booktitle (LREC'02, May 2002) and the proceedings URL.
@inproceedings{MuellerStrube2002,
  author    = {M{\"u}ller, Mark-Christoph and Strube, Michael},
  title     = {An {API} for discourse-level access to {XML}-encoded corpora},
  booktitle = {Proceedings of the Third International Conference on Language Resources and Evaluation ({LREC}'02). May 29--31, 2002, Las Palmas, Canary Islands, Spain},
  editor    = {Gonz{\'a}lez Rodr{\'\i}guez, Manuel and Suarez Araujo, Carmen Paz},
  pages     = {26--30},
  year      = {2002},
  url       = {http://www.lrec-conf.org/proceedings/lrec2002/pdf/296.pdf},
  abstract  = {We describe a simple and efficient Java object model and application programming interface (API) for (possibly multi-modal) annotated natural language corpora. Corpora are represented as elements like Sentences, Turns, Utterances, Words, Gestures and Markables. The API allows linguists to access corpora in terms of these discourse-level elements, i.e. at a conceptual level they are familiar with, with the flexibility offered by a general purpose programming language. It is also a contribution to corpus standardization efforts because it is based on a straightforward and easily extensible data model which can serve as a target for conversion of different corpus formats.},
  subject   = {API},
  language  = {en},
}