This paper describes the SALSA corpus, a large German corpus manually annotated with role-semantic information, based on the syntactically annotated TIGER newspaper corpus (Brants et al., 2002). The first release, comprising about 20,000 annotated predicate instances (about half the TIGER corpus), is scheduled for mid-2006. In this paper we discuss the frame-semantic annotation framework and its cross-lingual applicability, problems arising from exhaustive annotation, strategies for quality control, and possible applications.
%0 Conference Paper
%1 burchardt:_salsa
%A Burchardt, Aljoscha
%A Erk, Katrin
%A Frank, Anette
%A Kowalski, Andrea
%A Padó, Sebastian
%A Pinkal, Manfred
%B Proceedings of LREC 2006
%C Genoa, Italy
%D 2006
%K conference myown
%T The SALSA corpus: a German corpus resource for lexical semantics
%U http://www.lrec-conf.org/proceedings/lrec2006/pdf/339_pdf.pdf
%X This paper describes the SALSA corpus, a large German corpus manually annotated with role-semantic information, based on the syntactically annotated TIGER newspaper corpus (Brants et al., 2002). The first release, comprising about 20,000 annotated predicate instances (about half the TIGER corpus), is scheduled for mid-2006. In this paper we discuss the frame-semantic annotation framework and its cross-lingual applicability, problems arising from exhaustive annotation, strategies for quality control, and possible applications.
@inproceedings{burchardt:_salsa,
  abstract = {This paper describes the SALSA corpus, a large German corpus manually annotated with role-semantic information, based on the syntactically annotated TIGER newspaper corpus (Brants et al., 2002). The first release, comprising about 20,000 annotated predicate instances (about half the TIGER corpus), is scheduled for mid-2006. In this paper we discuss the frame-semantic annotation framework and its cross-lingual applicability, problems arising from exhaustive annotation, strategies for quality control, and possible applications.},
  added-at = {2017-04-03T19:28:28.000+0200},
  address = {Genoa, Italy},
  author = {Burchardt, Aljoscha and Erk, Katrin and Frank, Anette and Kowalski, Andrea and Padó, Sebastian and Pinkal, Manfred},
  biburl = {https://puma.ub.uni-stuttgart.de/bibtex/2b32a5c8f77cff9c736b01ce5c1ebc77c/sp},
  booktitle = {Proceedings of {LREC} 2006},
  interhash = {729a70f8bdb523410c3e0f2699cda177},
  intrahash = {b32a5c8f77cff9c736b01ce5c1ebc77c},
  keywords = {conference myown},
  timestamp = {2017-04-03T17:28:32.000+0200},
  title = {The {SALSA} corpus: a {German} corpus resource for lexical semantics},
  url = {http://www.lrec-conf.org/proceedings/lrec2006/pdf/339_pdf.pdf},
  year = 2006
}