To date, linguistically annotated corpora are mainly
exploited for feature-based training of automatic
labelling systems. In this paper, we present a general approach for the Description Logics-based modelling of multi-layered annotated corpora which offers (i) flexible and enhanced querying functionality that goes beyond current XML-based query languages, (ii) a basis for consistency checking, and (iii) a general method for defining abstractions over corpus annotations. We apply this method to the syntactically and semantically annotated SALSA/TIGER corpus. By defining abstractions over the corpus data, we generalise from a large set of individual corpus annotations to a corresponding lexicon model. We discuss issues arising from modelling multi-layered corpus annotations in Description Logics and illustrate the benefits of our approach at concrete examples.
%0 Conference Paper
%1 spohr07:_induc_comput_lexic_corpus_syntac_seman_annot
%A Spohr, Dennis
%A Burchardt, Aljoscha
%A Padó, Sebastian
%A Frank, Anette
%A Heid, Ulrich
%B Proceedings of IWCS-7
%C Tilburg, The Netherlands
%D 2007
%K myown workshop
%T Inducing a Computational Lexicon from a Corpus with Syntactic and Semantic Annotation
%U https://www.nlpado.de/~sebastian/pub/papers/iwcs07_spohr.pdf
%X To date, linguistically annotated corpora are mainly
exploited for feature-based training of automatic
labelling systems. In this paper, we present a general approach for the Description Logics-based modelling of multi-layered annotated corpora which offers (i) flexible and enhanced querying functionality that goes beyond current XML-based query languages, (ii) a basis for consistency checking, and (iii) a general method for defining abstractions over corpus annotations. We apply this method to the syntactically and semantically annotated SALSA/TIGER corpus. By defining abstractions over the corpus data, we generalise from a large set of individual corpus annotations to a corresponding lexicon model. We discuss issues arising from modelling multi-layered corpus annotations in Description Logics and illustrate the benefits of our approach at concrete examples.
@comment{Conference-paper record. The accented author surname is written as a LaTeX accent group so that classic 8-bit BibTeX sorts and typesets it correctly. The acronym in booktitle is brace-protected against style recasing.}
@inproceedings{spohr07:_induc_comput_lexic_corpus_syntac_seman_annot,
  abstract  = {To date, linguistically annotated corpora are mainly exploited for feature-based training of automatic labelling systems. In this paper, we present a general approach for the Description Logics-based modelling of multi-layered annotated corpora which offers (i) flexible and enhanced querying functionality that goes beyond current XML-based query languages, (ii) a basis for consistency checking, and (iii) a general method for defining abstractions over corpus annotations. We apply this method to the syntactically and semantically annotated SALSA/TIGER corpus. By defining abstractions over the corpus data, we generalise from a large set of individual corpus annotations to a corresponding lexicon model. We discuss issues arising from modelling multi-layered corpus annotations in Description Logics and illustrate the benefits of our approach at concrete examples.},
  added-at  = {2017-04-03T19:29:52.000+0200},
  address   = {Tilburg, The Netherlands},
  author    = {Spohr, Dennis and Burchardt, Aljoscha and Pad{\'o}, Sebastian and Frank, Anette and Heid, Ulrich},
  biburl    = {https://puma.ub.uni-stuttgart.de/bibtex/215170e56f27ffda9f527b6cc0a18506a/sp},
  booktitle = {Proceedings of {IWCS-7}},
  interhash = {19c4e961e6136b77a8eec819867c0cc9},
  intrahash = {15170e56f27ffda9f527b6cc0a18506a},
  keywords  = {myown workshop},
  timestamp = {2017-04-03T17:30:49.000+0200},
  title     = {Inducing a Computational Lexicon from a Corpus with Syntactic and Semantic Annotation},
  url       = {https://www.nlpado.de/~sebastian/pub/papers/iwcs07_spohr.pdf},
  year      = {2007},
}