%
% GENERATED FROM https://www.coli.uni-saarland.de
% by : anonymous
% IP : coli2006.lst.uni-saarland.de
% at : Mon, 05 Feb 2024 15:43:04 +0100 GMT
%
% Selection : Reference #1341
%
% Conference paper on the XML annotation format and tool developed within
% the MUCHMORE project (see ABSTRACT).
%
% Field notes:
%   URL       - a single link (the PDF), so that styles can wrap it in \url{}.
%   PSURL     - the alternative PostScript link; not a standard field, so
%               standard styles ignore it. Kept for reference only.
%   MONTH     - predefined month macro; the conference days are recorded
%               in EVENTDATE as an ISO 8601 range.
%   EVENTDATE - biblatex field; standard classic BibTeX styles ignore it.
%   ANNOTE    - COLI-internal file names, kept exactly as exported.
%

@InProceedings{Vintar_et_al:2002,
  AUTHOR    = {Vintar, Spela and Buitelaar, Paul and Ripplinger, B{\"a}rbel and
               Sacaleanu, Bogdan and Raileanu, Diana and Prescher, Detlef},
  TITLE     = {An Efficient and Flexible Format for Linguistic and Semantic Annotation},
  BOOKTITLE = {Proceedings of the 3rd International Conference on Language
               Resources and Evaluation ({LREC'02})},
  ADDRESS   = {Las Palmas, Canary Islands, Spain},
  YEAR      = {2002},
  MONTH     = may,
  EVENTDATE = {2002-05-29/2002-05-31},
  URL       = {http://www.dfki.de/dfkibib/publications/docs/lrec2002.dtd.final.pdf},
  PSURL     = {http://dfki.de/~paulb/lrec2002.dtd.ps},
  ABSTRACT  = {The paper describes an XML annotation format and tool developed
               within the MUCHMORE project. The annotation scheme was designed
               specifically for the purposes of Cross-Lingual Information
               Retrieval in the medical domain so as to allow both efficient
               and flexible access to layers of information. We use a parallel
               English-German corpus of medical abstracts and annotate it with
               linguistic information (tokenisation, part-of-speech tagging,
               lemmatisation and decomposition, phrase recognition, grammatical
               functions) as well as semantic information from various sources.
               The annotation of medical terms/concepts, semantic types and
               semantic relations is based on the Unified Medical Language
               System (UMLS). Additionally, we use EuroWordNet as a
               general-language resource in annotating word senses and to
               compare domain-specific and general language use. A major aim of
               the project is also to complement existing ontological resources
               by extracting new terms and new semantic relations. We present
               the annotation scheme, which is conceptually related to
               stand-off annotation, and describe our tool for automatic
               semantic annotation.},
  ANNOTE    = {COLIURL : Vintar:2002:EFF.pdf Vintar:2002:EFF.ps},
}