@InProceedings{Hansen_Teich:2002,
AUTHOR = {Hansen, Silvia and Teich, Elke},
TITLE = {The creation and exploitation of a translation reference corpus},
YEAR = {2002},
BOOKTITLE = {Proceedings of the First International Workshop on Language Resources for Translation Work and Research (3rd International Conference on Language Resources and Evaluation (LREC-2002)), May 28},
ADDRESS = {Las Palmas de Gran Canaria, Spain},
URL = {https://www.coli.uni-saarland.de/~hansen/hansen-teich.zip},
ABSTRACT = {While in many branches of linguistics monolingual reference corpora are widely used, e.g., in lexicography, in the construction of grammars and generally in empirical linguistic studies, in translation research as well as translation practice the concept of a parallel refernce corpus has not yet assumed a similarly important role. In our view, this is partly due to a lack of interaction of researchers involved in the development of corpus tools (computational linguistics, humanities computing) and the potential users of such tools in the area of translation (translatology, translation practice). The goal of the present paper is to initiate such an interaction. We present the design of an German-English and French-English translation corpus and explore its use as a reference corpus for translatologists as well as translators. First, we introduce the the basic computational techniques needed to build such a translation reference corpus. These techniques cover the preparation of the corpus as well as its linguistic annotation. In the preparatory step the corpus has to be aligned and encoded. To enrich the corpus with linguistic information, part-of-speech tagging and syntactic parsing have to be carried out for the different languages. Furthermore, to make the parallel reference corpus usable for translation scholars and translators, it has to be searchable, i.e., appropriate query facilities must be provided. We show how to extract instances of linguistic phenomena that are of interest from a translation point of view using a multilingual English-German-French corpus. We explain possible translation procedures for perfect aspect, reduced relative clauses and cleft constructions from English into German and French on the basis of parallel concordances extracted from the translation reference corpus. Finally, we specify some additional requirements to improve the usability of translation corpora in both translation studies and translation practice.} }
|