Title |
Generalising Lexical Translation Strategies for MT Using Comparable Corpora |
Authors |
Bogdan Babych, Serge Sharoff and Anthony Hartley |
Abstract |
We report on an ongoing research project aimed at increasing the range of translation equivalents which can be automatically discovered by MT systems. The methodology is based on semi-supervised learning of indirect translation strategies from large comparable corpora and applying them at run time to generate novel, previously unseen translation equivalents. This approach is different from methods based on parallel resources, which can currently reuse only individual translation equivalents. Instead, it models translation strategies which generalise individual equivalents and can successfully generate an open class of new translation solutions. The task of the project is the integration of the developed technology into open-source MT systems. |
Language |
Language-independent |
Topics |
Machine Translation, SpeechToSpeech Translation, Multilinguality |
Full paper |
Generalising Lexical Translation Strategies for MT Using Comparable Corpora |
Slides |
Generalising Lexical Translation Strategies for MT Using Comparable Corpora |
Bibtex |
% LREC 2008 paper entry. Names are given as "Last, First" and joined with " and ".
% eventdate records the conference days (28-30 May 2008) in ISO 8601 form;
% classic BibTeX styles ignore this field, biblatex uses it.
@InProceedings{BABYCH08.340,
  author    = {Babych, Bogdan and Sharoff, Serge and Hartley, Anthony},
  title     = {Generalising Lexical Translation Strategies for {MT} Using Comparable Corpora},
  booktitle = {Proceedings of the Sixth International Conference on Language Resources and Evaluation ({LREC}'08)},
  editor    = {Calzolari, Nicoletta and Choukri, Khalid and Maegaard, Bente and Mariani, Joseph and Odijk, Jan and Piperidis, Stelios and Tapias, Daniel},
  year      = {2008},
  month     = may,
  eventdate = {2008-05-28/2008-05-30},
  address   = {Marrakech, Morocco},
  publisher = {European Language Resources Association (ELRA)},
  isbn      = {2-9517408-4-0},
  url       = {http://www.lrec-conf.org/proceedings/lrec2008/},
  language  = {english}
} |