Title |
SwissAdmin: a Multilingual Tagged Parallel Corpus of Press Releases |
Authors |
Yves Scherrer, Luka Nerima, Lorenza Russo, Maria Ivanova and Eric Wehrli |
Abstract |
SwissAdmin is a new multilingual corpus of press releases from the Swiss Federal Administration, available in German, French, Italian and English. We provide SwissAdmin in three versions: (i) plain texts of approximately 6 to 8 million words per language; (ii) sentence-aligned bilingual texts for each language pair; (iii) a part-of-speech-tagged version consisting of annotations in both the Universal tagset and the richer Fips tagset, along with grammatical functions, verb valencies and collocations. The SwissAdmin corpus is freely available at www.latl.unige.ch/swissadmin. |
Topics |
Part-of-Speech Tagging, MultiWord Expressions & Collocations |
Full paper |
SwissAdmin: a Multilingual Tagged Parallel Corpus of Press Releases |
Bibtex |
% SwissAdmin corpus paper, LREC'14 proceedings entry.
% The conference days (26-31 May 2014) are recorded in eventdate as an ISO 8601 range;
% the Conference Chair role is kept in internal-note so it cannot corrupt editor name parsing.
@InProceedings{SCHERRER14.772,
  author        = {Scherrer, Yves and Nerima, Luka and Russo, Lorenza and Ivanova, Maria and Wehrli, Eric},
  title         = {{SwissAdmin}: a Multilingual Tagged Parallel Corpus of Press Releases},
  booktitle     = {Proceedings of the Ninth International Conference on Language Resources and Evaluation ({LREC}'14)},
  year          = {2014},
  month         = may,
  eventdate     = {2014-05-26/2014-05-31},
  address       = {Reykjavik, Iceland},
  editor        = {Calzolari, Nicoletta and Choukri, Khalid and Declerck, Thierry and Loftsson, Hrafn and Maegaard, Bente and Mariani, Joseph and Moreno, Asuncion and Odijk, Jan and Piperidis, Stelios},
  publisher     = {European Language Resources Association (ELRA)},
  isbn          = {978-2-9517408-8-4},
  language      = {english},
  internal-note = {Nicoletta Calzolari is listed as Conference Chair},
} |