Title |
Semantic Clustering of Pivot Paraphrases |
Authors |
Marianna Apidianaki, Emilia Verzeni and Diana McCarthy |
Abstract |
Paraphrases extracted from parallel corpora by the pivot method (Bannard and Callison-Burch, 2005) constitute a valuable resource for multilingual NLP applications. In this study, we analyse the semantics of unigram pivot paraphrases and use a graph-based sense induction approach to unveil hidden sense distinctions in the paraphrase sets. The comparison of the acquired senses to gold data from the Lexical Substitution shared task (McCarthy and Navigli, 2007) demonstrates that sense distinctions exist in the paraphrase sets and highlights the need for a disambiguation step in applications using this resource. |
Topics |
Textual Entailment and Paraphrasing, Validation of LRs |
Full paper |
Semantic Clustering of Pivot Paraphrases |
Bibtex |
% LREC'14 conference paper. Nicoletta Calzolari, listed first among the
% editors, was the Conference Chair; the role is recorded here because a
% parenthetical inside the editor field is parsed as part of the name.
% The conference ran 26-31 May 2014, stored below as an ISO range in eventdate.
@inproceedings{APIDIANAKI14.475,
  author    = {Apidianaki, Marianna and Verzeni, Emilia and McCarthy, Diana},
  title     = {Semantic Clustering of Pivot Paraphrases},
  booktitle = {Proceedings of the Ninth International Conference on Language Resources and Evaluation ({LREC}'14)},
  year      = {2014},
  month     = may,
  eventdate = {2014-05-26/2014-05-31},
  address   = {Reykjavik, Iceland},
  editor    = {Calzolari, Nicoletta and Choukri, Khalid and Declerck, Thierry and Loftsson, Hrafn and Maegaard, Bente and Mariani, Joseph and Moreno, Asuncion and Odijk, Jan and Piperidis, Stelios},
  publisher = {European Language Resources Association (ELRA)},
  isbn      = {978-2-9517408-8-4},
  language  = {english},
} |