Title |
Corpus-based Semantic Relatedness for the Construction of Polish WordNet |
Authors |
Bartosz Broda, Magdalena Derwojedowa, Maciej Piasecki and Stanislaw Szpakowicz |
Abstract |
The construction of a wordnet, a labour-intensive enterprise, can be significantly assisted by automatic grouping of lexical material and discovery of lexical semantic relations. The objective is to ensure high quality of automatically acquired results before they are presented for lexicographers' approval. We discuss a software tool that suggests synset members using a measure of semantic relatedness with a given verb or adjective; this extends previous work on nominal synsets in Polish WordNet. Syntactically-motivated constraints are deployed on a large morphologically annotated corpus of Polish. Evaluation has been performed via the WordNet-Based Similarity Test and additionally supported by human raters. A lexicographer also manually assessed a suitable sample of suggestions. The results compare favourably with other known methods of acquiring semantic relations. |
Language |
Single language |
Topics |
Lexicon, lexical database, LR national/international projects, organizational/policy issues, Statistical methods |
Full paper |
Corpus-based Semantic Relatedness for the Construction of Polish WordNet |
Slides |
Corpus-based Semantic Relatedness for the Construction of Polish WordNet |
Bibtex |
@comment{LREC 2008 paper entry. People in author/editor are separated by " and " and written "Last, First" so each name is parsed individually; the conference-chair role is recorded in annote rather than inside the editor list; the conference days are given as an ISO eventdate range.}
@InProceedings{BRODA08.459,
  author    = {Broda, Bartosz and Derwojedowa, Magdalena and Piasecki, Maciej and Szpakowicz, Stanislaw},
  title     = {Corpus-based Semantic Relatedness for the Construction of {Polish} {WordNet}},
  booktitle = {Proceedings of the Sixth International Conference on Language Resources and Evaluation (LREC'08)},
  year      = {2008},
  month     = may,
  eventdate = {2008-05-28/2008-05-30},
  address   = {Marrakech, Morocco},
  editor    = {Calzolari, Nicoletta and Choukri, Khalid and Maegaard, Bente and Mariani, Joseph and Odijk, Jan and Piperidis, Stelios and Tapias, Daniel},
  publisher = {European Language Resources Association (ELRA)},
  isbn      = {2-9517408-4-0},
  note      = {http://www.lrec-conf.org/proceedings/lrec2008/},
  annote    = {Nicoletta Calzolari was Conference Chair.},
  language  = {english}
} |