Title |
Creating Glossaries Using Pattern-Based and Machine Learning Techniques |
Authors |
Eline Westerhout and Paola Monachesi |
Abstract |
One of the aims of the Language Technology for eLearning project is to show that Natural Language Processing techniques can be employed to enhance the learning process. To this end, one of the functionalities that has been developed is a pattern-based glossary candidate detector which is capable of extracting definitions in eight languages. In order to improve the results obtained with the pattern-based approach, machine learning techniques are applied on the Dutch results to filter out incorrectly extracted definitions. In this paper, we discuss the machine learning techniques used and we present the results of the quantitative evaluation. We also discuss the integration of the tool into the Learning Management System ILIAS. |
Language |
Language-independent |
Topics |
Tools, systems, applications, Information Extraction, Information Retrieval, Lexicon, lexical database |
Full paper |
Creating Glossaries Using Pattern-Based and Machine Learning Techniques |
Slides |
- |
Bibtex |
@comment{LREC 2008 paper. Nicoletta Calzolari, listed first among the editors, was the Conference Chair; the conference days (28-30 May 2008) are stored in eventdate.}
@InProceedings{WESTERHOUT08.783,
  author    = {Westerhout, Eline and Monachesi, Paola},
  title     = {Creating Glossaries Using Pattern-Based and Machine Learning Techniques},
  booktitle = {Proceedings of the Sixth International Conference on Language Resources and Evaluation ({LREC}'08)},
  year      = {2008},
  month     = may,
  eventdate = {2008-05-28/2008-05-30},
  address   = {Marrakech, Morocco},
  editor    = {Calzolari, Nicoletta and Choukri, Khalid and Maegaard, Bente and Mariani, Joseph and Odijk, Jan and Piperidis, Stelios and Tapias, Daniel},
  publisher = {European Language Resources Association (ELRA)},
  isbn      = {2-9517408-4-0},
  url       = {http://www.lrec-conf.org/proceedings/lrec2008/},
  language  = {english}
} |