Title |
A Multi-Word Term Extraction Program for Arabic Language |
Authors |
Siham Boulaknadel, Beatrice Daille and Driss Aboutajdine |
Abstract |
Terminology extraction commonly includes two steps: identification of term-like units in the texts, mostly multi-word phrases, and the ranking of the extracted term-like units according to their domain representativity. In this paper, we design a multi-word term extraction program for the Arabic language. The linguistic filtering performs a morphosyntactic analysis and takes into account several types of variations. The domain representativity is measured using statistical scores. We evaluate several association measures and show that the results we obtained are consistent with those obtained for Romance languages. |
Language |
Single language |
Topics |
Information Extraction, Information Retrieval, MultiWord Expressions & Collocations |
Full paper |
A Multi-Word Term Extraction Program for Arabic Language |
Slides |
A Multi-Word Term Extraction Program for Arabic Language |
Bibtex |
@inproceedings{BOULAKNADEL08.378,
  author        = {Boulaknadel, Siham and Daille, Beatrice and Aboutajdine, Driss},
  title         = {A Multi-Word Term Extraction Program for {Arabic} Language},
  booktitle     = {Proceedings of the Sixth International Conference on Language Resources and Evaluation ({LREC}'08)},
  editor        = {Calzolari, Nicoletta and Choukri, Khalid and Maegaard, Bente and Mariani, Joseph and Odijk, Jan and Piperidis, Stelios and Tapias, Daniel},
  publisher     = {European Language Resources Association (ELRA)},
  address       = {Marrakech, Morocco},
  year          = {2008},
  month         = may,
  eventdate     = {2008-05-28/2008-05-30},
  isbn          = {2-9517408-4-0},
  url           = {http://www.lrec-conf.org/proceedings/lrec2008/},
  language      = {english},
  internal-note = {Conference Chair: Nicoletta Calzolari. The role is recorded here, in a field styles ignore, because the editor field must contain only names.},
} |