Title |
A Comparison of Various Methods for Concept Tagging for Spoken Language Understanding |
Authors |
Stefan Hahn, Patrick Lehnen, Christian Raymond and Hermann Ney |
Abstract |
The extraction of flat concepts out of a given word sequence is usually one of the first steps in building a spoken language understanding (SLU) or dialogue system. This paper explores five different modelling approaches for this task and presents results on a French state-of-the-art corpus, MEDIA. Additionally, two log-linear modelling approaches could be further improved by adding morphologic knowledge. This paper goes beyond what has been reported in the literature. We applied the models on the same training and testing data and used the NIST scoring toolkit to evaluate the experimental results to ensure identical conditions for each of the experiments and the comparability of the results. Using a model based on conditional random fields, we achieve a concept error rate of 11.8% on the MEDIA evaluation corpus. |
Language |
Single language |
Topics |
Speech recognition and understanding, Tagging, Dialogue & Natural Interactivity |
Full paper |
A Comparison of Various Methods for Concept Tagging for Spoken Language Understanding |
Slides |
- |
Bibtex |
@InProceedings{HAHN08.749,
author = {Stefan Hahn, Patrick Lehnen, Christian Raymond and Hermann Ney},
title = {A Comparison of Various Methods for Concept Tagging for Spoken Language Understanding},
booktitle = {Proceedings of the Sixth International Conference on Language Resources and Evaluation (LREC'08)},
year = {2008},
month = {may},
date = {28-30},
address = {Marrakech, Morocco},
editor = {Nicoletta Calzolari (Conference Chair), Khalid Choukri, Bente Maegaard, Joseph Mariani, Jan Odijk, Stelios Piperidis, Daniel Tapias},
publisher = {European Language Resources Association (ELRA)},
isbn = {2-9517408-4-0},
note = {http://www.lrec-conf.org/proceedings/lrec2008/},
language = {english}
} |