Title |
Leveraging study of robustness and portability of spoken language understanding systems across languages and domains: the PORTMEDIA corpora |
Authors |
Fabrice Lefèvre, Djamel Mostefa, Laurent Besacier, Yannick Estève, Matthieu Quignard, Nathalie Camelin, Benoit Favre, Bassam Jabaian and Lina M. Rojas-Barahona |
Abstract |
The PORTMEDIA project is intended to develop new corpora for the evaluation of spoken language understanding systems. The newly collected data are in the field of human-machine dialogue systems for tourist information in French in line with the MEDIA corpus. Transcriptions and semantic annotations, obtained by low-cost procedures, are provided to allow a thorough evaluation of the systems' capabilities in terms of robustness and portability across languages and domains. A new test set with some adaptation data is prepared for each case: in Italian as an example of a new language, for ticket reservation as an example of a new domain. Finally, the work is complemented by the proposition of a new high-level semantic annotation scheme well-suited to dialogue data. |
Topics |
Speech Recognition/Understanding, Dialogue, Speech resource/database |
Full paper |
Leveraging study of robustness and portability of spoken language understanding systems across languages and domains: the PORTMEDIA corpora |
Bibtex |
% LREC 2012 conference paper describing the PORTMEDIA corpora.
% The first listed editor, Nicoletta Calzolari, was the Conference Chair; that
% role is recorded here rather than inside the editor field, where it would be
% parsed as part of her name.
% Accented letters use LaTeX escapes so the entry sorts correctly under classic
% BibTeX as well as Biber.
@InProceedings{LEFVRE12.751,
  author    = {Lef{\`e}vre, Fabrice and Mostefa, Djamel and Besacier, Laurent and Est{\`e}ve, Yannick and Quignard, Matthieu and Camelin, Nathalie and Favre, Benoit and Jabaian, Bassam and Rojas-Barahona, Lina M.},
  title     = {Leveraging study of robustness and portability of spoken language understanding systems across languages and domains: the {PORTMEDIA} corpora},
  booktitle = {Proceedings of the Eighth International Conference on Language Resources and Evaluation ({LREC}'12)},
  editor    = {Calzolari, Nicoletta and Choukri, Khalid and Declerck, Thierry and Do{\u{g}}an, Mehmet U{\u{g}}ur and Maegaard, Bente and Mariani, Joseph and Moreno, Asuncion and Odijk, Jan and Piperidis, Stelios},
  publisher = {European Language Resources Association (ELRA)},
  address   = {Istanbul, Turkey},
  year      = {2012},
  month     = may,
  eventdate = {2012-05-23/2012-05-25},
  isbn      = {978-2-9517408-7-7},
  language  = {english},
} |