Title |
Basque Speecon-like and Basque SpeechDAT MDB-600: Speech Databases for the Development of ASR Technology for Basque |
Authors |
Igor Odriozola, Inma Hernaez, María Inés Torres, Luis Javier Rodriguez-Fuentes, Mikel Penagarikano and Eva Navas |
Abstract |
This paper introduces two databases specifically designed for the development of ASR technology for the Basque language: the Basque Speecon-like database and the Basque SpeechDat MDB-600 database. The former was recorded in an office environment according to the Speecon specifications, whereas the later was recorded through mobile telephones according to the SpeechDat specifications. Both databases were created under an initiative that the Basque Government started in 2005, a program called ADITU, which aimed at developing speech technologies for Basque. The databases belong to the Basque Government. A comprehensive description of both databases is provided in this work, highlighting the differences with regard to their corresponding standard specifications. The paper also presents several initial experimental results for both databases with the purpose of validating their usefulness for the development of speech recognition technology. Several applications already developed with the Basque Speecon-like database are also described. Authors aim to make these databases widely known to the community as well, and foster their use by other groups. |
Topics |
Speech Resource/Database, Speech Recognition/Understanding |
Full paper |
Basque Speecon-like and Basque SpeechDAT MDB-600: Speech Databases for the Development of ASR Technology for Basque |
Bibtex |
@InProceedings{ODRIOZOLA14.744,
author = {Igor Odriozola and Inma Hernaez and María Inés Torres and Luis Javier Rodriguez-Fuentes and Mikel Penagarikano and Eva Navas}, title = {Basque Speecon-like and Basque SpeechDAT MDB-600: Speech Databases for the Development of ASR Technology for Basque}, booktitle = {Proceedings of the Ninth International Conference on Language Resources and Evaluation (LREC'14)}, year = {2014}, month = {may}, date = {26-31}, address = {Reykjavik, Iceland}, editor = {Nicoletta Calzolari (Conference Chair) and Khalid Choukri and Thierry Declerck and Hrafn Loftsson and Bente Maegaard and Joseph Mariani and Asuncion Moreno and Jan Odijk and Stelios Piperidis}, publisher = {European Language Resources Association (ELRA)}, isbn = {978-2-9517408-8-4}, language = {english} } |