% Conference paper by Pollak and Borsky (ICETE 2011, published 2012) on speech
% recognition accuracy for MP3-compressed data.
% The acronym MP3 is brace-protected in the title so that sentence-casing
% bibliography styles do not lowercase it. Names use the unambiguous
% "Last, First" form throughout.
@inproceedings{1dc371c519904346bdc8a25557a5f390,
  author    = {Pollak, Petr and Borsky, Michal},
  title     = {Small and large vocabulary speech recognition of {MP3} data under real-word conditions: Experimental study},
  editor    = {Sevillano, Jose L. and Filipe, Joaquim},
  booktitle = {E-Business and Telecommunications},
  series    = {Communications in Computer and Information Science},
  pages     = {409--419},
  year      = {2012},
  doi       = {10.1007/978-3-642-35755-8_29},
  isbn      = {9783642357541},
  language  = {English},
  keywords  = {Large vocabulary, LVCSR, MP3, MPEG compression, Noise robustness, Small vocabulary, Speech recognition},
  abstract  = {This paper presents the study of speech recognition accuracy both for small and large vocabulary task with respect to different levels of MP3 compression of processed data. The motivation behind the work was to evaluate the usage of ASR system for off-line automatic transcription of recordings collected from standard present MP3 devices under different levels of background noise and channel distortion. Although MP3 may not be an optimal compression algorithm, the performed experiments have proved that it does not distort speech signal significantly for higher compression rates. Realized experiments showed also that the accuracy of speech recognition (both small- and large-vocabulary) decreased very slowly for the bit-rate of 24 kbps and higher. However, slightly different setup of speech feature computation is necessary for MP3 speech data, mainly PLP features give significantly better results in comparison to MFCC.},
  note      = {8th International Joint Conference on e-Business and Telecommunications, ICETE 2011 ; Conference date: 18-07-2011 Through 21-07-2011},
}