% Journal article: impact of speech data quality on speech recognition models.
% All fields live inside the entry braces; authors use the "Last, First" form
% and the page range uses the "--" range separator.
@article{ART003048087,
  author  = {Kim, Yeong-Jin and Cha, Hyun-Jong and Kang, Ah Reum},
  title   = {A Study on the Impact of Speech Data Quality on Speech Recognition Models},
  journal = {Journal of The Korea Society of Computer and Information},
  issn    = {1598-849X},
  year    = {2024},
  volume  = {29},
  number  = {1},
  pages   = {41--49},
  doi     = {10.9708/jksci.2024.29.01.041},
}
TY - JOUR
AU - Yeong-Jin Kim
AU - Hyun-Jong Cha
AU - Ah Reum Kang
TI - A Study on the Impact of Speech Data Quality on Speech Recognition Models
JO - Journal of The Korea Society of Computer and Information
PY - 2024
VL - 29
IS - 1
PB - The Korean Society Of Computer And Information
SP - 41
EP - 49
SN - 1598-849X
AB - Speech recognition technology is continuously advancing and widely used in various fields. In this study, we aimed to investigate the impact of speech data quality on speech recognition models by dividing the dataset into the entire dataset and the top 70% based on Signal-to-Noise Ratio (SNR). Utilizing Seamless M4T and Google Cloud Speech-to-Text, we examined the text transformation results for each model and evaluated them using the Levenshtein Distance. Experimental results revealed that Seamless M4T scored 13.6 in models using data with high SNR, which is lower than the score of 16.6 for the entire dataset. However, Google Cloud Speech-to-Text scored 8.3 on the entire dataset, indicating lower performance than data with high SNR. This suggests that using data with high SNR during the training of a new speech recognition model can have an impact, and Levenshtein Distance can serve as a metric for evaluating speech recognition models.
KW - Speech Recognition
KW - Signal-to-Noise-Ratio(SNR)
KW - Levenshtein Distance Algorithm
KW - Meta Seamless M4T
KW - Google Cloud Speech-to-Text
DO - 10.9708/jksci.2024.29.01.041
ER -
Yeong-Jin Kim, Hyun-Jong Cha and Ah Reum Kang. (2024). A Study on the Impact of Speech Data Quality on Speech Recognition Models. Journal of The Korea Society of Computer and Information, 29(1), 41-49.
Yeong-Jin Kim, Hyun-Jong Cha and Ah Reum Kang. 2024, "A Study on the Impact of Speech Data Quality on Speech Recognition Models", Journal of The Korea Society of Computer and Information, vol.29, no.1, pp.41-49. Available from: doi:10.9708/jksci.2024.29.01.041
Yeong-Jin Kim, Hyun-Jong Cha, Ah Reum Kang. "A Study on the Impact of Speech Data Quality on Speech Recognition Models." Journal of The Korea Society of Computer and Information 29.1 (2024): 41-49.
Yeong-Jin Kim, Hyun-Jong Cha, Ah Reum Kang. A Study on the Impact of Speech Data Quality on Speech Recognition Models. Journal of The Korea Society of Computer and Information. 2024; 29(1), 41-49. Available from: doi:10.9708/jksci.2024.29.01.041
Yeong-Jin Kim, Hyun-Jong Cha and Ah Reum Kang. "A Study on the Impact of Speech Data Quality on Speech Recognition Models" Journal of The Korea Society of Computer and Information 29, no.1 (2024) : 41-49. doi: 10.9708/jksci.2024.29.01.041
Yeong-Jin Kim; Hyun-Jong Cha; Ah Reum Kang. A Study on the Impact of Speech Data Quality on Speech Recognition Models. Journal of The Korea Society of Computer and Information, 2024, 29(1), 41-49. doi: 10.9708/jksci.2024.29.01.041
Yeong-Jin Kim; Hyun-Jong Cha; Ah Reum Kang. A Study on the Impact of Speech Data Quality on Speech Recognition Models. Journal of The Korea Society of Computer and Information. 2024; 29(1), 41-49. doi: 10.9708/jksci.2024.29.01.041
Yeong-Jin Kim, Hyun-Jong Cha, Ah Reum Kang. A Study on the Impact of Speech Data Quality on Speech Recognition Models. Journal of The Korea Society of Computer and Information. 2024; 29(1), 41-49. Available from: doi:10.9708/jksci.2024.29.01.041
Yeong-Jin Kim, Hyun-Jong Cha and Ah Reum Kang. "A Study on the Impact of Speech Data Quality on Speech Recognition Models" Journal of The Korea Society of Computer and Information 29, no.1 (2024) : 41-49. doi: 10.9708/jksci.2024.29.01.041