@article{ART003258707,
author={Lee, Won Jun and Jung, Woo Jin and Cha, Hyun-Jong and Kang, Ah Reum},
title={Robust Audio Spectrogram Transformer for Sound Source Localization in Noisy Environments},
journal={Journal of The Korea Society of Computer and Information},
issn={1598-849X},
year={2025},
volume={30},
number={10},
pages={33--42}
}
TY - JOUR
AU - Won Jun Lee
AU - Woo Jin Jung
AU - Hyun-Jong Cha
AU - Ah Reum Kang
TI - Robust Audio Spectrogram Transformer for Sound Source Localization in Noisy Environments
JO - Journal of The Korea Society of Computer and Information
PY - 2025
VL - 30
IS - 10
PB - The Korean Society Of Computer And Information
SP - 33
EP - 42
SN - 1598-849X
AB - Conventional sound source localization methods suffer from significant accuracy degradation in low SNR (Signal-to-Noise Ratio) environments. In this paper, we propose a sound source localization model based on an audio spectrogram transformer, which takes GCC (Generalized Cross Correlation) features extracted from multichannel audio signals as input. The proposed model was evaluated under various indoor environments and SNR conditions, and its performance was compared with conventional GCC-PHAT (Generalized Cross Correlation – Phase Transform) and MUSIC (MUltiple SIgnal Classification) algorithms. Experimental results show that the proposed model achieves superior performance, with a mean angular error of 10.0163°, a mean distance error of 0.1626, and a RMSE (Root Mean Square Error) of 0.89 in a 5 m × 5 m × 5 m environment, even at 0 dB SNR. Additionally, the model demonstrates robust performance under changes in room size and noise conditions. This study demonstrates that transformer-based models can be effectively applied to achieve reliable sound source localization in noisy environments.
KW - Sound Source Localization;Direction of Arrival;Signal-to-Noise Ratio;Audio Spectrogram Transformer;Image Source Method
DO -
UR -
ER -
Won Jun Lee, Woo Jin Jung, Hyun-Jong Cha and Ah Reum Kang. (2025). Robust Audio Spectrogram Transformer for Sound Source Localization in Noisy Environments. Journal of The Korea Society of Computer and Information, 30(10), 33-42.
Won Jun Lee, Woo Jin Jung, Hyun-Jong Cha and Ah Reum Kang. 2025, "Robust Audio Spectrogram Transformer for Sound Source Localization in Noisy Environments", Journal of The Korea Society of Computer and Information, vol.30, no.10, pp.33-42.
Won Jun Lee, Woo Jin Jung, Hyun-Jong Cha, Ah Reum Kang "Robust Audio Spectrogram Transformer for Sound Source Localization in Noisy Environments" Journal of The Korea Society of Computer and Information 30.10 pp.33-42 (2025) : 33.
Won Jun Lee, Woo Jin Jung, Hyun-Jong Cha, Ah Reum Kang. Robust Audio Spectrogram Transformer for Sound Source Localization in Noisy Environments. 2025; 30(10), 33-42.
Won Jun Lee, Woo Jin Jung, Hyun-Jong Cha and Ah Reum Kang. "Robust Audio Spectrogram Transformer for Sound Source Localization in Noisy Environments" Journal of The Korea Society of Computer and Information 30, no.10 (2025) : 33-42.
Won Jun Lee; Woo Jin Jung; Hyun-Jong Cha; Ah Reum Kang. Robust Audio Spectrogram Transformer for Sound Source Localization in Noisy Environments. Journal of The Korea Society of Computer and Information, 30(10), 33-42.
Won Jun Lee; Woo Jin Jung; Hyun-Jong Cha; Ah Reum Kang. Robust Audio Spectrogram Transformer for Sound Source Localization in Noisy Environments. Journal of The Korea Society of Computer and Information. 2025; 30(10) 33-42.
Won Jun Lee, Woo Jin Jung, Hyun-Jong Cha, Ah Reum Kang. Robust Audio Spectrogram Transformer for Sound Source Localization in Noisy Environments. 2025; 30(10), 33-42.
Won Jun Lee, Woo Jin Jung, Hyun-Jong Cha and Ah Reum Kang. "Robust Audio Spectrogram Transformer for Sound Source Localization in Noisy Environments" Journal of The Korea Society of Computer and Information 30, no.10 (2025) : 33-42.