% Journal article entry; cite it with the key ART002998490.
% Authors use the "Family, Given" form joined by " and " so name parsing is unambiguous.
% {3D} is braced so sentence-casing styles keep its capitalisation.
@article{ART002998490,
  author  = {Park, JeongHyeon and Go, JunHyeok and Kim, SiUng and Moon, Nammee},
  title   = {Classification of Infant Crying Audio based on {3D} Feature-Vector through Audio Data Augmentation},
  journal = {Journal of The Korea Society of Computer and Information},
  issn    = {1598-849X},
  year    = {2023},
  volume  = {28},
  number  = {9},
  pages   = {47--54},
  doi     = {10.9708/jksci.2023.28.09.047},
}
TY - JOUR
AU - JeongHyeon Park
AU - JunHyeok Go
AU - SiUng Kim
AU - Nammee Moon
TI - Classification of Infant Crying Audio based on 3D Feature-Vector through Audio Data Augmentation
JO - Journal of The Korea Society of Computer and Information
PY - 2023
VL - 28
IS - 9
PB - The Korean Society Of Computer And Information
SP - 47
EP - 54
SN - 1598-849X
AB - Infants utilize crying as a non-verbal means of communication [1]. However, deciphering infant cries presents challenges. Extensive research has been conducted to interpret infant cry audios [2,3]. This paper proposes the classification of infant cries using 3D feature vectors augmented with various audio data techniques. A total of 5 classes (belly pain, burping, discomfort, hungry, tired) are employed in the study dataset. The data is augmented using 5 techniques (Pitch, Tempo, Shift, Mixup-noise, CutMix). Tempo, Shift, and CutMix augmentation techniques demonstrated improved performance.
Ultimately, applying effective data augmentation techniques simultaneously resulted in a 17.75% performance enhancement compared to models using single feature vectors and original data.
KW - 3D Feature Vector;Data Augmentation;Infant;MFCC;Nonverbal sound
DO - 10.9708/jksci.2023.28.09.047
ER -
JeongHyeon Park, JunHyeok Go, SiUng Kim and Nammee Moon. (2023). Classification of Infant Crying Audio based on 3D Feature-Vector through Audio Data Augmentation. Journal of The Korea Society of Computer and Information, 28(9), 47-54.
JeongHyeon Park, JunHyeok Go, SiUng Kim and Nammee Moon. 2023, "Classification of Infant Crying Audio based on 3D Feature-Vector through Audio Data Augmentation", Journal of The Korea Society of Computer and Information, vol.28, no.9, pp.47-54. Available from: doi:10.9708/jksci.2023.28.09.047
JeongHyeon Park, JunHyeok Go, SiUng Kim, Nammee Moon "Classification of Infant Crying Audio based on 3D Feature-Vector through Audio Data Augmentation" Journal of The Korea Society of Computer and Information 28.9 (2023): 47-54.
JeongHyeon Park, JunHyeok Go, SiUng Kim, Nammee Moon. Classification of Infant Crying Audio based on 3D Feature-Vector through Audio Data Augmentation. Journal of The Korea Society of Computer and Information. 2023; 28(9), 47-54. Available from: doi:10.9708/jksci.2023.28.09.047
JeongHyeon Park, JunHyeok Go, SiUng Kim and Nammee Moon. "Classification of Infant Crying Audio based on 3D Feature-Vector through Audio Data Augmentation" Journal of The Korea Society of Computer and Information 28, no.9 (2023) : 47-54. doi: 10.9708/jksci.2023.28.09.047
JeongHyeon Park; JunHyeok Go; SiUng Kim; Nammee Moon. Classification of Infant Crying Audio based on 3D Feature-Vector through Audio Data Augmentation. Journal of The Korea Society of Computer and Information, 2023, 28(9), 47-54. doi: 10.9708/jksci.2023.28.09.047
JeongHyeon Park; JunHyeok Go; SiUng Kim; Nammee Moon. Classification of Infant Crying Audio based on 3D Feature-Vector through Audio Data Augmentation. Journal of The Korea Society of Computer and Information. 2023; 28(9) 47-54. doi: 10.9708/jksci.2023.28.09.047
JeongHyeon Park, JunHyeok Go, SiUng Kim, Nammee Moon. Classification of Infant Crying Audio based on 3D Feature-Vector through Audio Data Augmentation. Journal of The Korea Society of Computer and Information. 2023; 28(9), 47-54. Available from: doi:10.9708/jksci.2023.28.09.047
JeongHyeon Park, JunHyeok Go, SiUng Kim and Nammee Moon. "Classification of Infant Crying Audio based on 3D Feature-Vector through Audio Data Augmentation" Journal of The Korea Society of Computer and Information 28, no.9 (2023) : 47-54. doi: 10.9708/jksci.2023.28.09.047