% Journal article record (JKSCI vol. 28, no. 6, 2023). The key is kept as exported.
@article{ART002970012,
  author  = {Kim, Hyeon Gyu},
  title   = {Efficient Filtering of Noise Reviews Using Supervised Learning in Social Big Data Analysis},
  journal = {Journal of The Korea Society of Computer and Information},
  volume  = {28},
  number  = {6},
  pages   = {63--69},
  year    = {2023},
  issn    = {1598-849X},
  doi     = {10.9708/jksci.2023.28.06.063},
}
TY - JOUR
AU - Hyeon Gyu Kim
TI - Efficient Filtering of Noise Reviews Using Supervised Learning in Social Big Data Analysis
JO - Journal of The Korea Society of Computer and Information
PY - 2023
VL - 28
IS - 6
PB - The Korean Society Of Computer And Information
SP - 63
EP - 69
SN - 1598-849X
AB - Social reviews collected through the search API may include a large number of reviews unrelated to a given search term, and these reviews are referred to as noise reviews because they may lead to distorted analysis results. In this paper, we discuss supervised learning algorithms to conduct filtering of the noise reviews efficiently, and compare their performance through experiments. About 20,000 reviews collected for tourist attractions in the Ulsan metropolitan city were used for the experiments, and LSTM and BERT, which are known to provide high accuracy in text processing, were adopted for training and testing the reviews. As a result, BERT provided better accuracy than LSTM, where f1-scores of the two algorithms were 90.1% and 95.2%, respectively. On the other hand, in terms of execution time, LSTM was about 5 times faster than BERT. The result shows that, in the noise review filtering, BERT can be used more properly when accuracy is important, whereas LSTM can be used more properly when performance is important or computation resources are insufficient.
KW - Social big data;Noise review filtering;Supervised learning;LSTM;BERT
DO - 10.9708/jksci.2023.28.06.063
ER -
Hyeon Gyu Kim. (2023). Efficient Filtering of Noise Reviews Using Supervised Learning in Social Big Data Analysis. Journal of The Korea Society of Computer and Information, 28(6), 63-69.
Hyeon Gyu Kim. 2023, "Efficient Filtering of Noise Reviews Using Supervised Learning in Social Big Data Analysis", Journal of The Korea Society of Computer and Information, vol.28, no.6 pp.63-69. Available from: doi:10.9708/jksci.2023.28.06.063
Hyeon Gyu Kim "Efficient Filtering of Noise Reviews Using Supervised Learning in Social Big Data Analysis" Journal of The Korea Society of Computer and Information 28.6 pp.63-69 (2023) : 63.
Hyeon Gyu Kim. Efficient Filtering of Noise Reviews Using Supervised Learning in Social Big Data Analysis. 2023; 28(6), 63-69. Available from: doi:10.9708/jksci.2023.28.06.063
Hyeon Gyu Kim. "Efficient Filtering of Noise Reviews Using Supervised Learning in Social Big Data Analysis" Journal of The Korea Society of Computer and Information 28, no.6 (2023) : 63-69. doi: 10.9708/jksci.2023.28.06.063
Hyeon Gyu Kim. Efficient Filtering of Noise Reviews Using Supervised Learning in Social Big Data Analysis. Journal of The Korea Society of Computer and Information, 28(6), 63-69. doi: 10.9708/jksci.2023.28.06.063
Hyeon Gyu Kim. Efficient Filtering of Noise Reviews Using Supervised Learning in Social Big Data Analysis. Journal of The Korea Society of Computer and Information. 2023; 28(6) 63-69. doi: 10.9708/jksci.2023.28.06.063
Hyeon Gyu Kim. Efficient Filtering of Noise Reviews Using Supervised Learning in Social Big Data Analysis. 2023; 28(6), 63-69. Available from: doi:10.9708/jksci.2023.28.06.063
Hyeon Gyu Kim. "Efficient Filtering of Noise Reviews Using Supervised Learning in Social Big Data Analysis" Journal of The Korea Society of Computer and Information 28, no.6 (2023) : 63-69. doi: 10.9708/jksci.2023.28.06.063