@comment{Journal article: Hyeon Gyu Kim (2020), keyword extraction from social big data based on cohesion scoring.}
@article{ART002639423,
  author  = {Kim, Hyeon Gyu},
  title   = {Efficient Keyword Extraction from Social Big Data Based on Cohesion Scoring},
  journal = {Journal of The Korea Society of Computer and Information},
  issn    = {1598-849X},
  year    = {2020},
  volume  = {25},
  number  = {10},
  pages   = {87--94},
  doi     = {10.9708/jksci.2020.25.10.087},
}
TY  - JOUR
AU  - Hyeon Gyu Kim
TI  - Efficient Keyword Extraction from Social Big Data Based on Cohesion Scoring
JO  - Journal of The Korea Society of Computer and Information
PY  - 2020
VL  - 25
IS  - 10
PB  - The Korean Society Of Computer And Information
SP  - 87
EP  - 94
SN  - 1598-849X
AB  - Social reviews such as SNS feeds and blog articles have been widely used to extract keywords reflecting opinions and complaints from users’ perspective, and often include proper nouns or new words reflecting recent trends. In general, these words are not included in a dictionary, so conventional morphological analyzers may not detect and extract those words from the reviews properly. In addition, due to their high processing time, it is inadequate to provide analysis results in a timely manner. This paper presents a method for efficient keyword extraction from social reviews based on the notion of cohesion scoring. Cohesion scores can be calculated based on word frequencies, so keyword extraction can be performed without a dictionary when using it. On the other hand, their accuracy can be degraded when input data with poor spacing is given. Regarding this, an algorithm is presented which improves the existing cohesion scoring mechanism using the structure of a word tree. Our experiment results show that it took only 0.008 seconds to extract keywords from 1,000 reviews in the proposed method while resulting in 15.5% error ratio which is better than the existing morphological analyzers.
KW  - Big data
KW  - Social reviews
KW  - Keyword extraction
KW  - Cohesion score
KW  - Morphological analysis
DO  - 10.9708/jksci.2020.25.10.087
ER  - 
Hyeon Gyu Kim. (2020). Efficient Keyword Extraction from Social Big Data Based on Cohesion Scoring. Journal of The Korea Society of Computer and Information, 25(10), 87-94.
Hyeon Gyu Kim. 2020, "Efficient Keyword Extraction from Social Big Data Based on Cohesion Scoring", Journal of The Korea Society of Computer and Information, vol.25, no.10, pp.87-94. Available from: doi:10.9708/jksci.2020.25.10.087
Hyeon Gyu Kim "Efficient Keyword Extraction from Social Big Data Based on Cohesion Scoring" Journal of The Korea Society of Computer and Information 25.10 pp.87-94 (2020) : 87.
Hyeon Gyu Kim. Efficient Keyword Extraction from Social Big Data Based on Cohesion Scoring. 2020; 25(10), 87-94. Available from: doi:10.9708/jksci.2020.25.10.087
Hyeon Gyu Kim. "Efficient Keyword Extraction from Social Big Data Based on Cohesion Scoring" Journal of The Korea Society of Computer and Information 25, no.10 (2020) : 87-94. doi: 10.9708/jksci.2020.25.10.087
Hyeon Gyu Kim. Efficient Keyword Extraction from Social Big Data Based on Cohesion Scoring. Journal of The Korea Society of Computer and Information, 25(10), 87-94. doi: 10.9708/jksci.2020.25.10.087
Hyeon Gyu Kim. Efficient Keyword Extraction from Social Big Data Based on Cohesion Scoring. Journal of The Korea Society of Computer and Information. 2020; 25(10) 87-94. doi: 10.9708/jksci.2020.25.10.087
Hyeon Gyu Kim. Efficient Keyword Extraction from Social Big Data Based on Cohesion Scoring. 2020; 25(10), 87-94. Available from: doi:10.9708/jksci.2020.25.10.087
Hyeon Gyu Kim. "Efficient Keyword Extraction from Social Big Data Based on Cohesion Scoring" Journal of The Korea Society of Computer and Information 25, no.10 (2020) : 87-94. doi: 10.9708/jksci.2020.25.10.087