% Journal article entry. All fields live inside one brace pair that opens
% after the entry type and closes on the final line of the entry.
% NOTE(review): the doubled dot in the DOI is kept verbatim from the source
% record -- confirm against the publisher before changing it.
@article{ART002681557,
  author  = {Chung, Wonil and Bahng, Seunghee and Park, Myung Kwan},
  title   = {Classification of Literary Works(Novels) Using Text Mining},
  journal = {PHILOSOPHY·THOUGHT·CULTURE},
  issn    = {1975-1621},
  year    = {2021},
  number  = {35},
  pages   = {381--407},
  doi     = {10.33639/ptc.2021..35.016}
}
TY - JOUR
AU - Wonil Chung
AU - Bahng, Seunghee
AU - Park, Myung Kwan
TI - Classification of Literary Works(Novels) Using Text Mining
JO - PHILOSOPHY·THOUGHT·CULTURE
PY - 2021
VL - null
IS - 35
PB - Research Institute for East-West Thought
SP - 381
EP - 407
SN - 1975-1621
AB - This paper is to introduce quantitative text analysis of some literary works registered in the Project Gutenberg among Big Data and classification of the works using text mining techniques. After performing data preprocessing using the programming language R, we measured cosine similarity between chapters within a novel and cosine similarity between chapters of different novels to classify the novels. We found the cosine similarity between chapters within the novel is relatively high, but not between the novels. Furthermore, clustering analysis, which is an unsupervised machine learning task, showed strong cohesion of semantic distance, and classification analysis, which is a supervised machine learning task, showed high accuracy. In addition, we have confirmed that children's novels can be classified as easy-to-read works due to the large cosine similarity value and small semantic distance between chapters. Therefore, quantitative text analysis using text mining technique is expected to serve as a foundation for performing qualitative text analysis.
KW - text mining;classification;clustering;cosine similarity;children’s novel
DO - 10.33639/ptc.2021..35.016
ER -
Wonil Chung, Bahng, Seunghee and Park, Myung Kwan. (2021). Classification of Literary Works(Novels) Using Text Mining. PHILOSOPHY·THOUGHT·CULTURE, 35, 381-407.
Wonil Chung, Bahng, Seunghee and Park, Myung Kwan. 2021, "Classification of Literary Works(Novels) Using Text Mining", PHILOSOPHY·THOUGHT·CULTURE, no.35, pp.381-407. Available from: doi:10.33639/ptc.2021..35.016
Wonil Chung, Bahng, Seunghee, Park, Myung Kwan "Classification of Literary Works(Novels) Using Text Mining" PHILOSOPHY·THOUGHT·CULTURE 35 pp.381-407 (2021) : 381.
Wonil Chung, Bahng, Seunghee, Park, Myung Kwan. Classification of Literary Works(Novels) Using Text Mining. PHILOSOPHY·THOUGHT·CULTURE. 2021; 35 : 381-407. Available from: doi:10.33639/ptc.2021..35.016
Wonil Chung, Bahng, Seunghee and Park, Myung Kwan. "Classification of Literary Works(Novels) Using Text Mining" PHILOSOPHY·THOUGHT·CULTURE no.35(2021) : 381-407. doi: 10.33639/ptc.2021..35.016
Wonil Chung; Bahng, Seunghee; Park, Myung Kwan. Classification of Literary Works(Novels) Using Text Mining. PHILOSOPHY·THOUGHT·CULTURE, 35, 381-407. doi: 10.33639/ptc.2021..35.016
Wonil Chung; Bahng, Seunghee; Park, Myung Kwan. Classification of Literary Works(Novels) Using Text Mining. PHILOSOPHY·THOUGHT·CULTURE. 2021; 35 381-407. doi: 10.33639/ptc.2021..35.016
Wonil Chung, Bahng, Seunghee, Park, Myung Kwan. Classification of Literary Works(Novels) Using Text Mining. PHILOSOPHY·THOUGHT·CULTURE. 2021; 35 : 381-407. Available from: doi:10.33639/ptc.2021..35.016
Wonil Chung, Bahng, Seunghee and Park, Myung Kwan. "Classification of Literary Works(Novels) Using Text Mining" PHILOSOPHY·THOUGHT·CULTURE no.35(2021) : 381-407. doi: 10.33639/ptc.2021..35.016