% Journal article (2020): book categorization with kNN classifiers and table-of-contents text.
% Author is stored in "Family, Given" form; page range uses the BibTeX "--" convention.
@article{ART002573933,
  author  = {Lee, Yong-Gu},
  title   = {A Study on Book Categorization in Social Sciences Using {kNN} Classifiers and Table of Contents Text},
  journal = {Journal of the Korean Society for Information Management},
  issn    = {1013-0799},
  year    = {2020},
  volume  = {37},
  number  = {1},
  pages   = {1--21},
  doi     = {10.3743/KOSIM.2020.37.1.001},
}
TY - JOUR
AU - Lee, Yong-Gu
TI - A Study on Book Categorization in Social Sciences Using kNN Classifiers and Table of Contents Text
JO - Journal of the Korean Society for Information Management
PY - 2020
VL - 37
IS - 1
PB - 한국정보관리학회
SP - 1
EP - 21
SN - 1013-0799
AB - This study applied automatic classification using table of contents (TOC) text for 6,253 social science books from a newly arrived list collected by a university library. The k-nearest neighbors (kNN) algorithm was used as a classifier, and the ten divisions on the second level of the DDC’s main class 300 given to books by the library were used as classes (labels). The features used in this study were keywords extracted from titles and TOCs of the books. The TOCs were obtained through the OpenAPI from an Internet bookstore. As a result, it was found that the TOC features were good for improving both classification recall and precision. The TOC was shown to reduce the overfitting problem of imbalanced data with its rich features. Law and education have high topic specificity in the field of social sciences, so title features alone can bring good classification performance in these fields.
KW - Table of contents
KW - kNN classifier
KW - book categorization
KW - DDC (Dewey Decimal Classification)
DO - 10.3743/KOSIM.2020.37.1.001
ER -
Lee, Yong-Gu. (2020). A Study on Book Categorization in Social Sciences Using kNN Classifiers and Table of Contents Text. Journal of the Korean Society for Information Management, 37(1), 1-21.
Lee, Yong-Gu. 2020, "A Study on Book Categorization in Social Sciences Using kNN Classifiers and Table of Contents Text", Journal of the Korean Society for Information Management, vol.37, no.1, pp.1-21. Available from: doi:10.3743/KOSIM.2020.37.1.001
Lee, Yong-Gu. "A Study on Book Categorization in Social Sciences Using kNN Classifiers and Table of Contents Text" Journal of the Korean Society for Information Management 37.1 pp.1-21 (2020) : 1.
Lee, Yong-Gu. A Study on Book Categorization in Social Sciences Using kNN Classifiers and Table of Contents Text. Journal of the Korean Society for Information Management. 2020; 37(1), 1-21. Available from: doi:10.3743/KOSIM.2020.37.1.001
Lee, Yong-Gu. "A Study on Book Categorization in Social Sciences Using kNN Classifiers and Table of Contents Text" Journal of the Korean Society for Information Management 37, no.1 (2020) : 1-21. doi: 10.3743/KOSIM.2020.37.1.001
Lee, Yong-Gu. A Study on Book Categorization in Social Sciences Using kNN Classifiers and Table of Contents Text. Journal of the Korean Society for Information Management, 37(1), 1-21. doi: 10.3743/KOSIM.2020.37.1.001
Lee, Yong-Gu. A Study on Book Categorization in Social Sciences Using kNN Classifiers and Table of Contents Text. Journal of the Korean Society for Information Management. 2020; 37(1) 1-21. doi: 10.3743/KOSIM.2020.37.1.001
Lee, Yong-Gu. A Study on Book Categorization in Social Sciences Using kNN Classifiers and Table of Contents Text. Journal of the Korean Society for Information Management. 2020; 37(1), 1-21. Available from: doi:10.3743/KOSIM.2020.37.1.001
Lee, Yong-Gu. "A Study on Book Categorization in Social Sciences Using kNN Classifiers and Table of Contents Text" Journal of the Korean Society for Information Management 37, no.1 (2020) : 1-21. doi: 10.3743/KOSIM.2020.37.1.001