% Journal article by Kim (2019); the same record follows below in RIS form.
@article{ART002480029,
  author  = {Kim, Pan Jun},
  title   = {An Analytical Study on Automatic Classification of Domestic Journal articles Using {Random Forest}},
  journal = {Journal of the Korean Society for Information Management},
  issn    = {1013-0799},
  year    = {2019},
  volume  = {36},
  number  = {2},
  pages   = {57--77},
  doi     = {10.3743/KOSIM.2019.36.2.057},
}
TY - JOUR
AU - Kim, Pan Jun
TI - An Analytical Study on Automatic Classification of Domestic Journal articles Using Random Forest
JO - Journal of the Korean Society for Information Management
PY - 2019
VL - 36
IS - 2
PB - 한국정보관리학회
SP - 57
EP - 77
SN - 1013-0799
AB - Random Forest (RF), a representative ensemble technique, was applied to automatic classification of journal articles in the field of library and information science. Especially, I performed various experiments on the main factors such as tree number, feature selection, and learning set size in terms of classification performance that automatically assigns class labels to domestic journals. Through this, I explored ways to optimize the performance of random forests (RF) for imbalanced datasets in real environments. Consequently, for the automatic classification of domestic journal articles, Random Forest (RF) can be expected to have the best classification performance when using tree number interval 100〜1000(C), small feature set (10%) based on chi-square statistic (CHI), and most learning sets (9-10 years).
KW - automatic classification
KW - automatic annotation
KW - digital curation
KW - journal articles
KW - random forest (RF)
KW - multi-label classification
KW - imbalanced data
KW - feature selection
DO - 10.3743/KOSIM.2019.36.2.057
ER -
Kim, Pan Jun. (2019). An Analytical Study on Automatic Classification of Domestic Journal articles Using Random Forest. Journal of the Korean Society for Information Management, 36(2), 57-77.
Kim, Pan Jun. 2019, "An Analytical Study on Automatic Classification of Domestic Journal articles Using Random Forest", Journal of the Korean Society for Information Management, vol. 36, no. 2, pp. 57-77. Available from: doi:10.3743/KOSIM.2019.36.2.057
Kim, Pan Jun "An Analytical Study on Automatic Classification of Domestic Journal articles Using Random Forest" Journal of the Korean Society for Information Management 36.2 (2019): 57-77.
Kim, Pan Jun. An Analytical Study on Automatic Classification of Domestic Journal articles Using Random Forest. Journal of the Korean Society for Information Management. 2019; 36(2), 57-77. Available from: doi:10.3743/KOSIM.2019.36.2.057
Kim, Pan Jun. "An Analytical Study on Automatic Classification of Domestic Journal articles Using Random Forest" Journal of the Korean Society for Information Management 36, no.2 (2019) : 57-77. doi: 10.3743/KOSIM.2019.36.2.057
Kim, Pan Jun. An Analytical Study on Automatic Classification of Domestic Journal articles Using Random Forest. Journal of the Korean Society for Information Management, 36(2), 57-77. doi: 10.3743/KOSIM.2019.36.2.057
Kim, Pan Jun. An Analytical Study on Automatic Classification of Domestic Journal articles Using Random Forest. Journal of the Korean Society for Information Management. 2019; 36(2) 57-77. doi: 10.3743/KOSIM.2019.36.2.057
Kim, Pan Jun. An Analytical Study on Automatic Classification of Domestic Journal articles Using Random Forest. Journal of the Korean Society for Information Management. 2019; 36(2), 57-77. Available from: doi:10.3743/KOSIM.2019.36.2.057
Kim, Pan Jun. "An Analytical Study on Automatic Classification of Domestic Journal articles Using Random Forest" Journal of the Korean Society for Information Management 36, no.2 (2019) : 57-77. doi: 10.3743/KOSIM.2019.36.2.057