@comment{Journal article record. The citation key is kept exactly as exported so existing citations continue to resolve.}
@article{ART001331823,
  author  = {Lee, Yong-Gu},
  title   = {A Study on Extracting News Contents from News Web Pages},
  journal = {Journal of the Korean Society for Information Management},
  issn    = {1013-0799},
  year    = {2009},
  volume  = {26},
  number  = {1},
  pages   = {305--320},
  doi     = {10.3743/KOSIM.2009.26.1.305},
}
TY - JOUR
AU - Yong-Gu Lee
TI - A Study on Extracting News Contents from News Web Pages
JO - Journal of the Korean Society for Information Management
PY - 2009
VL - 26
IS - 1
PB - 한국정보관리학회
SP - 305
EP - 320
SN - 1013-0799
AB - The news pages provided through the web contain unnecessary information. This causes low performance and inefficiency of the news processing system. In this study, news content extraction methods based on sentence identification and block-level tags in news web pages were suggested. To obtain optimal performance, combinations of these methods were applied. The results showed good performance when using an extraction method which applied the sentence identification and eliminated hyperlink text from web pages. Moreover, this method showed better results when combined with the extraction method which used block-level tags. Extraction methods which used sentence identification were effective for raising the extraction recall ratio.
KW - web news content extraction;sentence based extraction;block based extraction;web mining
DO - 10.3743/KOSIM.2009.26.1.305
ER -
Yong-Gu Lee. (2009). A Study on Extracting News Contents from News Web Pages. Journal of the Korean Society for Information Management, 26(1), 305-320.
Yong-Gu Lee. 2009, "A Study on Extracting News Contents from News Web Pages", Journal of the Korean Society for Information Management, vol.26, no.1 pp.305-320. Available from: doi:10.3743/KOSIM.2009.26.1.305
Yong-Gu Lee "A Study on Extracting News Contents from News Web Pages" Journal of the Korean Society for Information Management 26.1 pp.305-320 (2009) : 305.
Yong-Gu Lee. A Study on Extracting News Contents from News Web Pages. Journal of the Korean Society for Information Management. 2009; 26(1), 305-320. Available from: doi:10.3743/KOSIM.2009.26.1.305
Yong-Gu Lee. "A Study on Extracting News Contents from News Web Pages" Journal of the Korean Society for Information Management 26, no.1 (2009) : 305-320. doi: 10.3743/KOSIM.2009.26.1.305
Yong-Gu Lee. A Study on Extracting News Contents from News Web Pages. Journal of the Korean Society for Information Management, 26(1), 305-320. doi: 10.3743/KOSIM.2009.26.1.305
Yong-Gu Lee. A Study on Extracting News Contents from News Web Pages. Journal of the Korean Society for Information Management. 2009; 26(1) 305-320. doi: 10.3743/KOSIM.2009.26.1.305
Yong-Gu Lee. A Study on Extracting News Contents from News Web Pages. Journal of the Korean Society for Information Management. 2009; 26(1), 305-320. Available from: doi:10.3743/KOSIM.2009.26.1.305
Yong-Gu Lee. "A Study on Extracting News Contents from News Web Pages" Journal of the Korean Society for Information Management 26, no.1 (2009) : 305-320. doi: 10.3743/KOSIM.2009.26.1.305