% Journal article: text extraction and summarization from Web news
% (Journal of The Korea Society of Computer and Information, vol. 12, no. 5, 2007).
% NOTE(review): author names are normalized to "Family, Given" form on the
% assumption that Han, Sun and Yoo are the family names -- confirm against the paper.
@article{ART001201320,
  author  = {Han, Kwang Rok and Sun, Bokkeun and Yoo, Hyoungsun},
  title   = {Text Extraction and Summarization from Web News},
  journal = {Journal of The Korea Society of Computer and Information},
  issn    = {1598-849X},
  year    = {2007},
  volume  = {12},
  number  = {5},
  pages   = {1--10},
}
TY  - JOUR
AU  - Han Kwang Rok
AU  - Bokkeun Sun
AU  - Hyoungsun Yoo
TI  - Text Extraction and Summarization from Web News
JO  - Journal of The Korea Society of Computer and Information
PY  - 2007
VL  - 12
IS  - 5
PB  - The Korean Society Of Computer And Information
SP  - 1
EP  - 10
SN  - 1598-849X
AB  - Many types of information provided through the web including news contents contain unnecessary clutters. These clutters make it difficult to build automated information processing systems such as the summarization, extraction and retrieval of documents. We propose a system that extracts and summarizes news contents from the web. The extraction system receives news contents in HTML as input and builds an element tree similar to DOM tree, and extracts texts while removing clutters with the hyperlink attribute in the HTML tag from the element tree. Texts extracted through the extraction system are transferred to the summarization system, which extracts key sentences from the texts. We implement the summarization system using co-occurrence relation graph. The summarized sentences of this paper are expected to be transmissible to PDA or cellular phone by message services such as SMS.
KW  - Web News;Extraction;Summarization;Co-occurrence Relation Graph
DO  - 
UR  - 
ER  - 
Han Kwang Rok, Bokkeun Sun and Hyoungsun Yoo. (2007). Text Extraction and Summarization from Web News. Journal of The Korea Society of Computer and Information, 12(5), 1-10.
Han Kwang Rok, Bokkeun Sun and Hyoungsun Yoo. 2007, "Text Extraction and Summarization from Web News", Journal of The Korea Society of Computer and Information, vol.12, no.5 pp.1-10.
Han Kwang Rok, Bokkeun Sun, Hyoungsun Yoo "Text Extraction and Summarization from Web News" Journal of The Korea Society of Computer and Information 12.5 pp.1-10 (2007) : 1.
Han Kwang Rok, Bokkeun Sun, Hyoungsun Yoo. Text Extraction and Summarization from Web News. Journal of The Korea Society of Computer and Information. 2007; 12(5), 1-10.
Han Kwang Rok, Bokkeun Sun and Hyoungsun Yoo. "Text Extraction and Summarization from Web News" Journal of The Korea Society of Computer and Information 12, no.5 (2007) : 1-10.
Han Kwang Rok; Bokkeun Sun; Hyoungsun Yoo. Text Extraction and Summarization from Web News. Journal of The Korea Society of Computer and Information, 2007, 12(5), 1-10.
Han Kwang Rok; Bokkeun Sun; Hyoungsun Yoo. Text Extraction and Summarization from Web News. Journal of The Korea Society of Computer and Information. 2007; 12(5) 1-10.
Han Kwang Rok, Bokkeun Sun, Hyoungsun Yoo. Text Extraction and Summarization from Web News. Journal of The Korea Society of Computer and Information. 2007; 12(5), 1-10.
Han Kwang Rok, Bokkeun Sun and Hyoungsun Yoo. "Text Extraction and Summarization from Web News" Journal of The Korea Society of Computer and Information 12, no.5 (2007) : 1-10.