% Journal article record, keyed by ART001096104.
% NOTE(review): the second author was exported as the single token "LeeYong-Gu";
% it is split here as family name "Lee", given name "Yong-Gu" -- confirm against
% the publisher record for the DOI below.
@article{ART001096104,
  author  = {Chung, Young-Mee and Lee, Yong-Gu},
  title   = {Improving the Retrieval Effectiveness by Incorporating Word Sense Disambiguation Process},
  journal = {Journal of the Korean Society for Information Management},
  issn    = {1013-0799},
  year    = {2005},
  volume  = {22},
  number  = {2},
  pages   = {125--145},
  doi     = {10.3743/KOSIM.2005.22.2.125},
}
TY - JOUR
AU - Chung, Young-Mee
AU - Lee, Yong-Gu
TI - Improving the Retrieval Effectiveness by Incorporating Word Sense Disambiguation Process
JO - Journal of the Korean Society for Information Management
PY - 2005
VL - 22
IS - 2
PB - 한국정보관리학회
SP - 125
EP - 145
SN - 1013-0799
AB - This paper presents a semantic vector space retrieval model incorporating a word sense disambiguation algorithm in an attempt to improve retrieval effectiveness. Nine Korean homonyms are selected for the sense disambiguation and retrieval experiments. The total of approximately 120,000 news articles comprise the raw test collection and 18 queries including homonyms as query words are used for the retrieval experiments. A Naive Bayes classifier and EM algorithm representing supervised and unsupervised learning algorithms respectively are used for the disambiguation process. The Naive Bayes classifier achieved 92% disambiguation accuracy, while the clustering performance of the EM algorithm is 67% on the average. The retrieval effectiveness of the semantic vector space model incorporating the Naive Bayes classifier showed 39.6% precision achieving about 7.4% improvement. However, the retrieval effectiveness of the EM algorithm-based semantic retrieval is 3% lower than the baseline retrieval without disambiguation. It is worth noting that the performances of disambiguation and retrieval depend on the distribution patterns of homonyms to be disambiguated as well as the characteristics of queries.
KW - information retrieval
KW - word sense disambiguation
KW - Naive Bayes classifier
KW - EM algorithm
KW - clustering
KW - retrieval effectiveness
DO - 10.3743/KOSIM.2005.22.2.125
ER -
Young-Mee Chung and Yong-Gu Lee. (2005). Improving the Retrieval Effectiveness by Incorporating Word Sense Disambiguation Process. Journal of the Korean Society for Information Management, 22(2), 125-145.
Young-Mee Chung and Yong-Gu Lee. 2005, "Improving the Retrieval Effectiveness by Incorporating Word Sense Disambiguation Process", Journal of the Korean Society for Information Management, vol.22, no.2 pp.125-145. Available from: doi:10.3743/KOSIM.2005.22.2.125
Young-Mee Chung, Yong-Gu Lee "Improving the Retrieval Effectiveness by Incorporating Word Sense Disambiguation Process" Journal of the Korean Society for Information Management 22.2 pp.125-145 (2005) : 125.
Young-Mee Chung, Yong-Gu Lee. Improving the Retrieval Effectiveness by Incorporating Word Sense Disambiguation Process. 2005; 22(2), 125-145. Available from: doi:10.3743/KOSIM.2005.22.2.125
Young-Mee Chung and Yong-Gu Lee. "Improving the Retrieval Effectiveness by Incorporating Word Sense Disambiguation Process" Journal of the Korean Society for Information Management 22, no.2 (2005) : 125-145. doi: 10.3743/KOSIM.2005.22.2.125
Young-Mee Chung; Yong-Gu Lee. Improving the Retrieval Effectiveness by Incorporating Word Sense Disambiguation Process. Journal of the Korean Society for Information Management, 22(2), 125-145. doi: 10.3743/KOSIM.2005.22.2.125
Young-Mee Chung; Yong-Gu Lee. Improving the Retrieval Effectiveness by Incorporating Word Sense Disambiguation Process. Journal of the Korean Society for Information Management. 2005; 22(2) 125-145. doi: 10.3743/KOSIM.2005.22.2.125
Young-Mee Chung, Yong-Gu Lee. Improving the Retrieval Effectiveness by Incorporating Word Sense Disambiguation Process. 2005; 22(2), 125-145. Available from: doi:10.3743/KOSIM.2005.22.2.125
Young-Mee Chung and Yong-Gu Lee. "Improving the Retrieval Effectiveness by Incorporating Word Sense Disambiguation Process" Journal of the Korean Society for Information Management 22, no.2 (2005) : 125-145. doi: 10.3743/KOSIM.2005.22.2.125