% Journal article by Euhee Kim (2019). All fields sit inside the entry's braces;
% the page range uses "--" and the proper noun in the title is brace-protected.
@article{ART002524861,
  author  = {Kim, Euhee},
  title   = {The Unsupervised Learning-based Language Modeling of Word Comprehension in {Korean}},
  journal = {Journal of The Korea Society of Computer and Information},
  year    = {2019},
  volume  = {24},
  number  = {11},
  pages   = {41--49},
  issn    = {1598-849X},
  doi     = {10.9708/jksci.2019.24.11.041},
}
TY  - JOUR
AU  - Kim, Euhee
TI  - The Unsupervised Learning-based Language Modeling of Word Comprehension in Korean
JO  - Journal of The Korea Society of Computer and Information
PY  - 2019
VL  - 24
IS  - 11
PB  - The Korean Society Of Computer And Information
SP  - 41
EP  - 49
SN  - 1598-849X
AB  - We are to build an unsupervised machine learning-based language model which can estimate the amount of information that are in need to process words consisting of subword-level morphemes and syllables. We are then to investigate whether the reading times of words reflecting their morphemic and syllabic structures are predicted by an information-theoretic measure such as surprisal. Specifically, the proposed Morfessor-based unsupervised machine learning model is first to be trained on the large dataset of sentences on Sejong Corpus and is then to be applied to estimate the information-theoretic measure on each word in the test data of Korean words. The reading times of the words in the test data are to be recruited from Korean Lexicon Project (KLP) Database. A comparison between the information-theoretic measures of the words in point and the corresponding reading times by using a linear mixed effect model reveals a reliable correlation between surprisal and reading time. We conclude that surprisal is positively related to the processing effort (i.e. reading time), confirming the surprisal hypothesis.
KW  - Unsupervised learning
KW  - Morfessor
KW  - Surprisal
KW  - Lexical processing
KW  - Word recognition
DO  - 10.9708/jksci.2019.24.11.041
ER  - 
Euhee Kim. (2019). The Unsupervised Learning-based Language Modeling of Word Comprehension in Korean. Journal of The Korea Society of Computer and Information, 24(11), 41-49.
Euhee Kim. 2019, "The Unsupervised Learning-based Language Modeling of Word Comprehension in Korean", Journal of The Korea Society of Computer and Information, vol.24, no.11, pp.41-49. Available from: doi:10.9708/jksci.2019.24.11.041
Euhee Kim. "The Unsupervised Learning-based Language Modeling of Word Comprehension in Korean." Journal of The Korea Society of Computer and Information 24.11 (2019): 41-49.
Euhee Kim. The Unsupervised Learning-based Language Modeling of Word Comprehension in Korean. Journal of The Korea Society of Computer and Information. 2019; 24(11), 41-49. Available from: doi:10.9708/jksci.2019.24.11.041
Euhee Kim. "The Unsupervised Learning-based Language Modeling of Word Comprehension in Korean" Journal of The Korea Society of Computer and Information 24, no.11 (2019): 41-49. doi: 10.9708/jksci.2019.24.11.041
Euhee Kim. The Unsupervised Learning-based Language Modeling of Word Comprehension in Korean. Journal of The Korea Society of Computer and Information, 2019, 24(11), 41-49. doi: 10.9708/jksci.2019.24.11.041
Euhee Kim. The Unsupervised Learning-based Language Modeling of Word Comprehension in Korean. Journal of The Korea Society of Computer and Information. 2019; 24(11): 41-49. doi: 10.9708/jksci.2019.24.11.041
Euhee Kim. The Unsupervised Learning-based Language Modeling of Word Comprehension in Korean. Journal of The Korea Society of Computer and Information. 2019; 24(11), 41-49. Available from: doi:10.9708/jksci.2019.24.11.041
Euhee Kim. "The Unsupervised Learning-based Language Modeling of Word Comprehension in Korean" Journal of The Korea Society of Computer and Information 24, no.11 (2019): 41-49. doi: 10.9708/jksci.2019.24.11.041