% Journal article record; the key is kept unchanged so existing \cite commands still resolve.
% Authors use the "Last, First" form so BibTeX splits the names unambiguously.
% NOTE(review): surnames are assumed to be "Oh" and "Yun" -- confirm against the publication.
@article{ART002814605,
  author  = {Oh, Hyo-Jung and Yun, Bo-Hyun},
  title   = {Valid Data Conditions and Discrimination for Machine Learning: Case study on Dataset in the Public Data Portal},
  journal = {Journal of Internet of Things and Convergence},
  issn    = {2466-0078},
  year    = {2022},
  volume  = {8},
  number  = {1},
  pages   = {37--43},
  doi     = {10.20465/KIOTS.2022.8.1.037},
}
TY - JOUR
AU - Oh, Hyo-Jung
AU - Yun, Bo-Hyun
TI - Valid Data Conditions and Discrimination for Machine Learning: Case study on Dataset in the Public Data Portal
JO - Journal of Internet of Things and Convergence
PY - 2022
VL - 8
IS - 1
PB - The Korea Internet of Things Society
SP - 37
EP - 43
SN - 2466-0078
AB - The fundamental basis of AI technology is learningable data. Recently, the types and amounts of data collected and produced by the government or private companies are increasing exponentially, however, verified data that can be used for actual machine learning has not yet led to it. This study discusses the conditions that data actually can be used for machine learning should meet, and identifies factors that degrade data quality through case studies. To this end, two representative cases of developing a prediction model using public big data was selected, and data for actual problem solving was collected from the public data portal. Through this, there is a difference from the results of applying valid data screening criteria and post-processing. The ultimate purpose of this study is to argue the importance of data quality management that must be most fundamentally preceded before the development of machine learning technology, which is the core of artificial intelligence, and accumulating valid data.
KW - Valid Data
KW - Machine Learning
KW - Data Discrimination
KW - Quality of Data
KW - Public Big data
DO - 10.20465/KIOTS.2022.8.1.037
ER -
Hyo-Jung Oh and Yun Bo-Hyun. (2022). Valid Data Conditions and Discrimination for Machine Learning: Case study on Dataset in the Public Data Portal. Journal of Internet of Things and Convergence, 8(1), 37-43.
Hyo-Jung Oh and Yun Bo-Hyun. 2022, "Valid Data Conditions and Discrimination for Machine Learning: Case study on Dataset in the Public Data Portal", Journal of Internet of Things and Convergence, vol.8, no.1, pp.37-43. Available from: doi:10.20465/KIOTS.2022.8.1.037
Hyo-Jung Oh, Yun Bo-Hyun "Valid Data Conditions and Discrimination for Machine Learning: Case study on Dataset in the Public Data Portal" Journal of Internet of Things and Convergence 8.1 (2022): 37-43.
Hyo-Jung Oh, Yun Bo-Hyun. Valid Data Conditions and Discrimination for Machine Learning: Case study on Dataset in the Public Data Portal. Journal of Internet of Things and Convergence. 2022; 8(1), 37-43. Available from: doi:10.20465/KIOTS.2022.8.1.037
Hyo-Jung Oh and Yun Bo-Hyun. "Valid Data Conditions and Discrimination for Machine Learning: Case study on Dataset in the Public Data Portal" Journal of Internet of Things and Convergence 8, no.1 (2022) : 37-43. doi: 10.20465/KIOTS.2022.8.1.037
Hyo-Jung Oh; Yun Bo-Hyun. Valid Data Conditions and Discrimination for Machine Learning: Case study on Dataset in the Public Data Portal. Journal of Internet of Things and Convergence, 2022, 8(1), 37-43. doi: 10.20465/KIOTS.2022.8.1.037
Hyo-Jung Oh; Yun Bo-Hyun. Valid Data Conditions and Discrimination for Machine Learning: Case study on Dataset in the Public Data Portal. Journal of Internet of Things and Convergence. 2022; 8(1) 37-43. doi: 10.20465/KIOTS.2022.8.1.037
Hyo-Jung Oh, Yun Bo-Hyun. Valid Data Conditions and Discrimination for Machine Learning: Case study on Dataset in the Public Data Portal. Journal of Internet of Things and Convergence. 2022; 8(1), 37-43. Available from: doi:10.20465/KIOTS.2022.8.1.037
Hyo-Jung Oh and Yun Bo-Hyun. "Valid Data Conditions and Discrimination for Machine Learning: Case study on Dataset in the Public Data Portal" Journal of Internet of Things and Convergence 8, no.1 (2022) : 37-43. doi: 10.20465/KIOTS.2022.8.1.037