% Journal article: Han and Oh (2010), Journal of the Korean Society for Information Management 27(2).
@article{ART001456744,
  author  = {Han, Yoo-Jin and Oh, Seung-Woo},
  title   = {An Extraction Method of Bibliographic Information from the {US} Patents: Using an {HTML} Parsing Technique},
  journal = {Journal of the Korean Society for Information Management},
  issn    = {1013-0799},
  year    = {2010},
  volume  = {27},
  number  = {2},
  pages   = {7--20},
  doi     = {10.3743/KOSIM.2010.27.2.007},
}
TY - JOUR
AU - Han, Yoo-Jin
AU - Seung-Woo Oh
TI - An Extraction Method of Bibliographic Information from the US Patents: Using an HTML Parsing Technique
JO - Journal of the Korean Society for Information Management
PY - 2010
VL - 27
IS - 2
PB - 한국정보관리학회
SP - 7
EP - 20
SN - 1013-0799
AB - This study aims to provide a method of extracting the most recent information on US patent documents. An HTML parsing technique that can directly connect to the US Patent and Trademark Office (USPTO) Web page is adopted. After obtaining a list of 50 documents through a keyword searching method, this study suggested an algorithm, using HTML parsing techniques, which can extract a patent number, an applicant, and the US patent class information. The study also revealed an algorithm by which we can extract both patents and subsequent patents using their closely connected relationship, which is a very distinctive characteristic of US patent documents. Although the proposed method has several limitations, it can supplement existing databases effectively in terms of timeliness and comprehensiveness.
KW - US patents;bibliographic information;extraction;HTML parsing
DO - 10.3743/KOSIM.2010.27.2.007
ER -
Han, Yoo-Jin and Seung-Woo Oh. (2010). An Extraction Method of Bibliographic Information from the US Patents: Using an HTML Parsing Technique. Journal of the Korean Society for Information Management, 27(2), 7-20.
Han, Yoo-Jin and Seung-Woo Oh. 2010, "An Extraction Method of Bibliographic Information from the US Patents: Using an HTML Parsing Technique", Journal of the Korean Society for Information Management, vol.27, no.2 pp.7-20. Available from: doi:10.3743/KOSIM.2010.27.2.007
Han, Yoo-Jin, Seung-Woo Oh "An Extraction Method of Bibliographic Information from the US Patents: Using an HTML Parsing Technique" Journal of the Korean Society for Information Management 27.2 pp.7-20 (2010) : 7.
Han, Yoo-Jin, Seung-Woo Oh. An Extraction Method of Bibliographic Information from the US Patents: Using an HTML Parsing Technique. 2010; 27(2), 7-20. Available from: doi:10.3743/KOSIM.2010.27.2.007
Han, Yoo-Jin and Seung-Woo Oh. "An Extraction Method of Bibliographic Information from the US Patents: Using an HTML Parsing Technique" Journal of the Korean Society for Information Management 27, no.2 (2010) : 7-20. doi: 10.3743/KOSIM.2010.27.2.007
Han, Yoo-Jin; Seung-Woo Oh. An Extraction Method of Bibliographic Information from the US Patents: Using an HTML Parsing Technique. Journal of the Korean Society for Information Management, 27(2), 7-20. doi: 10.3743/KOSIM.2010.27.2.007
Han, Yoo-Jin; Seung-Woo Oh. An Extraction Method of Bibliographic Information from the US Patents: Using an HTML Parsing Technique. Journal of the Korean Society for Information Management. 2010; 27(2) 7-20. doi: 10.3743/KOSIM.2010.27.2.007
Han, Yoo-Jin, Seung-Woo Oh. An Extraction Method of Bibliographic Information from the US Patents: Using an HTML Parsing Technique. 2010; 27(2), 7-20. Available from: doi:10.3743/KOSIM.2010.27.2.007
Han, Yoo-Jin and Seung-Woo Oh. "An Extraction Method of Bibliographic Information from the US Patents: Using an HTML Parsing Technique" Journal of the Korean Society for Information Management 27, no.2 (2010) : 7-20. doi: 10.3743/KOSIM.2010.27.2.007