% Conference paper by Cha and Lee on TF-IDF-based classification of internet
% articles by industry type (CSA 2017; Lecture Notes in Electrical Engineering).
% Names are stored in "Last, First" form and the DOI is stored bare (unescaped).
@inproceedings{5990b3ef1019475abac54f9222550497,
  author    = {Cha, Jonghun and Lee, Jee Hyong},
  title     = {Internet articles classification by industry types based on {TF-IDF}},
  booktitle = {Advances in Computer Science and Ubiquitous Computing - {CSA-CUTE} 17},
  editor    = {Yi, Gangman and Sung, Yunsick and Park, James J. and Loia, Vincenzo},
  series    = {Lecture Notes in Electrical Engineering},
  publisher = {Springer Verlag},
  year      = {2018},
  pages     = {1121--1125},
  doi       = {10.1007/978-981-10-7605-3_179},
  isbn      = {9789811076046},
  language  = {English},
  keywords  = {Classification, Industry, Internet article, TF-IDF},
  abstract  = {In order to understand a specific industry field, people usually look at the financial statements of the companies relevant to the industry field. Financial statements have diverse and numerical information but have past financial states of companies because those are usually quarterly reported. So, needs to timely obtain the current states of an industry field is increasing. Proposed method is focusing on internet articles because they are easy to obtain and updated with new information every day. As a preliminary study of extracting information on industries from internet articles, this paper proposes a method to classify internet articles by industry types. The proposed method in this paper computes importance values of nouns in internet articles based on TF-IDF. Using calculated importance values, proposed method classifies articles by industry types. Through experiments, it is proven that proposed method can achieve high accuracy in industry article classification.},
  note      = {Publisher Copyright: {\textcopyright} Springer Nature Singapore Pte Ltd. 2018.; International Conference on Computer Science and its Applications, CSA 2017 ; Conference date: 18-12-2017 Through 20-12-2017},
}