@comment{
  Conference paper in the ICCCI 2019 proceedings (Lecture Notes in Computer
  Science series). The citation key is the exporter-generated identifier and
  is kept as-is so existing \cite commands keep resolving.
  month/day are the values supplied by the export; the conference itself ran
  04-09-2019 through 06-09-2019 (see the note field).
  NOTE(review): no LNCS volume number is recorded -- add a volume field once
  confirmed against the publisher record.
  NOTE(review): address holds a country rather than the publisher's city --
  confirm and replace with the city if the target style prints it.
}
@inproceedings{1214d1492729402a9a2f30dd6cc86ca9,
title = "Named Entity Extraction from Semi-structured Data Using Machine Learning Algorithms",
abstract = "The modern society have been witnessed that intensive development of Internet technologies had followed to information explosion during last decades. This explosion had been expressing by an exponential growth of data volume among the low-quality information. This paper is designed to provide detailed information about some intellectual tools which are support decision taking by automatic knowledge extraction. In the first part of paper, we considered a preprocessing contains morphological analysis of texts. Then we had considered the model of text documents in the form of a hypergraph and implementation of the random walk method to extract semantically close word{\textquoteright}s pairs, in other words, pairs that often appears together. Result of calculations is matrix with word affinity coefficients corresponding to each other component of vocabulary vector. In the second part we describe training of neural network for linguistic constructions extraction. These ones include possible values of text named entities descriptors. The neural network enables to retrieve information on one preselected descriptor, for example, location, in the form of the final result of the name of geographical objects. In a general case, the neural network can retrieve information on several descriptors simultaneously.",
keywords = "Entity extraction, Machine learning algorithms, Neural networks, Random walk method, Semi-structured data",
author = "Madina Mansurova and Vladimir Barakhnin and Yerzhan Khibatkhanuly and Ilya Pastushkov",
year = "2019",
month = jan,
day = "1",
doi = "10.1007/978-3-030-28374-2_6",
language = "English",
isbn = "9783030283735",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer-Verlag GmbH and Co. KG",
pages = "58--69",
editor = "Nguyen, {Ngoc Thanh} and Chbeir, Richard and Exposito, Ernesto and Aniort{\'e}, Philippe and Trawinski, Bogdan",
booktitle = "Computational Collective Intelligence - 11th International Conference, ICCCI 2019, Proceedings",
address = "Germany",
note = "11th International Conference on Computational Collective Intelligence, ICCCI 2019 ; Conference date: 04-09-2019 Through 06-09-2019",
}