% Conference paper published in a Springer LNCS proceedings volume.
% Entry type is inproceedings (not inbook) so that styles print the paper
% title as the title and the proceedings as the container; the citation key
% is unchanged, so existing \cite commands keep working.
% NOTE(review): booktitle and volume were not present in the original export
% (booktitle merely repeated the series name). They are filled in from the
% volume that DOI prefix 10.1007/978-3-319-40259-8 appears to belong to;
% confirm against the publisher record.
@inproceedings{b59054cf4e0246a5b3f7125d05781acb,
  author    = {Wei, Hui and Wu, Shaopeng and Zhao, Youbing and Deng, Zhikun and Ersotelos, Nikolaos and Parvinzamir, Farzad and Liu, Baoquan and Liu, Enjie and Dong, Feng},
  title     = {Data mining, management and visualization in large scientific corpuses},
  booktitle = {E-Learning and Games: 10th International Conference, Edutainment 2016, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {9654},
  publisher = {Springer-Verlag},
  year      = {2016},
  pages     = {371--379},
  doi       = {10.1007/978-3-319-40259-8_32},
  isbn      = {9783319402581},
  language  = {English},
  keywords  = {Data management, Distributed storage, Document repository, Elasticsearch, Graph database, NoSql, Text mining, Visualization},
  abstract  = {Organizing scientific papers helps efficiently derive meaningful insights of the published scientific resources, enables researchers grasp rapid technological change and hence assists new scientific discovery. In this paper, we experiment text mining and data management of scientific publications for collecting and presenting useful information to support research. For efficient data management and fast information retrieval, four data storages are employed: a semantic repository, an index and search repository, a document repository and a graph repository, taking full advantage of their features and strength. The results show that the combination of these four repositories can effectively store and index the publication data with reliability and efficiency and hence supply meaningful information to support scientific research.},
}