@inproceedings{acde7b5e3dff4d07abf93c09e544bbb6,
title = "Managing heterogeneous data on a big data platform: A multi-criteria decision making model for data-intensive science",
abstract = "This paper presents an approach to solving the data variety problem of big data through an offline and online decisionmaking system. We present a graph-based approach to imitate real-world problem domain with a set of criteria and problem solvers. We introduce a Multi-criteria decision-making model to select a set of problem solvers that meets the set of criteria most. Suppose a system is processing Twitter data that comes as a stream of JSON records from multiple data sources. The decision system determines which of the available methods to use for a list of requirements (criteria). When multiple criteria (must meet requirements) coexist in a problem domain, their order of importance against the criteria, the mutual influence on each other and level of indispensability forms a graphic structure. In the proposed model, we consider each vertex of the graph as a criterion or benefit of an agent against the criterion. The mutual influence of multiple agents is denoted by the connecting edges of the graph. We also proposed a fuzzy graph framework to model real-world unpredictability. The model produces benchmarking results for each of the problem solvers in terms of absolute values to support decision making. The model is implemented through TopBread, Resource Description Framework (RDF), and RDF Data Query Language (RDQL). The key advantage of the proposed model over the existing ones is that the framework can operate in a dual-mode - both as a standalone offline tool and as an online decision-making gateway, it can also be used in high-velocity ingestion scenarios.",
keywords = "3 Vs of big data, Fuzzy graph, NoSQL databases, Terms - Multi criteria decision making. Multi agent systems",
author = "Gautam Pal and Katie Atkinson and Gangmin Li",
note = "Funding Information: Funding: This research was funded by Accenture Technology Labs, Beijing, China. Grant number: RDF 15-02-35. Project code: RDS10120180003. Publisher Copyright: {\textcopyright} 2020 IEEE.; 2020 IEEE International Conference on Big Data and Smart Computing, BigComp 2020 ; Conference date: 19-02-2020 Through 22-02-2020",
year = "2020",
month = feb,
doi = "10.1109/BigComp48618.2020.00-69",
language = "English",
series = "Proceedings - 2020 IEEE International Conference on Big Data and Smart Computing, BigComp 2020",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "229--239",
editor = "Wookey Lee and Luonan Chen and Yang-Sae Moon and Julien Bourgeois and Mehdi Bennis and Yu-Feng Li and Young-Guk Ha and Hyuk-Yoon Kwon and Alfredo Cuzzocrea",
booktitle = "Proceedings - 2020 IEEE International Conference on Big Data and Smart Computing, BigComp 2020",
}