@inproceedings{2e3237a7d7c84d2b890b6c1c25009d84,
title = "A privacy preserving platform for MapReduce",
abstract = "Big data applications typically require a large number of clusters, running in parallel, to process data fast and more efficiently. This is typically controlled and managed by MapReduce. In MapReduce operations, Mappers transform input original key/value pairs to a set of intermediate key/value pairs while Reducers aggregate a set of intermediate values, compute and write to the output. The output however can bring serious privacy concerns. Firstly, the output can directly leak sensitive information because it contains the global view of the final computation. Secondly, the output can also indirectly leak information via composite attacks where the adversary can link it with public information published via different sources such as Facebook or Twitter. To address such privacy concerns, we propose a privacy preserving platform which can prevent privacy leakage in MapReduce. Our platform can be plugged into the Reduce phase to sanitize the final output in such a way that the privacy is preserved while it yet provides a high data utility. We demonstrate the feasibility of our platform by providing empirical studies and highlights that our proposal can be used for real life applications.",
keywords = "Differential privacy, K-anonymity, MapReduce, New york taxi data",
author = "Bazai, {Sibghat Ullah} and Julian Jang-Jaccard and Xuyun Zhang",
year = "2017",
month = jan,
day = "1",
doi = "10.1007/978-981-10-5421-1_8",
language = "English",
isbn = "9789811054204",
series = "Communications in Computer and Information Science",
publisher = "Springer, Springer Nature",
pages = "88--99",
editor = "Lynn Batten and Kim, {Dong Seong} and Xuyun Zhang and Gang Li",
booktitle = "Applications and Techniques in Information Security",
address = "United States",
note = "8th International Conference on Applications and Techniques in Information Security, ATIS 2017 ; Conference date: 06-07-2017 Through 07-07-2017",
}