@inproceedings{2b17b5642aca49438040336a6fa57171,
title = "EclipseMR: Distributed and Parallel Task Processing with Consistent Hashing",
abstract = "We present EclipseMR, a novel MapReduce framework prototype that efficiently utilizes a large distributed memory in cluster environments. EclipseMR consists of double-layered consistent hash rings-a decentralized DHT-based file system and an in-memory key-value store that employs consistent hashing. The in-memory key-value store in EclipseMR is designed not only to cache local data but also remote data as well so that globally popular data can be distributed across cluster serversand found by consistent hashing.In order to leverage large distributed memories and increase the cache hit ratio, we propose a locality-Aware fair (LAF) job scheduler that works as the load balancer for the distributed in-memorycaches. Based on hash keys, the LAF job scheduler predicts which servers have reusable data, and assigns tasks to the servers so that they can be reused. The LAF job scheduler makes its best efforts to strike a balance between data locality and load balance, which often conflict with each other. We evaluate EclipseMR by quantifying the performance effect of each component using several representative MapReduce applications and show EclipseMR is faster than Hadoop andSpark by a large margin for various applications.",
keywords = "Consistent Hashing, Distributed Caching, Distributed Hash Table, MapReduce",
author = "Sanchez, \{Vicente A.B.\} and Wonbae Kim and Youngmoon Eom and Kibeom Jin and Moohyeon Nam and Deukyeon Hwang and Kim, \{Jik Soo\} and Beomseok Nam",
note = "Publisher Copyright: {\textcopyright} 2017 IEEE.; 2017 IEEE International Conference on Cluster Computing, CLUSTER 2017 ; Conference date: 05-09-2017 Through 08-09-2017",
year = "2017",
month = sep,
day = "22",
doi = "10.1109/CLUSTER.2017.12",
language = "English",
series = "Proceedings - IEEE International Conference on Cluster Computing, ICCC",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "322--332",
booktitle = "Proceedings - 2017 IEEE International Conference on Cluster Computing, CLUSTER 2017",
}