% Conference paper from the ICCSA 2013 proceedings (LNCS, part 1 of the proceedings set).
% The citation key is kept exactly as exported so existing citations keep resolving.
% The part designation lives in booktitle; number/edition are not used for it.
@inproceedings{0babcf42a9534b838bc45dc6f3a32bab,
  author    = {Kim, Keonwoo and Kim, Jeehong and Min, Changwoo and Eom, Young Ik},
  title     = {Content-based chunk placement scheme for decentralized deduplication on distributed file systems},
  booktitle = {Computational Science and Its Applications, {ICCSA} 2013 -- 13th International Conference, Proceedings, Part {I}},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer Verlag},
  year      = {2013},
  pages     = {173--183},
  doi       = {10.1007/978-3-642-39637-3_14},
  isbn      = {9783642396366},
  language  = {English},
  keywords  = {Chunk placement, Consistent hashing, Deduplication, Distributed file system},
  note      = {13th International Conference on Computational Science and Its Applications, ICCSA 2013; Conference date: 24-06-2013 Through 27-06-2013},
  abstract  = {The rapid growth of data size causes several problems such as storage limitation and increment of data management cost. In order to store and manage massive data, Distributed File System (DFS) is widely used. Furthermore, in order to reduce the volume of storage, data deduplication schemes are being extensively studied. The data deduplication increases the available storage capacity by eliminating duplicated data. However, deduplication process causes performance overhead such as disk I/O. In this paper, we propose a content-based chunk placement scheme to increase deduplication rate on the DFS. To avoid performance overhead caused by deduplication process, we use lessfs in each chunk server. With our design, our system performs decentralized deduplication process in each chunk server. Moreover, we use consistent hashing for chunk allocation and failure recovery. Our experimental results show that the proposed system reduces the storage space by 60\% than the system without consistent hashing.},
}