% DEDISbench conference paper (2012). The volume number refers to the series given in the series field.
@inproceedings{PRP+12,
	author = {Paulo, Jo{\~a}o and Reis, P. and Pereira, Jos{\'e} Orlando and Sousa, Ant{\'o}nio Luis},
	title = {{DEDISbench}: A Benchmark for Deduplicated Storage Systems},
	booktitle = {Proceedings of the International Symposium on Secure Virtual Infrastructures - {ACSAC}},
	series = {Lecture Notes in Computer Science},
	volume = {7566},
	publisher = {Springer},
	address = {Rome, Italy},
	month = sep,
	year = {2012},
	abstract = {Deduplication is widely accepted as an effective technique for eliminating duplicated data in backup and archival systems. Nowadays, deduplication is also becoming appealing in cloud computing, where large-scale virtualized storage infrastructures hold huge data volumes with a significant share of duplicated content. There have thus been several proposals for embedding deduplication in storage appliances and file systems, providing different performance trade-offs while targeting both user and application data, as well as virtual machine images.
It is however hard to determine to what extent is deduplication useful in a particular setting and what technique will provide the best results. In fact, existing disk I/O micro-benchmarks are not designed for evaluating deduplication systems, following simplistic approaches for generating data written that lead to unrealistic amounts of duplicates.
We address this with DEDISbench, a novel micro-benchmark for evaluating disk I/O performance of block based deduplication systems. As the main contribution, we introduce the generation of a realistic duplicate distribution based on real datasets. Moreover, DEDISbench also allows simulating access hotspots and different load intensities for I/O operations. The usefulness of DEDISbench is shown by comparing it with Bonnie++ and IOzone open-source disk I/O micro-benchmarks on assessing two open-source deduplication systems, Opendedup and Lessfs, using Ext4 as a baseline. As a secondary contribution, our results lead to novel insight on the performance of these file systems.},
	attachments = {https://haslab.uminho.pt/sites/default/files/jtpaulo/files/pp12.pdf},
}
