% Conference paper on Natjam, from the SoCC 2013 proceedings.
% Review notes (text outside an entry is ignored by BibTeX and Biber):
%   - author names are stored in the unambiguous "Last, First" form;
%   - braces protect Natjam, Mapreduce and SoCC from style recasing;
%   - the percent sign in the abstract is escaped so it cannot start a TeX comment;
%   - the former series field was an exact duplicate of booktitle and was dropped;
%   - address now holds the publisher's city rather than a country.
@inproceedings{89e26cdafceb4fa3add05af987648a2d,
  author    = {Cho, Brian and Rahman, Muntasir and Chajed, Tej and Gupta, Indranil and Abad, Cristina and Roberts, Nathan and Lin, Philbert},
  title     = {{Natjam}: Design and Evaluation of Eviction Policies for Supporting Priorities and Deadlines in {Mapreduce} Clusters},
  booktitle = {Proceedings of the 4th Annual Symposium on Cloud Computing, {SoCC} 2013},
  publisher = {Association for Computing Machinery},
  address   = {New York, NY, USA},
  year      = {2013},
  doi       = {10.1145/2523616.2523624},
  isbn      = {9781450324281},
  language  = {English (US)},
  keywords  = {Deadlines, Hadoop, Mapreduce, Priorities, Scheduling},
  abstract  = {This paper presents Natjam, a system that supports arbitrary job priorities, hard real-time scheduling, and efficient preemption for Mapreduce clusters that are resource-constrained. Our contributions include: i) exploration and evaluation of smart eviction policies for jobs and for tasks, based on resource usage, task runtime, and job deadlines; and ii) a work-conserving task preemption mechanism for Mapreduce. We incorporated Natjam into the Hadoop YARN scheduler framework (in Hadoop 0.23). We present experiments from deployments on a test cluster, Emulab and a Yahoo! Inc. commercial cluster, using both synthetic workloads as well as Hadoop cluster traces from Yahoo!. Our results reveal that Natjam incurs overheads as low as 7\%, and is preferable to existing approaches.},
  note      = {4th Annual Symposium on Cloud Computing, {SoCC} 2013; Conference date: 01-10-2013 Through 03-10-2013},
}