% Conference paper in the eScience 2017 proceedings (conference dates are in the note field).
% Authors are given in "Last, First" form; MapReduce is brace-protected against style recasing.
% The series field of the raw export repeated booktitle verbatim and has been dropped so the
% proceedings name is not printed twice.
% NOTE(review): address holds a country, not the publisher's city -- confirm and replace.
@inproceedings{b95cd096ceaf4798954a5dd55a609d80,
  title = "Energy-efficient dynamic scheduling of deadline-constrained {MapReduce} workflows",
  abstract = "Big data workflows comprised of moldable parallel MapReduce programs running on a large number of processors have become a main consumer of energy at data centers. The degree of parallelism of each moldable job in such workflows has a significant impact on the energy efficiency of parallel computing systems, which remains largely unexplored. In this paper, we validate with experimental results the moldable parallel computing model where the dynamic energy consumption of a moldable job increases with the number of parallel tasks. Based on our validation, we construct rigorous cost models and formulate a dynamic scheduling problem of deadline-constrained MapReduce workflows to minimize energy consumption in Hadoop systems. We propose a semi-dynamic online scheduling algorithm based on adaptive task partitioning to reduce dynamic energy consumption while meeting performance requirements from a global perspective, and also design the corresponding system modules for algorithm implementation in Hadoop architecture. The performance superiority of the proposed algorithm in terms of dynamic energy saving and deadline violation is illustrated by extensive simulation results in Hadoop/YARN in comparison with existing algorithms, and the core module of adaptive task partitioning is further validated through real-life workflow implementation and experimental results using the Oozie workflow engine in Hadoop/YARN systems.",
  keywords = "Big data, MapReduce, job scheduling, scientific workflow",
  author = "Shu, Tong and Wu, Chase Q.",
  note = "Publisher Copyright: {\textcopyright} 2017 IEEE.; 13th IEEE International Conference on eScience, eScience 2017 ; Conference date: 24-10-2017 Through 27-10-2017",
  year = "2017",
  month = nov,
  day = "14",
  doi = "10.1109/eScience.2017.18",
  language = "English (US)",
  publisher = "Institute of Electrical and Electronics Engineers Inc.",
  pages = "393--402",
  booktitle = "Proceedings - 13th IEEE International Conference on eScience, eScience 2017",
  address = "United States",
}