% Conference paper by Qishi Wu and Yi Gu in the ICPADS 2010 proceedings, pages 508--515.
% The citation key is the exporter-generated identifier; it is left unchanged so that
% existing citations of this entry keep resolving.
% Acronyms are brace-protected so that styles which recase fields cannot lowercase them.
% Conference dates in the note field are given in ISO 8601 (YYYY-MM-DD); the exported
% form was day-month-year.
@inproceedings{84b4a74ee2764c7ea6032fb3f94bc28b,
  author    = {Wu, Qishi and Gu, Yi},
  title     = {A distributed workflow mapping algorithm for minimum end-to-end delay under fault-tolerance constraint},
  booktitle = {Proceedings - 16th International Conference on Parallel and Distributed Systems, {ICPADS} 2010},
  series    = {Proceedings of the International Conference on Parallel and Distributed Systems - {ICPADS}},
  pages     = {508--515},
  year      = {2010},
  doi       = {10.1109/ICPADS.2010.38},
  isbn      = {9780769543079},
  language  = {English (US)},
  keywords  = {Distributed algorithm, End-to-end delay, Fault tolerance, Scientific workflow},
  abstract  = {Many large-scale scientific applications feature distributed computing workflows of complex structures that must be executed and transferred in shared wide-area networks consisting of unreliable nodes and links. Mapping these computing workflows in such faulty network environments for optimal latency while ensuring certain fault tolerance is crucial to the success of eScience that requires both performance and reliability. We construct analytical cost models and formulate workflow mapping as an optimization problem under failure rate constraint. We propose a distributed heuristic mapping solution based on recursive critical path to achieve minimum end-to-end delay and satisfy a pre-specified overall failure rate for a guaranteed level of fault tolerance. The performance superiority of the proposed mapping solution is illustrated by extensive simulation-based comparisons with existing mapping algorithms.},
  note      = {16th {IEEE} International Conference on Parallel and Distributed Systems, {ICPADS} 2010 ; Conference date: 2010-12-08 through 2010-12-10},
}