% Conference paper record (PDP 2011 proceedings, IEEE Computer Society).
% Conventions used in this entry:
%   - names are stored in "Last, First" form so BibTeX never has to guess the split;
%   - only words that must keep their capitalisation are brace-protected in the
%     title and booktitle, leaving the rest to the bibliography style;
%   - month uses the predefined three-letter macro, pages use an en-dash range;
%   - the address field holds the conference venue, as in the original record.
@InProceedings{Supelec688,
  author    = {Galtier, Virginie and Makassikis, Constantinos and Vialle, Stephane},
  title     = {A {Javaspace-based} Framework for Efficient Fault-Tolerant Master-Worker Distributed Applications},
  booktitle = {Proceedings of the 19th International {Euromicro} Conference on Parallel, Distributed and Network-based Processing ({PDP} 2011)},
  editor    = {Cotronis, Yiannis and Danelutto, Marco and Papadopoulos, George Angelos},
  publisher = {IEEE Computer Society},
  address   = {Ayia Napa, Cyprus},
  year      = {2011},
  month     = feb,
  pages     = {272--276},
  isbn      = {978-0-7695-4328-4},
  abstract  = {We propose a framework built around a JavaSpace to ease the
               development of bag-of-tasks applications. The framework may
               optionally and automatically tolerate transient crash failures
               occurring on any of the distributed elements. It relies on
               checkpointing and underlying middleware mechanisms to do so. To
               further improve checkpointing efficiency, both in size and
               frequency, the programmer can introduce intermediate user-defined
               checkpoint data and code within the task processing program. The
               framework used without fault tolerance accelerates application
               development, does not introduce runtime overhead and yields to
               expected speedup. When enabling fault tolerance, our framework
               allows, despite failures, correct completion of applications with
               limited runtime and data storage overheads. Experiments run with
               up to 128 workers study the impact of some user-related and
               implementation-related parameters on overall performance, and
               reveal good performances for classical JavaSpace-based
               master-worker application profiles.},
}