% RISC technical report 02-10 (March 2002) on fault tolerance mechanisms in
% Distributed Maple.
% Notes for maintainers:
%   - Author names use the "Last, First" form with LaTeX accent escapes so the
%     entry sorts and labels correctly under classic 8-bit BibTeX as well as
%     under Biber.
%   - Only the system name in the title is brace-protected, so bibliography
%     styles remain free to apply their own casing to the rest of the title.
%   - "month" uses the predefined macro so styles can abbreviate/localise it.
%   - "language" and "length" are non-standard fields that standard styles
%     ignore; they are kept unchanged for tools that consume them.
@techreport{RISC119,
  author      = {B{\'o}sa, K{\'a}roly and Schreiner, Wolfgang},
  title       = {Task Logging, Rescheduling and Peer Checking in {Distributed Maple}},
  language    = {english},
  abstract    = {We have extended the parallel computer algebra environment Distributed
                 Maple by fault tolerance mechanisms such that the time spent in a long
                 running computation is not any wasted by the eventual occurrence of
                 session failure. The first mechanism is the logging of task return
                 values and of shared object values such that after a failure the
                 newly started session can (transparently to the application program)
                 reuse already computed result. The second mechanism is the migration
                 of tasks such that a session may tolerate the failure of individual
                 nodes without overall failure. The third mechanism is the redirection
                 of the messages such that a session may tolerate also the failure of
                 the connections between nodes without overall failure.},
  number      = {02-10},
  year        = {2002},
  month       = mar,
  institution = {RISC-Linz, Johannes Kepler University, Linz, Austria},
  length      = {24},
}