RISC - Research Institute for Symbolic Computation
  • @techreport{RISC119,
    author = {Károly Bósa and Wolfgang Schreiner},
    title = {{Task Logging, Rescheduling and Peer Checking in Distributed Maple}},
    language = {english},
    abstract = {We have extended the parallel computer algebra environment Distributed Maple by fault tolerance mechanisms such that the time spent in a long running computation is no longer wasted by the eventual occurrence of a session failure. The first mechanism is the logging of task return values and of shared object values such that after a failure the newly started session can (transparently to the application program) reuse already computed results. The second mechanism is the migration of tasks such that a session may tolerate the failure of individual nodes without overall failure. The third mechanism is the redirection of the messages such that a session may also tolerate the failure of the connections between nodes without overall failure.},
    number = {02-10},
    year = {2002},
    month = {March},
    institution = {RISC-Linz, Johannes Kepler University, Linz, Austria},
    length = {24}