RISC: Research Institute for Symbolic Computation
  @comment{RISC120: refereed workshop paper. The fields isbn_issn, refereed, length, conferencename and institution are database-specific and ignored by standard styles; isbn mirrors isbn_issn in standard form.}
  @inproceedings{RISC120,
    author         = {Bósa, Károly and Schreiner, Wolfgang},
    title          = {Tolerating Stop Failures in {Distributed Maple}},
    booktitle      = {Distributed and Parallel Systems - Cluster and Grid Computing},
    editor         = {Kacsuk, Péter and Kranzmüller, Dieter and Németh, Zsolt and Volkert, Jens},
    pages          = {203--210},
    publisher      = {Kluwer Academic Publishers Group},
    year           = {2002},
    isbn           = {1-4020-7209-0},
    isbn_issn      = {ISBN 1-4020-7209-0},
    language       = {english},
    abstract       = {Earlier we introduced some fault tolerance mechanisms to the parallel computer algebra system Distributed Maple such that a session may tolerate the failure of nodes and connections without overall failure. We have extended this fault tolerance by some advanced mechanisms. The first is the reconnection of a node after a connection failure such that a session does not deadlock. The second mechanism is the restarting of a node after a failure such that the session does not fail. The third mechanism is the change of the root node such that a session may tolerate also the failure of the root without overall failure.},
    keywords       = {distributed systems, fault tolerance, computer algebra},
    refereed       = {yes},
    institution    = {RISC-Linz, Johannes Kepler University, Linz, Austria},
    length         = {8},
    conferencename = {4th Austrian-Hungarian Workshop on Distributed and Parallel Processing}