% Conference paper: distributed control in Harness, published in the ICCS 2002 proceedings, Part II.
% The proceedings part is recorded in booktitle and the LNCS volume in volume;
% number and edition are intentionally absent (they denote an issue number and a book edition).
% NOTE(review): volume 2330 is taken from the publisher's listing for ICCS 2002 Part II -- confirm.
@inproceedings{a4b55e9d7482496cba7701d1d0d50a0d,
author = "Engelmann, C. and Scott, S. L. and Geist, G. A.",
title = "Distributed peer-to-peer control in {Harness}",
abstract = "Harness is an adaptable fault-tolerant virtual machine environment for next-generation heterogeneous distributed computing developed as a follow on to PVM. It additionally enables the assembly of applications from plug-ins and provides fault-tolerance. This work describes the distributed control, which manages global state replication to ensure a high-availability of service. Group communication services achieve an agreement on an initial global state and a linear history of global state changes at all members of the distributed virtual machine. This global state is replicated to all members to easily recover from single, multiple and cascaded faults. A peer-to-peer ring network architecture and tunable multi-point failure conditions provide heterogeneity and scalability. Finally, the integration of the distributed control into the multi-threaded kernel architecture of Harness offers a fault-tolerant global state database service for plug-ins and applications.",
booktitle = "Computational Science, {ICCS} 2002 -- International Conference, Proceedings, Part {II}",
series = "Lecture Notes in Computer Science",
volume = "2330",
pages = "720--728",
publisher = "Springer Verlag",
year = "2002",
doi = "10.1007/3-540-46080-2_76",
isbn = "354043593X",
language = "English",
note = "International Conference on Computational Science, ICCS 2002 ; Conference date: 21-04-2002 Through 24-04-2002",
}