% Conference paper by Kennedy and Morrison, PDPTA'05 proceedings, pp. 504--513.
% The proceedings title is stored once, in booktitle; it is deliberately not
% repeated in a series field, so styles that print both do not emit it twice.
@inproceedings{271ea1e0e5d04d6db441268260a6a5df,
  author    = {Kennedy, James J. and Morrison, John P.},
  title     = {Lineage management for networks of varying reliability},
  booktitle = {Proceedings of the 2005 International Conference on Parallel and Distributed Processing Techniques and Applications, {PDPTA}'05},
  pages     = {504--513},
  year      = {2005},
  isbn      = {9781932415582},
  language  = {English},
  keywords  = {Dynamic fault tolerance, Grid computing, Quality of service, WebCom},
  note      = {2005 International Conference on Parallel and Distributed Processing Techniques and Applications, PDPTA'05 ; Conference date: 27-06-2005 Through 30-06-2005},
  abstract  = {In distributed and grid applications, complex work dependencies may build between machines during execution and the occurrence of faults may have a detrimental impact on the execution profile. An efficient fault tolerance policy should aim to reduce this impact, whilst taking into account the varying reliability of machines and sites taking part in the computation. This paper proposes a Lineage Management algorithm to protect the work dependency topology. This is accomplished by combining processor replacement mechanisms with data retention ``housekeeping'' on participating machines. The number of concurrent faults catered for is linearly dependent on the amount of housekeeping performed. This housekeeping ``throttle'' can then be adjusted from machine to machine in accordance with the reliability of machines or sites.},
}