% Conference paper published in the PDPTA'05 proceedings (CSREA Press, pp. 946-949).
% Typed as inproceedings so that booktitle is honoured by standard styles.
@inproceedings{a3150bd43da64aaeb5fb7448a3bf3882,
  author    = {Clayton, Brian and Enright, Therese and Morrison, John P.},
  title     = {Running {MPI} jobs with {WebCom}},
  booktitle = {Proceedings of the 2005 International Conference on Parallel and Distributed Processing Techniques and Applications, {PDPTA}'05},
  publisher = {CSREA Press},
  year      = {2005},
  pages     = {946--949},
  isbn      = {9781932415605},
  language  = {English},
  keywords  = {Cluster, Condensed graphs, MPI},
  abstract  = {A ``typical'' MPI job consists of 4 components: an MPI binary; an optional machines file; a set of optional input files and a parameterised start script. Of these, the machines file and the starting script are most prone to change from run to run on the same parallel architecture or on a different architecture. Moving an MPI job to a different architecture will precipitate the greatest changes in these and possibly the other components. The work associated with making and managing these changes is tedious and error-prone, especially if the user-base is large, and/or the underlying system is dynamic in size or is heterogeneous. This problem can be addressed by employing an abstract machine to separate the MPI launch process from the underlying parallel architecture. In this role the WebCom abstract machine can readily be used to generate a parallel architecture from component machines, to dynamically create a machines file and startup script and, if necessary, to stage the binary and input files. Change management is also addressed by employing WebCom to manage user accounts, shared file space, data storage and on-going run-time costs.},
  note      = {Conference held 27--30 June 2005},
}