% Conference paper from the SEKE 2008 proceedings. The conference name lives in
% `booktitle`; the conference dates are recorded in `note`.
@inproceedings{41725c09d50143daa712d6562106f11c,
  author    = {Dasgupta, Gargi and Ezenwoye, Onyeka and Fong, Liana and Kalayci, Selim and Sadjadi, {S. Masoud} and Viswanathan, Balaji},
  title     = {Design of a fault-tolerant job-flow manager for grid environments using standard technologies, job-flow patterns, and a transparent proxy},
  booktitle = {20th International Conference on Software Engineering and Knowledge Engineering, {SEKE} 2008},
  pages     = {814--819},
  year      = {2008},
  isbn      = {9781627486620},
  language  = {English (US)},
  keywords  = {BPEL, Fault tolerant, Grid computing, JSDL, Job-flow patterns, Peer-to-peer, Software design},
  abstract  = {The execution of job flow applications is a reality today in academic and industrial domains. Current approaches to execution of job flows often follow proprietary solutions on expressing the job flows and do not leverage recurrent job-flow patterns to address faults in Grid computing environments. In this paper, we provide a design solution to development of job-flow managers that uses standard technologies such as BPEL and JSDL to express job flows and employs a two-layer peer-to-peer architecture with interoperable protocols for cross-domain interactions among job-flow managers. In addition, we identify a number of recurring job-flow patterns and introduce their corresponding fault-tolerant patterns to address runtime faults and exceptions. Finally, to keep the business logic of job flows separate from their fault-tolerant behavior, we use a transparent proxy that intercepts job-flow execution at runtime to handle potential faults using a growing knowledge base that contains the most recently identified job-flow patterns and their corresponding fault-tolerant patterns.},
  note      = {20th International Conference on Software Engineering and Knowledge Engineering, SEKE 2008 ; Conference date: 01-07-2008 Through 03-07-2008},
}