% Conference paper presented at COMPCON Spring '93 (see the note field for the event name and dates).
% The citation key is kept unchanged so that existing \cite commands keep resolving.
@inproceedings{5339afc7927d492b999f70b743687dc6,
author = "Carter, John B. and Cox, Alan L. and Dwarkadas, Sandhya and Elnozahy, Elmootazbellah N. and Johnson, David B. and Keleher, Pete and Rodriguez, Steven and Yu, Weimin and Zwaenepoel, Willy",
title = "Network multicomputing using recoverable distributed shared memory",
abstract = "A network multicomputer is a multiprocessor in which the processors are connected by general-purpose networking technology, in contrast to current distributed memory multi-processors where a dedicated special-purpose interconnect is used. The advent of high-speed general-purpose networks provides the impetus for a new look at the network multiprocessor model, by removing the bottleneck of current slow networks. However, major software issues remain unsolved. A convenient machine abstraction must be developed that hides from the application programmer low-level details such as message passing or machine failures. We use distributed shared memory as a programming abstraction, and rollback recovery through consistent checkpointing to provide fault tolerance. Measurements of our implementations of distributed shared memory and consistent checkpointing show that these abstractions can be implemented efficiently.",
booktitle = "1993 {IEEE} {Compcon} Spring",
pages = "519--527",
publisher = "{IEEE}",
year = "1993",
isbn = "0780312945",
language = "English (US)",
note = "38th Annual IEEE Computer Society International Computer Conference - COMPCON SPRING '93; conference date: 22--26 February 1993",
}