1 % THIS IS A COPY, DO NOT EDIT IT!!
2 % REFER TO ORIGINAL /home/rodrigo/Dropbox/papers//bibliography.bib
3 @InProceedings
{labos2009
:viera09
,
4 address = {Estoril
, Lisbon
, Portugal
},
6 author = {Vieira
, Gustavo M. D. and Zwaenepoel
, Willy and Buzato
, Luiz E.
},
7 booktitle = {Proceedings of the
39th
{I
}nternational
{C
}onference on
8 {D
}ependable
{S
}ystems and
{N
}etworks
({DSN
})},
9 details
= {http
://infoscience.epfl.ch
/record
/135193},
10 documenturl
= {http
://infoscience.epfl.ch
/getfile.py?recid
=135193&mode
=best
},
13 location
= {Estoril
, Lisbon
, Portugal
},
14 oai
-id
= {oai
:infoscience.epfl.ch
:135193},
15 oai
-set
= {conf
; fulltext
-public
; fulltext
},
20 title = {Dynamic
{C
}ontent
{W
}eb
{A
}pplications
: {C
}rash
,
21 {F
}ailover
, and
{R
}ecovery
{A
}nalysis
},
23 url
= {http
://www.dsn.org
/},
26 @article
{Chandra
:1996:WFD
:234533.234549,
27 author = {Chandra
, Tushar D. and Hadzilacos
, Vassos and Toueg
, Sam
},
28 title = {The weakest failure detector for solving consensus
},
37 url
= {http
://doi.acm.org
/10.1145/234533.234549},
38 doi
= {http
://doi.acm.org
/10.1145/234533.234549},
41 address = {New York
, NY
, USA
},
42 keywords = {Byzantine Generals' problem
, agreement problem
, asynchronous systems
, atomic broadcast
, commit problem
, consensus problem
, crash failures
, failure detection
, fault
-tolerance
, message passing
, partial synchrony
, processor failures
},
44 @inproceedings
{Aguilera
:2001:SLE
:645958.676119,
45 author = {Aguilera
, Marcos K. and Delporte
-Gallet
, Carole and Fauconnier
, Hugues and Toueg
, Sam
},
46 title = {Stable Leader Election
},
47 booktitle = {Proceedings of the
15th International Conference on Distributed Computing
},
50 isbn
= {3-540-42605-1},
53 url
= {http
://portal.acm.org
/citation.cfm?id
=645958.676119},
55 publisher = {Springer
-Verlag
},
56 address = {London
, UK
},
58 @InProceedings
{vieira08
:_trepl
,
59 author = {Vieira
, Gustavo M. D. and Buzato
, Luiz E.
},
60 title = {Treplica
: {U
}biquitous
{R
}eplication
},
61 booktitle = {Proceedings of the
26th Brazilian Symposium on Computer Networks and Distributed Systems
},
63 @inproceedings
{Aguilera
:2007:SNP
:1294261.1294278,
64 author = {Aguilera
, Marcos K. and Merchant
, Arif and Shah
, Mehul and Veitch
, Alistair and Karamanolis
, Christos
},
65 title = {Sinfonia
: a new paradigm for building scalable distributed systems
},
66 booktitle = {Proceedings of twenty
-first ACM SIGOPS symposium on Operating systems principles
},
69 isbn
= {978-1-59593-591-5},
70 location
= {Stevenson
, Washington
, USA
},
73 url
= {http
://doi.acm.org
/10.1145/1294261.1294278},
74 doi
= {http
://doi.acm.org
/10.1145/1294261.1294278},
77 address = {New York
, NY
, USA
},
78 keywords = {distributed systems
, fault tolerance
, scalability
, shared memory
, transactions
, two
-phase commit
},
80 @article
{Lamport
:1978_clocks
,
81 author = {Lamport
, Leslie
},
82 title = {Time
, clocks
, and the ordering of events in a distributed system
},
83 journal = {Commun. ACM
},
91 url
= {http
://doi.acm.org
/10.1145/359545.359563},
92 doi
= {http
://doi.acm.org
/10.1145/359545.359563},
95 address = {New York
, NY
, USA
},
96 keywords = {clock synchronization
, computer networks
, distributed systems
, multiprocess systems
},
98 @inproceedings
{Isard
:2007:DDD
:1272996.1273005,
99 author = {Isard
, Michael and Budiu
, Mihai and Yu
, Yuan and Birrell
, Andrew and Fetterly
, Dennis
},
100 title = {Dryad
: distributed data
-parallel programs from sequential building blocks
},
101 booktitle = {Proceedings of the
2nd ACM SIGOPS
/EuroSys European Conference on Computer Systems
2007},
102 series = {EuroSys '
07},
104 isbn
= {978-1-59593-636-3},
105 location
= {Lisbon
, Portugal
},
108 url
= {http
://doi.acm.org
/10.1145/1272996.1273005},
109 doi
= {http
://doi.acm.org
/10.1145/1272996.1273005},
112 address = {New York
, NY
, USA
},
113 keywords = {cluster computing
, concurrency
, dataflow
, distributed programming
},
115 @article
{Defago
:2004,
116 author = {D\'
{e
}fago
, Xavier and Schiper
, Andr\'
{e
} and Urb\'
{a
}n
, P\'
{e
}ter
},
117 title = {Total order broadcast and multicast algorithms
: Taxonomy and survey
},
118 journal = {ACM Comput. Surv.
},
126 url
= {http
://doi.acm.org
/10.1145/1041680.1041682},
127 doi
= {http
://doi.acm.org
/10.1145/1041680.1041682},
130 address = {New York
, NY
, USA
},
131 keywords = {Distributed systems
, agreement problems
, atomic broadcast
, atomic multicast
, classification
, distributed algorithms
, fault
-tolerance
, global ordering
, group communication
, message passing
, survey
, taxonomy
, total ordering
},
133 @TechReport
{hadzilacos94
,
134 author = {Hadzilacos
, Vassos and Toueg
, Sam
},
135 title = {A modular approach to the specification and implementation of fault
-tolerant broadcasts
},
136 institution = {Department of Computer Science
, Cornell University
},
139 address = {Ithaca
, NY
},
141 @inproceedings
{Rodrigues
:2000,
142 author = {Rodrigues
, L. and Raynal
, M.
},
143 title = {Atomic Broadcast in Asynchronous Crash
-Recovery Distributed Systems
},
144 booktitle = {Proceedings of the
20th International Conference on Distributed Computing Systems
(ICDCS
2000)},
145 series = {ICDCS '
00},
147 isbn
= {0-7695-0601-1},
149 url
= {http
://portal.acm.org
/citation.cfm?id
=850927.851790},
151 publisher = {IEEE Computer Society
},
152 address = {Washington
, DC
, USA
},
153 keywords = {Distributed Algorithms
, Distributed Fault Tolerant Systems
, Communication Protocols
}
155 @article
{Chandra
:1996:UFD
:226643.226647,
156 author = {Chandra
, Tushar D. and Toueg
, Sam
},
157 title = {Unreliable failure detectors for reliable distributed systems
},
166 url
= {http
://doi.acm.org
/10.1145/226643.226647},
167 doi
= {http
://doi.acm.org
/10.1145/226643.226647},
170 address = {New York
, NY
, USA
},
171 keywords = {Byzantine Generals' problem
, agreement problem
, asynchronous systems
, atomic broadcast
, commit problem
, consensus problem
, crash failures
, failure detection
, fault
-tolerance
, message passing
, partial synchrony
, processor failures
},
173 @inproceedings
{Schroeder
:2007:DFR
:1267903.1267904,
174 author = {Schroeder
, Bianca and Gibson
, Garth A.
},
175 title = {Disk failures in the real world
: what does an MTTF of
1,000,000 hours mean to you?
},
176 booktitle = {Proceedings of the
5th USENIX conference on File and Storage Technologies
},
178 location
= {San Jose
, CA
},
181 url
= {http
://portal.acm.org
/citation.cfm?id
=1267903.1267904},
183 publisher = {USENIX Association
},
184 address = {Berkeley
, CA
, USA
},
186 @article
{Dwork
:1988:CPP
:42282.42283,
187 author = {Dwork
, Cynthia and Lynch
, Nancy and Stockmeyer
, Larry
},
188 title = {Consensus in the presence of partial synchrony
},
197 url
= {http
://doi.acm.org
/10.1145/42282.42283},
198 doi
= {http
://doi.acm.org
/10.1145/42282.42283},
201 address = {New York
, NY
, USA
},
203 @ARTICLE
{Boichat_deconstructingpaxos
,
204 author = {Boichat
, Romain and Dutta
, Partha and Fr
{\o
}lund
, Svend and Guerraoui
, Rachid
},
205 title = {Deconstructing paxos
},
206 journal = {SIGACT News
},
214 url
= {http
://doi.acm.org
/10.1145/637437.637447},
215 doi
= {http
://doi.acm.org
/10.1145/637437.637447},
218 address = {New York
, NY
, USA
},
220 @article
{Lamport
:1998:PP
:279227.279229,
221 author = {Lamport
, Leslie
},
222 title = {The part
-time parliament
},
223 journal = {ACM Trans. Comput. Syst.
},
231 url
= {http
://doi.acm.org
/10.1145/279227.279229},
232 doi
= {http
://doi.acm.org
/10.1145/279227.279229},
235 address = {New York
, NY
, USA
},
236 keywords = {state machines
, three
-phase commit
, voting
},
238 @article
{Elnozahy
:2002:SRP
:568522.568525,
239 author = {Elnozahy
, E. N.
(Mootaz
) and Alvisi
, Lorenzo and Wang
, Yi
-Min and Johnson
, David B.
},
240 title = {A survey of rollback
-recovery protocols in message
-passing systems
},
241 journal = {ACM Comput. Surv.
},
242 issue_date
= {September
2002},
250 url
= {http
://doi.acm.org
/10.1145/568522.568525},
251 doi
= {http
://doi.acm.org
/10.1145/568522.568525},
254 address = {New York
, NY
, USA
},
255 keywords = {message logging
, rollback
-recovery
},
257 @inproceedings
{Koo
:1986:CRD
:324493.325074,
258 author = {Koo
, Richard and Toueg
, Sam
},
259 title = {Checkpointing and rollback
-recovery for distributed systems
},
260 booktitle = {Proceedings of
1986 ACM Fall joint computer conference
},
263 isbn
= {0-8186-4743-4},
264 location
= {Dallas
, Texas
, United States
},
265 pages = {1150--1158},
267 url
= {http
://portal.acm.org
/citation.cfm?id
=324493.325074},
269 publisher = {IEEE Computer Society Press
},
270 address = {Los Alamitos
, CA
, USA
},
272 @article
{10.1109/CCGRID
.2010.40,
273 author = {Leonardo Arturo Bautista Gomez and Naoya Maruyama and Franck Cappello and Satoshi Matsuoka
},
274 title = {Distributed Diskless Checkpoint for Large Scale Systems
},
275 journal ={Cluster Computing and the Grid
, IEEE International Symposium on
},
277 isbn
= {978-0-7695-4039-9},
280 doi
= {http
://doi.ieeecomputersociety.org
/10.1109/CCGRID
.2010.40},
281 publisher = {IEEE Computer Society
},
282 address = {Los Alamitos
, CA
, USA
},
284 @article
{Charron
-Bost
:2007:HDF
:1233481.1233496,
285 author = {Charron
-Bost
, Bernadette and Schiper
, Andr\'
{e
}},
286 title = {Harmful dogmas in fault tolerant distributed computing
},
287 journal = {SIGACT News
},
295 url
= {http
://doi.acm.org
/10.1145/1233481.1233496},
296 doi
= {http
://doi.acm.org
/10.1145/1233481.1233496},
299 address = {New York
, NY
, USA
},
301 @inproceedings
{Camargos
:2007:MP
:1281100.1281150,
302 author = {Camargos
, L\'
{a
}saro Jonas and Schmidt
, Rodrigo Malta and Pedone
, Fernando
},
303 title = {Multicoordinated Paxos
},
304 booktitle = {Proceedings of the twenty
-sixth annual ACM symposium on Principles of distributed computing
},
307 isbn
= {978-1-59593-616-5},
308 location
= {Portland
, Oregon
, USA
},
311 url
= {http
://doi.acm.org
/10.1145/1281100.1281150},
312 doi
= {http
://doi.acm.org
/10.1145/1281100.1281150},
315 address = {New York
, NY
, USA
},
316 keywords = {Paxos
, atomic broadcast
, consensus
, generalized
, multicoordinated
},
318 @inproceedings
{Fischer
:1983:CPU
:647891.739594,
319 author = {Fischer
, Michael J.
},
320 title = {The Consensus Problem in Unreliable Distributed Systems
(A Brief Survey
)},
321 booktitle = {Proceedings of the
1983 International FCT
-Conference on Fundamentals of Computation Theory
},
323 isbn
= {3-540-12689-9},
326 url
= {http
://portal.acm.org
/citation.cfm?id
=647891.739594},
328 publisher = {Springer
-Verlag
},
329 address = {London
, UK
},
331 @article
{10.1109/SRDS
.2009.25,
332 author = {Omid Shahmirzadi and Sergio Mena and Andr\'
{e
} Schiper
},
333 title = {Relaxed Atomic Broadcast
: State
-Machine Replication Using Bounded Memory
},
334 journal ={Reliable Distributed Systems
, IEEE Symposium on
},
339 doi
= {http
://doi.ieeecomputersociety.org
/10.1109/SRDS
.2009.25},
340 publisher = {IEEE Computer Society
},
341 address = {Los Alamitos
, CA
, USA
},
343 @inproceedings
{Okun
:2002:NSR
:829526.831119,
344 author = {Okun
, Michael and Barak
, Amnon
},
345 title = {On Node State Reconstruction for Fault Tolerant Distributed Algorithms
},
346 booktitle = {Proceedings of the
21st IEEE Symposium on Reliable Distributed Systems
},
349 isbn
= {0-7695-1659-9},
351 url
= {http
://portal.acm.org
/citation.cfm?id
=829526.831119},
353 publisher = {IEEE Computer Society
},
354 address = {Washington
, DC
, USA
},
355 keywords = {Distributed algorithms
, fault tolerance
, state reconstruction
, recovery
},
357 @inproceedings
{Chandra
:2007:PML
:1281100.1281103,
358 author = {Chandra
, Tushar D. and Griesemer
, Robert and Redstone
, Joshua
},
359 title = {Paxos made live
: an engineering perspective
},
360 booktitle = {Proceedings of the twenty
-sixth annual ACM symposium on Principles of distributed computing
},
363 isbn
= {978-1-59593-616-5},
364 location
= {Portland
, Oregon
, USA
},
367 url
= {http
://doi.acm.org
/10.1145/1281100.1281103},
368 doi
= {http
://doi.acm.org
/10.1145/1281100.1281103},
371 address = {New York
, NY
, USA
},
372 keywords = {Paxos
, experiences
, fault
-tolerance
, implementation
},
374 @conference
{juang2002crash
,
375 title={{Crash recovery with little overhead
}},
376 author={Juang
, T.T.Y. and Venkatesan
, S.
},
377 booktitle={Distributed Computing Systems
, 1991.
, 11th International Conference on
},
383 @inproceedings
{Freiling
:2009:MCA
:1729641.1730101,
384 author = {Freiling
, Felix C. and Lambertz
, Christian and Majster
-Cederbaum
, Mila
},
385 title = {Modular Consensus Algorithms for the Crash
-Recovery Model
},
386 booktitle = {Proceedings of the
2009 International Conference on Parallel and Distributed Computing
, Applications and Technologies
},
387 series = {PDCAT '
09},
389 isbn
= {978-0-7695-3914-0},
392 url
= {http
://dx.doi.org
/10.1109/PDCAT
.2009.50},
393 doi
= {http
://dx.doi.org
/10.1109/PDCAT
.2009.50},
395 publisher = {IEEE Computer Society
},
396 address = {Washington
, DC
, USA
},
397 keywords = {asynchronous systems
, consensus
, fault tolerance
, process crash and recovery
, stable storage
},
399 @TechReport
{oliveira97
:consensus
,
400 author = {Oliveira
, Rui and Guerraoui
, Rachid and Schiper
, Andr\'
{e
}},
401 title = {Consensus in the crash
-recover model
},
402 institution = {Département d'Informatique
, Ecole Polytechnique Fédérale
},
405 address = {Lausanne
, Switzerland
},
407 @inproceedings
{Freiling
:2008:ECA
:1432291.1432332,
408 author = {Freiling
, Felix C. and Lambertz
, Christian and Majster
-Cederbaum
, Mila
},
409 title = {Easy Consensus Algorithms for the Crash
-Recovery Model
},
410 booktitle = {Proceedings of the
22nd international symposium on Distributed Computing
},
413 isbn
= {978-3-540-87778-3},
414 location
= {Arcachon
, France
},
417 url
= {http
://dx.doi.org
/10.1007/978-3-540-87779-0_39
},
418 doi
= {http
://dx.doi.org
/10.1007/978-3-540-87779-0_39
},
420 publisher = {Springer
-Verlag
},
421 address = {Berlin
, Heidelberg
},
423 @article
{Vieira
:2008:CRF
:1390853.1390875,
424 author = {Vieira
, Gustavo M. D. and Buzato
, Luiz E.
},
425 title = {On the coordinator's rule for Fast Paxos
},
426 journal = {Inf. Process. Lett.
},
434 url
= {http
://portal.acm.org
/citation.cfm?id
=1390853.1390875},
435 doi
= {10.1016/j.ipl
.2008.03.001},
437 publisher = {Elsevier North
-Holland
, Inc.
},
438 address = {Amsterdam
, The Netherlands
},
439 keywords = {Consensus
, Crash
-recovery
, Distributed systems
, Paxos
},
441 @article
{Schneider
:1990:IFS
:98163.98167,
442 author = {Schneider
, Fred B.
},
443 title = {Implementing fault
-tolerant services using the state machine approach
: a tutorial
},
444 journal = {ACM Comput. Surv.
},
452 url
= {http
://doi.acm.org
/10.1145/98163.98167},
453 doi
= {http
://doi.acm.org
/10.1145/98163.98167},
456 address = {New York
, NY
, USA
},
458 @article
{lamport1978implementation
,
459 title={{The implementation of reliable distributed multiprocess systems
}},
460 author={Lamport
, Leslie
},
461 journal={Computer Networks
(1976)},
469 @inproceedings
{Oki
:1988:VRN
:62546.62549,
470 author = {Oki
, Brian M. and Liskov
, Barbara H.
},
471 title = {Viewstamped Replication
: A New Primary Copy Method to Support Highly
-Available Distributed Systems
},
472 booktitle = {Proceedings of the seventh annual ACM Symposium on Principles of distributed computing
},
475 isbn
= {0-89791-277-2},
476 location
= {Toronto
, Ontario
, Canada
},
479 url
= {http
://doi.acm.org
/10.1145/62546.62549},
480 doi
= {http
://doi.acm.org
/10.1145/62546.62549},
483 address = {New York
, NY
, USA
},
485 @article
{Lamport
:1982:BGP
:357172.357176,
486 author = {Lamport
, Leslie and Shostak
, Robert and Pease
, Marshall
},
487 title = {The Byzantine Generals Problem
},
488 journal = {ACM Trans. Program. Lang. Syst.
},
489 issue_date
= {July
1982},
497 url
= {http
://doi.acm.org
/10.1145/357172.357176},
498 doi
= {http
://doi.acm.org
/10.1145/357172.357176},
501 address = {New York
, NY
, USA
},
503 @article
{Neiger
:1990:AIF
:83334.83337,
504 author = {Neiger
, Gil and Toueg
, Sam
},
505 title = {Automatically increasing the fault
-tolerance of distributed algorithms
},
506 journal = {J. Algorithms
},
514 url
= {http
://portal.acm.org
/citation.cfm?id
=83334.83337},
515 doi
= {10.1016/0196-6774(90)90019-B
},
517 publisher = {Academic Press
, Inc.
},
518 address = {Duluth
, MN
, USA
},
520 @TechReport
{vieira10
:implementing
-tr
,
521 author = {Vieira
, Gustavo M. D. and Buzato
, Luiz E.
},
522 title = {Implementation of an Object
-Oriented Specification
523 for Active Replication Using Consensus
},
524 institution = {Instituto de Computação
, Universidade Estadual de Campinas
},
528 @article
{Reynal
:2005:SIF
:1052796.1052806,
529 author = {Raynal
, Michel
},
530 title = {A short introduction to failure detectors for asynchronous distributed systems
},
531 journal = {SIGACT News
},
539 url
= {http
://doi.acm.org
/10.1145/1052796.1052806},
540 doi
= {http
://doi.acm.org
/10.1145/1052796.1052806},
543 address = {New York
, NY
, USA
},
545 @inproceedings
{Bonnet
:2010:CAD
:1825731.1826088,
546 author = {Bonnet
, Fran\c
{c
}ois and Raynal
, Michel
},
547 title = {Consensus in Anonymous Distributed Systems
: Is There a Weakest Failure Detector?
},
548 booktitle = {Proceedings of the
2010 24th IEEE International Conference on Advanced Information Networking and Applications
},
551 isbn
= {978-0-7695-4018-4},
554 url
= {http
://dx.doi.org
/10.1109/AINA
.2010.19},
555 doi
= {http
://dx.doi.org
/10.1109/AINA
.2010.19},
557 publisher = {IEEE Computer Society
},
558 address = {Washington
, DC
, USA
},
560 @inproceedings
{Gupta
:2001:SED
:383962.384010,
561 author = {Gupta
, Indranil and Chandra
, Tushar D. and Goldszmidt
, Germ\'
{a
}n S.
},
562 title = {On scalable and efficient distributed failure detectors
},
563 booktitle = {Proceedings of the twentieth annual ACM symposium on Principles of distributed computing
},
566 isbn
= {1-58113-383-9},
567 location
= {Newport
, Rhode Island
, United States
},
570 url
= {http
://doi.acm.org
/10.1145/383962.384010},
571 doi
= {http
://doi.acm.org
/10.1145/383962.384010},
574 address = {New York
, NY
, USA
},
575 keywords = {accuracy
, distributed systems
, efficiency
, failure detectors
, scalability
},
577 @inproceedings
{Xiong
:2009:SFD
:1632708.1633468,
578 author = {Xiong
, Naixue and Yang
, Yan and Cao
, Ming and He
, Jing and Shu
, Lei
},
579 title = {A Survey on Fault
-Tolerance in Distributed Network Systems
},
580 booktitle = {Proceedings of the
2009 International Conference on Computational Science and Engineering
- Volume
02},
583 isbn
= {978-0-7695-3823-5},
584 pages = {1065--1070},
586 url
= {http
://dx.doi.org
/10.1109/CSE
.2009.497},
587 doi
= {http
://dx.doi.org
/10.1109/CSE
.2009.497},
589 publisher = {IEEE Computer Society
},
590 address = {Washington
, DC
, USA
},
591 keywords = {Failure detector
, Fault
-tolerance
, Network Systems
, Quality
-of
-service
},
593 @article
{10.1109/CSE
.2009.497,
594 author = {Naixue Xiong and Yan Yang and Ming Cao and Jing He and Lei Shu
},
595 title = {A Survey on Fault
-Tolerance in Distributed Network Systems
},
596 journal ={Computational Science and Engineering
, IEEE International Conference on
},
598 isbn
= {978-0-7695-3823-5},
601 doi
= {http
://doi.ieeecomputersociety.org
/10.1109/CSE
.2009.497},
602 publisher = {IEEE Computer Society
},
603 address = {Los Alamitos
, CA
, USA
},
605 @article
{Chockler
:2001:GCS
:503112.503113,
606 author = {Chockler
, Gregory V. and Keidar
, Idit and Vitenberg
, Roman
},
607 title = {Group communication specifications
: a comprehensive study
},
608 journal = {ACM Comput. Surv.
},
609 issue_date
= {December
2001},
617 url
= {http
://doi.acm.org
/10.1145/503112.503113},
618 doi
= {http
://doi.acm.org
/10.1145/503112.503113},
621 address = {New York
, NY
, USA
},
622 keywords = {Group communication systems
, partitionable group membership
, process group membership
, specifications of group communication systems
, view synchrony
, virtual synchrony
},
624 @inproceedings
{Hurfin
:1998:CAS
:829523.830974,
625 author = {Hurfin
, Michel and Most\'
{e
}faoui
, Achour and Raynal
, Michel
},
626 title = {Consensus in Asynchronous Systems Where Processes Can Crash and Recover
},
627 booktitle = {Proceedings of the
17th IEEE Symposium on Reliable Distributed Systems
},
630 isbn
= {0-8186-9218-9},
632 url
= {http
://portal.acm.org
/citation.cfm?id
=829523.830974},
634 publisher = {IEEE Computer Society
},
635 address = {Washington
, DC
, USA
},
637 @inproceedings
{Pinheiro
:2007:FTL
:1267903.1267905,
638 author = {Pinheiro
, Eduardo and Weber
, Wolf
-Dietrich and Barroso
, Luiz Andr\'
{e
}},
639 title = {Failure trends in a large disk drive population
},
640 booktitle = {Proceedings of the
5th USENIX conference on File and Storage Technologies
},
642 location
= {San Jose
, CA
},
645 url
= {http
://portal.acm.org
/citation.cfm?id
=1267903.1267905},
647 publisher = {USENIX Association
},
648 address = {Berkeley
, CA
, USA
},
650 @ARTICLE
{gray07
:empirical
,
651 author = {{Gray
}, Jim and
{van Ingen
}, Catherine
},
652 title = "
{Empirical Measurements of Disk Failure Rates and Error Rates
}"
,
653 journal = {ArXiv Computer Science e
-prints
},
654 eprint
= {arXiv
:cs
/0701166},
655 keywords = {Computer Science
- Databases
, Computer Science
- Architecture
},
658 adsurl
= {http
://adsabs.harvard.edu
/abs
/2007cs.......
.1166G
},
660 @article
{10.1109/SRDS
.2008.9,
661 author = {Timo Warns and Christian Storm and Wilhelm Hasselbring
},
662 title = {Availability of Globally Distributed Nodes
: An Empirical Evaluation
},
663 journal ={Reliable Distributed Systems
, IEEE Symposium on
},
668 doi
= {http
://doi.ieeecomputersociety.org
/10.1109/SRDS
.2008.9},
669 publisher = {IEEE Computer Society
},
670 address = {Los Alamitos
, CA
, USA
},
672 @article
{10.1109/SRDS
.2010.17,
673 author = {Raphael Marcos Menderico and Islene Calciolari Garcia
},
674 title = {Diskless Checkpointing with Rollback
-Dependency Trackability
},
675 journal ={Reliable Distributed Systems
, IEEE Symposium on
},
680 doi
= {http
://doi.ieeecomputersociety.org
/10.1109/SRDS
.2010.17},
681 publisher = {IEEE Computer Society
},
682 address = {Los Alamitos
, CA
, USA
},
684 @article
{Chandy
:1985:DSD
:214451.214456,
685 author = {Chandy
, K. Mani and Lamport
, Leslie
},
686 title = {Distributed snapshots
: determining global states of distributed systems
},
687 journal = {ACM Trans. Comput. Syst.
},
695 url
= {http
://doi.acm.org
/10.1145/214451.214456},
696 doi
= {http
://doi.acm.org
/10.1145/214451.214456},
699 address = {New York
, NY
, USA
},
701 @article
{Randell
:1978:RIC
:356725.356729,
702 author = {Randell
, Brian and Lee
, Pete and Treleaven
, Phillip C.
},
703 title = {Reliability Issues in Computing System Design
},
704 journal = {ACM Comput. Surv.
},
712 url
= {http
://doi.acm.org
/10.1145/356725.356729},
713 doi
= {http
://doi.acm.org
/10.1145/356725.356729},
716 address = {New York
, NY
, USA
},
718 @article
{Pease
:1980:RAP
:322186.322188,
719 author = {Pease
, Marshall and Shostak
, Robert and Lamport
, Leslie
},
720 title = {Reaching Agreement in the Presence of Faults
},
729 url
= {http
://doi.acm.org
/10.1145/322186.322188},
730 doi
= {http
://doi.acm.org
/10.1145/322186.322188},
733 address = {New York
, NY
, USA
},
735 @inproceedings
{Song
:2008:BBC
:1785854.1785862,
736 author = {Song
, Yee Jiun and van Renesse
, Robbert and Schneider
, Fred B. and Dolev
, Danny
},
737 title = {The building blocks of consensus
},
738 booktitle = {Proceedings of the
9th international conference on Distributed computing and networking
},
741 isbn
= {3-540-77443-2, 978-3-540-77443-3},
742 location
= {Kolkata
, India
},
745 url
= {http
://portal.acm.org
/citation.cfm?id
=1785854.1785862},
747 publisher = {Springer
-Verlag
},
748 address = {Berlin
, Heidelberg
},
750 @TechReport
{HUS
+02/LSR
,
751 author = {Hayashibara
, Naohiro and Urbán
, Péter and Schiper
, André
752 and Katayama
, Takuya
},
753 details
= {http
://infoscience.epfl.ch
/record
/49945},
754 documenturl
= {http
://infoscience.epfl.ch
/getfile.py?recid
=49945},
755 oai
-id
= {oai
:infoscience.epfl.ch
:49945},
756 oai
-set
= {fulltext
; report
; fulltext
-public
},
757 title = {Performance
{C
}omparison
{B
}etween the
{P
}axos and
758 {C
}handra
-{T
}oueg
{C
}onsensus
{A
}lgorithms
},
761 institution = {EPFL
},
763 @inproceedings
{Burrows
:2006:CLS
:1298455.1298487,
764 author = {Burrows
, Mike
},
765 title = {The Chubby lock service for loosely
-coupled distributed systems
},
766 booktitle = {Proceedings of the
7th symposium on Operating systems design and implementation
},
769 isbn
= {1-931971-47-1},
770 location
= {Seattle
, Washington
},
773 url
= {http
://portal.acm.org
/citation.cfm?id
=1298455.1298487},
775 publisher = {USENIX Association
},
776 address = {Berkeley
, CA
, USA
},
778 @article
{Camargos
:2007:SMH
:1272998.1273036,
779 author = {Camargos
, L\'
{a
}saro and Pedone
, Fernando and Wieloch
, Marcin
},
780 title = {Sprint
: a middleware for high
-performance transaction processing
},
781 journal = {SIGOPS Oper. Syst. Rev.
},
789 url
= {http
://doi.acm.org
/10.1145/1272998.1273036},
790 doi
= {http
://doi.acm.org
/10.1145/1272998.1273036},
793 address = {New York
, NY
, USA
},
794 keywords = {middleware
, parallel databases
, partitioning
, replication
},
796 @inproceedings
{Camargos
:2007:SMH
:1272996.1273036,
797 author = {Camargos
, L\'
{a
}saro and Pedone
, Fernando and Wieloch
, Marcin
},
798 title = {Sprint
: a middleware for high
-performance transaction processing
},
799 booktitle = {Proceedings of the
2nd ACM SIGOPS
/EuroSys European Conference on Computer Systems
2007},
800 series = {EuroSys '
07},
802 isbn
= {978-1-59593-636-3},
803 location
= {Lisbon
, Portugal
},
806 url
= {http
://doi.acm.org
/10.1145/1272996.1273036},
807 doi
= {http
://doi.acm.org
/10.1145/1272996.1273036},
810 address = {New York
, NY
, USA
},
811 keywords = {middleware
, parallel databases
, partitioning
, replication
},
813 @inproceedings
{MacCormick
:2004:BAF
:1251254.1251262,
814 author = {MacCormick
, John and Murphy
, Nick and Najork
, Marc and Thekkath
, Chandramohan A. and Zhou
, Lidong
},
815 title = {Boxwood
: abstractions as the foundation for storage infrastructure
},
816 booktitle = {Proceedings of the
6th conference on Symposium on Operating Systems Design \
& Implementation
- Volume
6},
818 location
= {San Francisco
, CA
},
821 url
= {http
://portal.acm.org
/citation.cfm?id
=1251254.1251262},
823 publisher = {USENIX Association
},
824 address = {Berkeley
, CA
, USA
},
826 @inproceedings
{Saito
:2004:FBD
:1024393.1024400,
827 author = {Saito
, Yasushi and Fr
{\o
}lund
, Svend and Veitch
, Alistair and Merchant
, Arif and Spence
, Susan
},
828 title = {FAB
: building distributed enterprise disk arrays from commodity components
},
829 booktitle = {Proceedings of the
11th international conference on Architectural support for programming languages and operating systems
},
830 series = {ASPLOS
-XI
},
832 isbn
= {1-58113-804-0},
833 location
= {Boston
, MA
, USA
},
836 url
= {http
://doi.acm.org
/10.1145/1024393.1024400},
837 doi
= {http
://doi.acm.org
/10.1145/1024393.1024400},
840 address = {New York
, NY
, USA
},
841 keywords = {consensus
, disk array
, erasure coding
, replication
, storage
, voting
},
843 @article
{Saito
:2004:FBD
:1037949.1024400,
844 author = {Saito
, Yasushi and Fr
{\o
}lund
, Svend and Veitch
, Alistair and Merchant
, Arif and Spence
, Susan
},
845 title = {FAB
: building distributed enterprise disk arrays from commodity components
},
846 journal = {SIGOPS Oper. Syst. Rev.
},
854 url
= {http
://doi.acm.org
/10.1145/1037949.1024400},
855 doi
= {http
://doi.acm.org
/10.1145/1037949.1024400},
858 address = {New York
, NY
, USA
},
859 keywords = {consensus
, disk array
, erasure coding
, replication
, storage
, voting
},
861 @article
{Saito
:2004:FBD
:1037947.1024400,
862 author = {Saito
, Yasushi and Fr
{\o
}lund
, Svend and Veitch
, Alistair and Merchant
, Arif and Spence
, Susan
},
863 title = {FAB
: building distributed enterprise disk arrays from commodity components
},
864 journal = {SIGARCH Comput. Archit. News
},
872 url
= {http
://doi.acm.org
/10.1145/1037947.1024400},
873 doi
= {http
://doi.acm.org
/10.1145/1037947.1024400},
876 address = {New York
, NY
, USA
},
877 keywords = {consensus
, disk array
, erasure coding
, replication
, storage
, voting
},
879 @article
{Saito
:2004:FBD
:1037187.1024400,
880 author = {Saito
, Yasushi and Fr
{\o
}lund
, Svend and Veitch
, Alistair and Merchant
, Arif and Spence
, Susan
},
881 title = {FAB
: building distributed enterprise disk arrays from commodity components
},
882 journal = {SIGPLAN Not.
},
890 url
= {http
://doi.acm.org
/10.1145/1037187.1024400},
891 doi
= {http
://doi.acm.org
/10.1145/1037187.1024400},
894 address = {New York
, NY
, USA
},
895 keywords = {consensus
, disk array
, erasure coding
, replication
, storage
, voting
},
897 @PhdThesis
{vieira10
:thesis
,
898 author = {Vieira
, Gustavo M. D.
},
899 title = {Uma arquitetura de software para replicação baseada em consenso
},
900 school = {{U
}niversidade
{E
}stadual de
{C
}ampinas
, {I
}nstituto de
{C
}omputação
},
904 @conference
{garcia2002message
,
905 title={{Message ordering in a multicast environment
}},
906 author={Garcia
-Molina
, Hector and Spauster
, Annemarie
},
907 booktitle={Distributed Computing Systems
, 1989.
, 9th International Conference on
},
913 @article
{cristian97
:high_performance
,
914 author={Flaviu Cristian and Shivakant Mishra and Guillermo Alvarez
},
915 title={High
-performance asynchronous atomic broadcast
},
916 journal={Distributed Systems Engineering
},
920 url
={http
://stacks.iop.org
/0967-1846/4/i
=2/a
=005},
923 @inproceedings
{Gopal
:1989:RBS
:645946.675018,
924 author = {Gopal
, Ajei S. and Toueg
, Sam
},
925 title = {Reliable Broadcast in Synchronous and Asynchronous Environments
(Preliminary Version
)},
926 booktitle = {Proceedings of the
3rd International Workshop on Distributed Algorithms
},
928 isbn
= {3-540-51687-5},
931 url
= {http
://portal.acm.org
/citation.cfm?id
=645946.675018},
933 publisher = {Springer
-Verlag
},
934 address = {London
, UK
},
936 @inproceedings
{Bar
-Joseph
:2002:EDA
:645959.676132,
937 author = {Bar
-Joseph
, Ziv and Keidar
, Idit and Lynch
, Nancy
},
938 title = {Early
-Delivery Dynamic Atomic Broadcast
},
939 booktitle = {Proceedings of the
16th International Conference on Distributed Computing
},
942 isbn
= {3-540-00073-9},
945 url
= {http
://portal.acm.org
/citation.cfm?id
=645959.676132},
947 publisher = {Springer
-Verlag
},
948 address = {London
, UK
},
950 @inproceedings
{Birman
:1987:EVS
:41457.37515,
951 author = {Birman
, Kenneth and Joseph
, Thomas
},
952 title = {Exploiting virtual synchrony in distributed systems
},
953 booktitle = {Proceedings of the eleventh ACM Symposium on Operating systems principles
},
956 isbn
= {0-89791-242-X
},
957 location
= {Austin
, Texas
, United States
},
960 url
= {http
://doi.acm.org
/10.1145/41457.37515},
961 doi
= {http
://doi.acm.org
/10.1145/41457.37515},
964 address = {New York
, NY
, USA
},
966 @article
{10.1109/DOA
.1999.794001,
967 author = {Pascal Felber and Xavier Défago and Rachid Guerraoui and Philipp Oser
},
968 title = {Failure Detectors as First Class Objects
},
969 journal ={Distributed Objects and Applications
, International Symposium on
},
971 isbn
= {0-7695-0182-6},
974 doi
= {http
://doi.ieeecomputersociety.org
/10.1109/DOA
.1999.794001},
975 publisher = {IEEE Computer Society
},
976 address = {Los Alamitos
, CA
, USA
},
978 @article
{Aguilera
:2000:FDC
:1035750.1035753,
979 author = {Aguilera
, Marcos Kawazoe and Chen
, Wei and Toueg
, Sam
},
980 title = {Failure detection and consensus in the crash
-recovery model
},
981 journal = {Distrib. Comput.
},
989 url
= {http
://portal.acm.org
/citation.cfm?id
=1035750.1035753},
990 doi
= {10.1007/s004460050070
},
992 publisher = {Springer
-Verlag
},
993 address = {London
, UK
},
994 keywords = {asynchronous systems
, consensus
, failure detection
, fault tolerance
, process crash
, process recovery
, stable storage
},