forked from ketancmaheshwari/tccstorage
-
Notifications
You must be signed in to change notification settings - Fork 0
/
ref.bib
1563 lines (1425 loc) · 58.2 KB
/
ref.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
% Venue macro; referenced unquoted as a field value (e.g. booktitle = IPDPS).
@string{IPDPS = {Proceedings Int'l Parallel and Distributed Processing Symp.}}
@inproceedings{STAPL_2011,
  author    = {Gabriel Tanase and Antal Buss and Adam Fidel and Harshvardhan and
               Ioannis Papadopoulos and Olga Pearce and Timmie Smith and
               Nathan Thomas and Xiabing Xu and Nedhal Mourad and Jeremy Vu and
               Mauro Bianco and Nancy M. Amato and Lawrence Rauchwerger},
  title     = {The {STAPL} {Parallel} {Container} {Framework}},
  booktitle = {Proceedings of ACM SIGPLAN Symp. Prin. Prac. Par. Prog. (PPOPP)},
  year      = 2011
}
@inproceedings{maheshwari-lim-etal:2013,
  author    = {Maheshwari, Ketan and Lim, Marcus and Wang, Lydia and Birman, Ken and van Renesse, Robbert},
  title     = {Toward a reliable, secure and fault tolerant smart grid state estimation in the cloud},
  booktitle = {Innovative Smart Grid Technologies},
  address   = {Washington DC, USA},
  month     = feb,
  days      = {24-27},
  year      = 2013,
  publisher = {IEEE-PES}
}
@article{chirp,
  author    = {Thain, Douglas and Moretti, Christopher and Hemmes, Jeffrey},
  title     = {Chirp: a practical global filesystem for cluster and {Grid} computing},
  journal   = {Journal of Grid Computing},
  volume    = {7},
  number    = {1},
  pages     = {51--72},
  year      = {2009},
  issn      = {1570-7873},
  doi       = {10.1007/s10723-008-9100-5},
  url       = {http://dx.doi.org/10.1007/s10723-008-9100-5},
  publisher = {Springer Netherlands},
  keywords  = {Filesystem; Grid computing; Cluster computing},
  language  = {English}
}
@inproceedings{chirp-tickets-ccgrid12,
  author     = {Patrick Donnelly and Douglas Thain},
  title      = {Fine-Grained Access Control in the {Chirp} Distributed File System},
  booktitle  = {{IEEE/ACM} International Symposium on Cluster, Cloud, and Grid Computing},
  year       = 2012,
  cclpaperid = {101}
}
@inproceedings{s3-viable,
  author    = {Palankar, Mayur R. and Iamnitchi, Adriana and Ripeanu, Matei and Garfinkel, Simson},
  title     = {{Amazon} {S3} for science grids: a viable solution?},
  booktitle = {Proceedings of the 2008 International Workshop on Data-Aware Distributed Computing},
  series    = {DADC '08},
  year      = {2008},
  isbn      = {978-1-60558-154-5},
  location  = {Boston, MA, USA},
  pages     = {55--64},
  numpages  = {10},
  url       = {http://doi.acm.org/10.1145/1383519.1383526},
  doi       = {10.1145/1383519.1383526},
  acmid     = {1383526},
  publisher = {ACM},
  address   = {New York, NY, USA},
  keywords  = {amazon simple storage service, performance evaluation, utility computing},
}
@inproceedings{hdfs-main,
  author    = {Shvachko, K. and Hairong Kuang and Radia, S. and Chansler, R.},
  title     = {The {Hadoop} Distributed File System},
  booktitle = {Mass Storage Systems and Technologies (MSST), 2010 IEEE 26th Symposium on},
  year      = {2010},
  pages     = {1--10},
  keywords  = {Internet;distributed databases;network operating systems;Hadoop distributed file system;Yahoo!;data storage;data stream;enterprise data;Bandwidth;Clustering algorithms;Computer architecture;Concurrent computing;Distributed computing;Facebook;File servers;File systems;Protection;Protocols;HDFS;Hadoop;distributed file system},
  doi       = {10.1109/MSST.2010.5496972},
}
@inproceedings{hdfs-metadata,
  author    = {Mackey, G. and Sehrish, S. and Jun Wang},
  title     = {Improving metadata management for small files in {HDFS}},
  booktitle = {Cluster Computing and Workshops, 2009. CLUSTER '09. IEEE International Conference on},
  year      = {2009},
  pages     = {1--4},
  keywords  = {cache storage;data analysis;meta data;HDFS-MapReduce program;Namenode;file storage;hadoop distributed file system;large datasets analysis;metadata management;single server;Application software;Availability;Computer architecture;Computer science;Data analysis;Engineering management;File servers;File systems;Large-scale systems;Performance analysis},
  doi       = {10.1109/CLUSTR.2009.5289133},
  issn      = {1552-5244},
}
@inproceedings{hdfs-caching,
  author    = {Jing Zhang and Gongqing Wu and Xuegang Hu and Xindong Wu},
  title     = {A Distributed Cache for {Hadoop} Distributed File System in Real-Time Cloud Services},
  booktitle = {Grid Computing (GRID), 2012 ACM/IEEE 13th International Conference on},
  year      = {2012},
  pages     = {12--21},
  keywords  = {cache storage;cloud computing;disc storage;distributed databases;distributed shared memory systems;peer-to-peer computing;software libraries;table lookup;HDCache;HDFS-based distributed cache system;Hadoop distributed file system;P2P style;access layer;cache service;client library;disk;distributed hash table;distributed layered cache system;file access performance;hardware;in-memory cache;network environment;real-time cloud service;shared memory;software;Cloud computing;Data models;File systems;Libraries;Random access memory;Real-time systems;Servers;HDFS;cloud storage;distributed cache system;in-memory cloud;real-time file acces},
  doi       = {10.1109/Grid.2012.17},
  issn      = {1550-5510},
}
@article{cloudreq,
  author    = {Shamsi, Jawwad and Khojaye, Muhammad Ali and Qasmi, Mohammad Ali},
  title     = {Data-Intensive Cloud Computing: Requirements, Expectations, Challenges, and Solutions},
  journal   = {Journal of Grid Computing},
  volume    = {11},
  number    = {2},
  pages     = {281--310},
  year      = {2013},
  issn      = {1570-7873},
  doi       = {10.1007/s10723-013-9255-6},
  url       = {http://dx.doi.org/10.1007/s10723-013-9255-6},
  publisher = {Springer Netherlands},
  keywords  = {Data-intensive cloud computing; Scalability; Fault tolerance; Heterogeneity; Large scale data management; Cloud data storage},
  language  = {English}
}
@article{ADLB_2010,
  author  = {Ewing L. Lusk and Steve C. Pieper and Ralph M. Butler},
  title   = {More scalability, less pain: {A} simple programming model
             and its implementation for extreme computing},
  journal = {SciDAC Review},
  volume  = 17,
  month   = jan,
  year    = 2010,
  pages   = {30--37}
}
@inproceedings{Pipes_2009,
  author    = {Edward Walker and Weijia Xu and Vinoth Chandar},
  title     = {Composing and Executing Parallel Data-flow Graphs with Shell Pipes},
  booktitle = {Work. on Workflows in Support of Large-Scale Science at SC'09},
  year      = 2009,
}
@article{Swift_2009,
  author  = {Wilde, M. and Foster, I. and Iskra, K. and Beckman, P. and
             Zhao Zhang and Espinosa, A. and Hategan, M. and
             Clifford, B. and Raicu, I.},
  title   = {Parallel Scripting for Applications at the Petascale and Beyond},
  journal = {Computer},
  volume  = {42},
  number  = {11},
  pages   = {50--60},
  year    = {2009}
}
@article{Swift_2010,
  author  = {Peter Beckman and Ian Foster and Michael Wilde and Ioan Raicu},
  title   = {{SWIFT}: {S}calable Parallel Scripting for Scientific Computing},
  journal = {{SciDAC} Review},
  number  = 17,
  year    = 2010
}
@article{rebalance,
  author   = {Hsiao, Hung-Chang and Chung, Hsueh-Yi and Shen, Haiying and Chao, Yu-Chang},
  title    = {Load Rebalancing for Distributed File Systems in Clouds},
  journal  = {Parallel and Distributed Systems, IEEE Transactions on},
  volume   = {24},
  number   = {5},
  pages    = {951--962},
  year     = {2013},
  keywords = {Algorithm design and analysis;Cloud computing;Clustering algorithms;Heuristic algorithms;Load management;Proposals;Vectors;Load balance;clouds;distributed file systems},
  doi      = {10.1109/TPDS.2012.196},
  issn     = {1045-9219},
}
% Pre-publication record of the same paper as the Swift_2011 entry; the key is
% retained so existing citations keep resolving.
@article{Swift_2011_old,
  author  = {Michael Wilde and Mihael Hategan and Justin M. Wozniak
             and Ben Clifford and Daniel S. Katz and Ian Foster},
  title   = {Swift: {A} language for distributed parallel scripting},
  journal = {Parallel Computing},
  year    = 2011,
  note    = {To appear}
}
@article{Swift_2011,
  author  = {Michael Wilde and Mihael Hategan and Justin M. Wozniak and Ben Clifford and Daniel S. Katz and Ian Foster},
  title   = {Swift: A language for distributed parallel scripting},
  journal = {Parallel Computing},
  volume  = {37},
  number  = {9},
  pages   = {633--652},
  year    = {2011},
}
@inproceedings{cloud-dataintensive,
  author    = {Kolodner, E.K. and Tal, S. and Kyriazis, D. and Naor, D. and Allalouf, M. and Bonelli, L. and Brand, P. and Eckert, A. and Elmroth, E. and Gogouvitis, S.V. and Harnik, D. and Hernandez, F. and Jaeger, M.C. and Lakew, E.B. and Lopez, J.M. and Lorenz, M. and Messina, A. and Shulman-Peleg, A. and Talyansky, R. and Voulodimos, A. and Wolfsthal, Y.},
  title     = {A Cloud Environment for Data-intensive Storage Services},
  booktitle = {Cloud Computing Technology and Science (CloudCom), 2011 IEEE Third International Conference on},
  year      = {2011},
  pages     = {357--366},
  keywords  = {Web services;cloud computing;quality of service;security of data;smart phones;social networking (online);Internet-scale services;QoS;abstraction level;cloud storage;content-centric access;data mobility;data-intensive storage cloud services;data-oriented mechanisms;fault tolerance;flexible cloud environment;healthcare;live migration;media domains;quality of service;real-life application scenarios;rich digital environment;scalable cloud environment;security guarantees;sensors;smart phones;social networks;user generated content;Cloud computing;Computational modeling;Computer architecture;Containers;Data models;Monitoring;Security;Cloud computing;Data-intensive services;Storage},
  doi       = {10.1109/CloudCom.2011.55},
}
@inproceedings{ParallelPatterns_2010,
  author    = {Michael D. McCool},
  title     = {Structured Parallel Programming with Deterministic Patterns},
  booktitle = {Proc. HotPar},
  year      = 2010
}
@inproceedings{Skywriting,
  author    = {Murray, Derek G. and Hand, Steven},
  title     = {Scripting the cloud with {Skywriting}},
  booktitle = {HotCloud '10: Proc. of 2nd USENIX Work. on Hot Topics in Cloud Computing},
  address   = {Boston, MA, USA},
  month     = jun,
  year      = {2010},
  publisher = {USENIX},
  keywords  = {cloud, programming, script},
  abstract  = {{Recent distributed computing frameworks--such as MapReduce, Hadoop and Dryad--have made it simple to exploit multiple machines in a compute cloud. However, these frameworks use coordination languages that are insufficiently expressive for many classes of computation, including iterative and recursive algorithms. To address this problem, and generalise previous approaches, we introduce Skywriting: a Turing-powerful, purely-functional script language for describing distributed computations. In this paper, we introduce the main features of Skywriting, and outline our novel cooperative task farming execution engine.}},
  citeulike-article-id = {7531226},
  citeulike-linkout-0 = {http://www.usenix.org/event/hotcloud10/tech/full\_papers/Murray.pdf},
  citeulike-linkout-1 = {http://www.cl.cam.ac.uk/\~{}dgm36/publications/2010-murray2010skywriting.pdf},
  citeulike-linkout-2 = {http://www.usenix.org/event/hotcloud10/tech/},
  posted-at = {2010-12-10 11:51:32},
  priority  = {0}
}
%% location = {Boston, MA, USA},
% Conference paper: the venue belongs in booktitle, which an article entry
% does not print.
@inproceedings{scioto,
  author    = {James Dinan and Sriram Krishnamoorthy and D. Brian Larkins and Jarek Nieplocha and P. Sadayappan},
  title     = {Scioto: A Framework for Global-View Task Parallelism},
  booktitle = {Int'l Conf. on Parallel Processing},
  year      = {2008},
  pages     = {586--593},
  publisher = {IEEE Computer Society},
  address   = {Los Alamitos, CA, USA},
}
% NOTE(review): describes the same CACM article as the MapReduce_2004 entry
% later in this file; both keys are kept so existing citations keep resolving.
@article{mapreduce,
  author     = {Dean, Jeffrey and Ghemawat, Sanjay},
  title      = {{MapReduce}: {S}implified data processing on large clusters},
  journal    = {Commun. ACM},
  issue_date = {January 2008},
  volume     = {51},
  number     = {1},
  month      = jan,
  year       = {2008},
  issn       = {0001-0782},
  pages      = {107--113},
  numpages   = {7},
  doi        = {10.1145/1327452.1327492},
  acmid      = {1327492},
  publisher  = {ACM},
  address    = {New York, NY, USA},
}
@article{dryad,
  author     = {Isard, Michael and Budiu, Mihai and Yu, Yuan and Birrell, Andrew and Fetterly, Dennis},
  title      = {Dryad: {D}istributed data-parallel programs from sequential
                building blocks},
  journal    = {SIGOPS Oper. Syst. Rev.},
  issue_date = {June 2007},
  volume     = {41},
  number     = {3},
  month      = mar,
  year       = {2007},
  issn       = {0163-5980},
  pages      = {59--72},
  numpages   = {14},
  doi        = {10.1145/1272998.1273005},
  acmid      = {1273005},
  publisher  = {ACM},
  address    = {New York, NY, USA},
  keywords   = {cluster computing, concurrency, dataflow, distributed programming},
}
@inproceedings{DryadLINQ,
  author    = {Yuan Yu and Michael Isard and Dennis Fetterly and Mihai Budiu and Ulfar Erlingsson and Pradeep Kumar Gunda and Jon Currey},
  title     = {{DryadLINQ}: A System for General-Purpose Distributed Data-Parallel Computing Using a High-Level Language},
  booktitle = {Proc. of Symp. on Operating System Design and Implementation (OSDI)},
  month     = dec,
  year      = {2008}
}
@misc{Exascale_Software_2009,
  author       = {Sarkar, V. and others},
  title        = {{ExaScale} Software Study: {S}oftware Challenges in Extreme
                  Scale Systems},
  howpublished = {DARPA Report},
  year         = 2009,
}
@article{CoG_2001,
  author  = {Gregor von Laszewski and Ian Foster and Jarek Gawor and Peter Lane},
  title   = {A {J}ava {C}ommodity {G}rid {K}it},
  journal = {Concurrency and Computation: {Practice} and Experience},
  year    = {2001},
  volume  = {13},
  number  = {8--9},
  comment = {vonLaszewski-final.bib},
}
@inproceedings{CIEL_2011,
  author    = {Derek G. Murray and Malte Schwarzkopf and Christopher Smowton and
               Steven Smith and Anil Madhavapeddy and Steven Hand},
  title     = {{CIEL}: a universal execution engine for distributed data-flow computing},
  booktitle = {Proc. NSDI 2011},
  year      = 2011,
}
% Boston, MA, March 2011
@inproceedings{DAGuE_2011,
  author    = {Bosilca, G. and Bouteiller, A. and Danalis, A. and
               Herault, T. and Lemarinier, P. and Dongarra, J.},
  title     = {{DAGuE}: {A} generic distributed {DAG} engine for high performance computing},
  booktitle = IPDPS,
  year      = 2011,
}
@article{LINDA,
  author  = {S. Ahuja and N. Carriero and D. Gelernter},
  title   = {{Linda} and friends},
  journal = {{IEEE} Computer},
  volume  = {19},
  number  = {8},
  year    = 1986,
  pages   = {26--34}
}
@mastersthesis{armstrong-pydflow-11,
  author = {Timothy G. Armstrong},
  title  = {Integrating Task Parallelism into the {Python} Programming Language},
  school = {The University of Chicago},
  year   = {2011},
  month  = may,
  url    = {http://people.cs.uchicago.edu/~tga/pubs/armstrong-masters.pdf},
}
% Web resource with no author; the key field supplies the sort/label text.
% The note needs \url to be defined by the document (e.g. url or hyperref).
@misc{SwiftR_web,
  title = {{SwiftR: a parallel and distributed computing package for R}},
  key   = {{SwiftR: a parallel and distributed computing package for R}},
  note  = {\url{http://people.cs.uchicago.edu/~tga/swiftR/}}
}
% Web resource with no author; the key field supplies the sort/label text.
% The note needs \url to be defined by the document (e.g. url or hyperref).
@misc{SwiftR_wiki,
  title = {{User info for SwiftR: a parallel and distributed computing package for R}},
  key   = {{User info for SwiftR: a parallel and distributed computing package for R}},
  note  = {\url{http://www.ci.uchicago.edu/wiki/bin/view/SWFT/SwiftR}}
}
@article{PCN,
  author    = {Foster, Ian and Olson, Robert and Tuecke, Steven},
  title     = {Productive Parallel Programming: The {PCN} Approach},
  journal   = {Sci. Program.},
  volume    = {1},
  number    = {1},
  month     = jan,
  year      = {1992},
  issn      = {1058-9244},
  pages     = {51--66},
  numpages  = {16},
  acmid     = {1402587},
  publisher = {IOS Press},
  address   = {Amsterdam, The Netherlands},
}
@article{CCA,
  sortkey   = {Allan, B. A.},
  author    = {Allan, B. A. and Armstrong, R. and others},
  title     = {A Component Architecture for High-Performance Scientific Computing},
  journal   = {Int'l J. High Perform. Comput. Appl.},
  volume    = {20},
  number    = {2},
  month     = may,
  year      = {2006},
  issn      = {1094-3420},
  pages     = {163--202},
  numpages  = {40},
  doi       = {10.1177/1094342006064488},
  acmid     = {1125983},
  publisher = {Sage Publications, Inc.},
  address   = {Thousand Oaks, CA, USA},
  keywords  = {climate modeling, combustion modeling, component architecture, parallel computing, quantum chemistry},
}
% The note needs \url to be defined by the document (e.g. url or hyperref).
@misc{corba,
  author = {{Object Management Group}},
  title  = {{CORBA} component model},
  year   = {2002},
  note   = {\url{http://www.omg.org/technology/documents/formal/components.htm}}
}
@inproceedings{comet,
  author    = {Zhen Li and M. Parashar},
  title     = {Comet: {A} scalable coordination space for decentralized distributed environments},
  booktitle = {2nd Int'l Work. on Hot Topics in Peer-to-Peer Systems, HOT-P2P 2005},
  pages     = {104--111},
  year      = {2005}
}
% NOTE(review): despite the 2004 in the key, the fields describe the 2008 CACM
% article, the same work as the mapreduce entry earlier in this file.
@article{MapReduce_2004,
  author    = {Dean, Jeffrey and Ghemawat, Sanjay},
  title     = {{MapReduce}: simplified data processing on large clusters},
  journal   = {Commun. ACM},
  volume    = {51},
  number    = {1},
  month     = jan,
  year      = {2008},
  issn      = {0001-0782},
  pages     = {107--113},
  numpages  = {7},
  doi       = {10.1145/1327452.1327492},
  acmid     = {1327492},
  publisher = {ACM},
  address   = {New York, NY, USA},
}
@article{Sawzall_2005,
  author    = {Pike, R. and Dorward, S. and Griesemer, R. and Quinlan, S.},
  title     = {Interpreting the data: {P}arallel analysis with {Sawzall}},
  journal   = {Scientific Programming},
  volume    = {13},
  number    = {4},
  pages     = {277--298},
  year      = 2005,
  publisher = {IOS Press}
}
@inproceedings{Futures,
  author    = {Baker, Jr., Henry C. and Hewitt, Carl},
  title     = {The incremental garbage collection of processes},
  booktitle = {Proc. of 1977 Symp. on Artificial Intelligence and Programming Languages},
  year      = {1977},
  pages     = {55--59},
  numpages  = {5},
  doi       = {10.1145/800228.806932},
  acmid     = {806932},
  publisher = {ACM},
  address   = {New York},
  keywords  = {Eager evaluation, Garbage collection, Lazy evaluation, Multiprocessing systems, Processor scheduling},
}
@inproceedings{Falkon_2008,
  author    = {Raicu, Ioan and Zhang, Zhao and Wilde, Mike and Foster, Ian and
               Beckman, Pete and Iskra, Kamil and Clifford, Ben},
  title     = {Toward loosely coupled programming on petascale systems},
  booktitle = {Proc. of 2008 ACM/IEEE Conf. on Supercomputing},
  series    = {SC '08},
  year      = {2008},
  location  = {Austin, Texas},
  pages     = {22:1--22:12},
  articleno = {22},
  numpages  = {12},
  acmid     = {1413393},
  publisher = {IEEE Press},
  address   = {Piscataway, NJ},
  keywords  = {Blue Gene, Falkon, Swift, high throughput computing, loosely coupled applications, many task computing, petascale},
}
@techreport{Spark_2010,
  author      = {Zaharia, Matei and Chowdhury, N. M. Mosharaf and Franklin, Michael and Shenker, Scott and Stoica, Ion},
  title       = {Spark: Cluster Computing with Working Sets},
  institution = {EECS Department, University of California, Berkeley},
  number      = {UCB/EECS-2010-53},
  month       = may,
  year        = {2010},
  url         = {http://www.eecs.berkeley.edu/Pubs/TechRpts/2010/EECS-2010-53.html},
  abstract    = {MapReduce and its variants have been highly successful in implementing large-scale data intensive applications on clusters of unreliable machines. However, most of these systems are built around an acyclic data flow programming model that is not suitable for other popular applications. In this paper, we focus on one such class of applications: those that reuse a working set of data across multiple parallel operations. This includes many iterative machine learning algorithms, as well as interactive data analysis environments. We propose a new framework called Spark that supports these applications while maintaining the scalability and fault-tolerance properties of MapReduce. To achieve these goals, Spark introduces a data abstraction called resilient distributed datasets (RDDs). An RDD is a read-only collection of objects partitioned across a set of machines that can be rebuilt if a partition is lost. Spark can outperform Hadoop by 10x in iterative machine learning jobs, and can be used to interactively query a 39 GB dataset with sub-second response time.}
}
@inproceedings{Lithe_2009,
  author      = {Heidi Pan and Benjamin Hindman and Krste Asanovi{\'c}},
  title       = {Lithe: Enabling Efficient Composition of Parallel Libraries},
  booktitle   = {Proc. of 1st USENIX Conf. on Hot Topics in Parallelism},
  series      = {HotPar'09},
  year        = 2009,
  pages       = 6,
  numpages    = {1},
  publisher   = {USENIX Association},
  address     = {Berkeley, CA, USA},
  location    = {Berkeley, California},
  url         = {http://portal.acm.org/citation.cfm?id=1855591.1855602},
  acmid       = {1855602},
  keywords    = {Scheduling Threads},
  description = {Lithe},
  interhash   = {b7fed0316b1a8568cf2b0b40aa415d4c},
  intrahash   = {783d4567cb6b3bf266d0674a5195f626},
  biburl      = {http://www.bibsonomy.org/bibtex/2783d4567cb6b3bf266d0674a5195f626/gron},
  timestamp   = {2011-08-10T21:46:42.000+0200},
  added-at    = {2011-08-10T21:46:42.000+0200},
  abstract    = {For the software industry to take advantage of multicore processors, we must allow programmers to arbitrarily compose parallel libraries without sacrificing performance. We argue that high-level task or thread abstractions and a common global scheduler cannot provide effective library composition. Instead, the operating system should expose unvirtualized processing resources that can be shared cooperatively between parallel libraries within an application. In this paper, we describe a system that standardizes and facilitates the exchange of these unvirtualized processing resources between libraries.}
}
@article{Make_1979,
  author  = {Stuart I. Feldman},
  title   = {Make - A Program for Maintaining Computer Programs},
  journal = {Software: Practice and Experience},
  year    = {1979},
  volume  = 9,
  pages   = {255--265},
}
@misc{E3_2007,
  author = {Horst Simon and Thomas Zacharia and Rick Stevens},
  title  = {Modeling and Simulation at the Exascale for Energy and the Environment},
  note   = {Report on the Advanced Scientific Computing Research Town Hall
            Meetings on Simulation and Modeling at the Exascale for Energy,
            Ecological Sustainability and Global Security ({E3})},
  year   = 2007
}
@misc{Exascale_Architecture_2009,
  author = {Rick Stevens and Andrew White},
  title  = {Architectures and technology for extreme scale computing},
  note   = {U.S. Dept. of Energy report},
  year   = 2009
}
@misc{Exascale_Technology_slides_2010,
  author = {John Shalf},
  title  = {Exascale Computing Technology Challenges},
  note   = {{ScicomP / SP-XXL 16}},
  year   = 2010
}
@misc{Exascale_Technology_2010,
  author       = {John Shalf and J. Morrison and S. Dosanjh},
  title        = {Exascale Computing Technology Challenges},
  howpublished = {VECPAR'2010},
  year         = 2010,
  pages        = {1--25}
}
@misc{ASCAC_Report_2010,
  author = {{ASCAC Subcommittee on Exascale Computing}},
  title  = {The Opportunities and Challenges of Exascale Computing},
  note   = {{U.S. Dept. of Energy report}},
  year   = 2010
}
@article{Workflow_Opportunistic_2006,
  author    = {Ewa Deelman and Tevfik Kosar and Carl Kesselman and Miron Livny},
  title     = {What makes workflows work in an opportunistic environment?},
  journal   = {Concurrency and Computation: Practice and Experience},
  year      = {2006},
  volume    = {18},
  number    = {10},
  pages     = {1187--1199},
  timestamp = {2007.07.05}
}
@article{Charles_2005,
  author     = {Charles, Philippe and Grothoff, Christian and Saraswat, Vijay and
                Donawa, Christopher and Kielstra, Allan and Ebcioglu, Kemal and
                von Praun, Christoph and Sarkar, Vivek},
  title      = {X10: {A}n object-oriented approach to non-uniform cluster
                computing},
  journal    = {SIGPLAN Not.},
  issue_date = {October 2005},
  volume     = {40},
  number     = {10},
  month      = oct,
  year       = {2005},
  issn       = {0362-1340},
  pages      = {519--538},
  numpages   = {20},
  doi        = {10.1145/1103845.1094852},
  acmid      = {1094852},
  publisher  = {ACM},
  address    = {New York, NY, USA},
  keywords   = {Java, X10, atomic blocks, clocks, data distribution, multithreading, non-uniform cluster computing (NUCC), partitioned global address space (PGAS), places, productivity, scalability},
}
@techreport{Allen_2008,
  author      = {Allen, Eric and Chase, David and Hallett, Joe and Luchangco, Victor and Maessen, Jan-Willem and Ryu, Sukyoung and Steele, Jr., Guy L. and Tobin-Hochstadt, Sam},
  title       = {The {Fortress} Language Specification},
  institution = {Sun Microsystems, Inc.},
  year        = 2008,
  url         = {http://labs.oracle.com/projects/plrg/Publications/fortress.1.0.pdf}
}
@article{Chamberlain_2007,
  author  = {Chamberlain, B. L. and Callahan, D. and Zima, H. P.},
  title   = {Parallel Programmability and the {Chapel} Language},
  journal = {Int'l J. High Perform. Comput. Appl.},
  volume  = {21},
  number  = {3},
  pages   = {291--312},
  year    = {2007},
  doi     = {10.1177/1094342007078442},
  eprint  = {http://hpc.sagepub.com/content/21/3/291.full.pdf+html}
}
@techreport{Shet_2008,
  author      = {Shet, Aniruddha G and Elwasif, Wael R and Harrison, Robert J and Bernholdt, David E},
  title       = {Programmability of the {HPCS} Languages: A Case Study with a Quantum Chemistry Kernel (Extended Version)},
  institution = {Oak Ridge National Laboratory},
  number      = {ORNL/TM-2008/011},
  year        = {2008},
  url         = {http://www.osti.gov/bridge/servlets/purl/931141-V8yRh4/},
}
@article{DeCandia_2007,
  author     = {DeCandia, Giuseppe and Hastorun, Deniz and Jampani, Madan and Kakulapati, Gunavardhan and Lakshman, Avinash and Pilchin, Alex and Sivasubramanian, Swaminathan and Vosshall, Peter and Vogels, Werner},
  title      = {Dynamo: {Amazon's} highly available key-value store},
  journal    = {SIGOPS Oper. Syst. Rev.},
  issue_date = {December 2007},
  volume     = {41},
  number     = {6},
  month      = oct,
  year       = {2007},
  issn       = {0163-5980},
  pages      = {205--220},
  numpages   = {16},
  doi        = {10.1145/1323293.1294281},
  acmid      = {1294281},
  publisher  = {ACM},
  address    = {New York, NY, USA},
  keywords   = {performance, reliability, scalability},
}
@article{memcached_2004,
  author     = {Fitzpatrick, Brad},
  title      = {Distributed caching with memcached},
  journal    = {Linux J.},
  issue_date = {August 2004},
  volume     = {2004},
  number     = {124},
  month      = aug,
  year       = {2004},
  issn       = {1075-3583},
  pages      = {5--},
  acmid      = {1012894},
  publisher  = {Belltown Media},
  address    = {Houston, TX},
}
% The note needs \url to be defined by the document (e.g. url or hyperref).
@misc{redis_web,
  author = {Salvatore Sanfilippo and Pieter Noordhuis},
  title  = {Redis},
  key    = {redis_web},
  note   = {\url{http://redis.io/}},
}
@article{Lakshman_2010,
  author    = {Lakshman, Avinash and Malik, Prashant},
  title     = {Cassandra: a decentralized structured storage system},
  journal   = {SIGOPS Oper. Syst. Rev.},
  volume    = {44},
  number    = {2},
  month     = apr,
  year      = {2010},
  issn      = {0163-5980},
  pages     = {35--40},
  numpages  = {6},
  doi       = {10.1145/1773912.1773922},
  acmid     = {1773922},
  publisher = {ACM},
  address   = {New York, NY, USA},
}
@inproceedings{Ekanayake_2010,
  author    = {Ekanayake, Jaliya and Li, Hui and Zhang, Bingjing and Gunarathne, Thilina and Bae, Seung-Hee and Qiu, Judy and Fox, Geoffrey},
  title     = {Twister: {A} runtime for iterative {MapReduce}},
  booktitle = {Proc. of 19th ACM Int'l Symp. on High Performance Distributed Computing},
  series    = {HPDC '10},
  year      = {2010},
  isbn      = {978-1-60558-942-8},
  location  = {Chicago, Illinois},
  pages     = {810--818},
  numpages  = {9},
  doi       = {10.1145/1851476.1851593},
  acmid     = {1851593},
  publisher = {ACM},
  keywords  = {MapReduce, cloud technologies, iterative algorithms},
  address   = {New York},
}
@inproceedings{PigLatin,
  author    = {Olston, Christopher and Reed, Benjamin and Srivastava, Utkarsh and
               Kumar, Ravi and Tomkins, Andrew},
  title     = {Pig {L}atin: {A} not-so-foreign language for data processing},
  booktitle = {Proc. of 2008 ACM SIGMOD Int'l Conf. on Management of Data},
  series    = {SIGMOD '08},
  year      = {2008},
  isbn      = {978-1-60558-102-6},
  location  = {Vancouver, Canada},
  pages     = {1099--1110},
  numpages  = {12},
  doi       = {10.1145/1376616.1376726},
  acmid     = {1376726},
  publisher = {ACM},
  address   = {New York},
  keywords  = {dataflow language, pig latin},
}
@article{Hive,
  author     = {Thusoo, Ashish and Sarma, Joydeep Sen and Jain, Namit and Shao, Zheng and Chakka, Prasad and Anthony, Suresh and Liu, Hao and Wyckoff, Pete and Murthy, Raghotham},
  title      = {Hive: a warehousing solution over a map-reduce framework},
  journal    = {Proc. VLDB Endow.},
  issue_date = {August 2009},
  volume     = {2},
  number     = {2},
  month      = aug,
  year       = {2009},
  issn       = {2150-8097},
  pages      = {1626--1629},
  numpages   = {4},
  url        = {http://dl.acm.org/citation.cfm?id=1687553.1687609},
  acmid      = {1687609},
  publisher  = {VLDB Endowment},
}
@inproceedings{Blumofe_1997,
  author    = {Blumofe, Robert D. and Lisiecki, Philip A.},
  title     = {Adaptive and reliable parallel computing on networks of workstations},
  booktitle = {Proc. of Annual Conf. on USENIX},
  year      = {1997},
  pages     = {10},
  numpages  = {1},
  location  = {Anaheim, California},
  publisher = {USENIX Association},
  address   = {Berkeley, CA, USA},
  url       = {http://dl.acm.org/citation.cfm?id=1268680.1268690},
  acmid     = {1268690},
}
@inproceedings{Coasters_UCC_2011,
  author    = {Mihael Hategan and Justin Wozniak and Ketan Maheshwari},
  title     = {Coasters: uniform resource provisioning and access for scientific computing on clouds and grids},
  booktitle = {Proceedings of Utility and Cloud Computing},
  year      = 2011
}
@inproceedings{Delirium_1990,
  author    = {Lucco, Steven and Sharp, Oliver},
  title     = {Delirium: an embedding coordination language},
  booktitle = {Proceedings of the 1990 ACM/IEEE conference on Supercomputing},
  series    = {Supercomputing '90},
  year      = {1990},
  pages     = {515--524},
  numpages  = {10},
  isbn      = {0-89791-412-0},
  location  = {New York, New York, United States},
  publisher = {IEEE Computer Society Press},
  address   = {Los Alamitos, CA, USA},
  url       = {http://dl.acm.org/citation.cfm?id=110382.110582},
  acmid     = {110582},
}
% Codelet program execution model for exascale machines (2011 workshop paper).
@inproceedings{Zuckerman_2011,
  title     = {Using a ``codelet'' program execution model for exascale machines},
  author    = {Zuckerman, St{\'e}phane and
               Suetterlein, Joshua and
               Knauerhase, Rob and
               Gao, Guang R.},
  booktitle = {Workshop Adaptive Self-Tuning Comp. Syst. for the Exaflop Era, 2011},
  pages     = {64--69},
  year      = {2011},
  publisher = {ACM},
  address   = {New York},
  doi       = {10.1145/2000417.2000424},
  isbn      = {978-1-4503-0708-6},
  location  = {San Jose, California},
  numpages  = {6},
  acmid     = {2000424},
  keywords  = {dataflow, exascale, manycore, program execution model},
}
% Turbine data flow engine paper, SWEET workshop 2012.
@inproceedings{Turbine_2012,
  author    = {Wozniak, Justin M. and
               Armstrong, Timothy G. and
               Maheshwari, Ketan and
               Lusk, Ewing L. and
               Katz, Daniel S. and
               Wilde, Michael and
               Foster, Ian T.},
  title     = {Turbine: A distributed memory data flow engine for many-task applications},
  booktitle = {Int'l Workshop Scalable Workflow Enactment Engines and Technologies (SWEET) 2012},
  year      = {2012},
}
% ExM dataflow programming paper, HotPar'12.
% LONGbooktitle is not a standard field name, so standard styles ignore it;
% it keeps the long venue name next to the short `booktitle` that is printed.
@inproceedings{ExM_2012,
  author        = {Armstrong, Timothy G. and
                   Wozniak, Justin M. and
                   Wilde, Michael and
                   Maheshwari, Ketan and
                   Katz, Daniel S. and
                   Ripeanu, Matei and
                   Lusk, Ewing L. and
                   Foster, Ian T.},
  title         = {{ExM}: High level dataflow programming for extreme-scale systems},
  booktitle     = {Workshop Hot Topics in Parallelism: HotPar'12},
  LONGbooktitle = {4th {USENIX} Workshop Hot Topics in Parallel Computing: HotPar'12},
  year          = {2012},
}
% SWIG paper by Beazley, USENIX Tcl/Tk Workshop (1996).
% The booktitle previously carried export residue ("Conference on ... Workshop,
% 1996 - Volume 4"); the year lives in `year` and the venue is named once.
% NOTE(review): confirm the venue name against the USENIX proceedings.
@inproceedings{Beazley_1996,
  author    = {Beazley, David M.},
  title     = {{SWIG}: an easy to use tool for integrating scripting languages with {C} and {C++}},
  booktitle = {Proc. 4th {USENIX} {Tcl/Tk} Workshop},
  year      = {1996},
  publisher = {USENIX Association},
  address   = {Berkeley, CA, USA},
  location  = {Monterey, California},
  acmid     = {1267513},
}
% Scott, Programming Language Pragmatics, third edition (2009).
% The edition is recorded only in `edition` (as an ordinal word, which classic
% styles expect) so it is not printed twice alongside the title.
@book{Scott_2009,
  author    = {Scott, Michael L.},
  title     = {Programming Language Pragmatics},
  edition   = {Third},
  year      = {2009},
  publisher = {Morgan Kaufmann Publishers Inc.},
  address   = {San Francisco, CA, USA},
  isbn      = {0123745144, 9780123745149},
}
% Aho, Lam, Sethi and Ullman, Compilers, second edition (2006).
% The edition is stored in `edition` instead of being hard-coded in the title,
% so the bibliography style decides how to print it.
@book{Aho_2006,
  author    = {Aho, Alfred V. and Lam, Monica S. and Sethi, Ravi and
               Ullman, Jeffrey D.},
  title     = {Compilers: Principles, Techniques, and Tools},
  edition   = {Second},
  year      = {2006},
  publisher = {Addison-Wesley Longman Publishing Co.},
  address   = {Boston, MA},
  isbn      = {0321486811},
}
% Deterministic-by-default parallel programming position paper, HotPar'09.
% The first author uses the "Last, Jr, First" name form so that "Jr." is parsed
% as a suffix instead of being braced into the surname.
@inproceedings{Bocchino_2009,
  author    = {Bocchino, Jr., Robert L. and Adve, Vikram S. and
               Adve, Sarita V. and Snir, Marc},
  title     = {Parallel programming must be deterministic by default},
  booktitle = {Workshop Hot Topics in Parallelism: HotPar'09},
  year      = {2009},
  publisher = {USENIX Association},
  address   = {Berkeley, CA},
  location  = {Berkeley, California},
  acmid     = {1855595},
}
% Report on the Sisal language project, J. Parallel and Distributed Computing 10(4), 1990.
% The page range uses a double hyphen with no surrounding spaces so that it
% is typeset as an en dash.
@article{Feo_90,
  author  = {John T. Feo and David C. Cann and Rodney R. Oldehoeft},
  title   = {A Report on the {Sisal} Language Project},
  journal = {J. Parallel and Distributed Computing},
  volume  = {10},
  number  = {4},
  pages   = {349--366},
  year    = {1990},
  issn    = {0743-7315},
  doi     = {10.1016/0743-7315(90)90035-N},
}
% Traub, compiler for the MIT tagged-token dataflow architecture (1986 report).
% The stray period after the given name "Kenneth" has been removed.
@techreport{Traub_86,
  author      = {Traub, Kenneth R.},
  title       = {A Compiler for the {MIT} tagged-token dataflow architecture},
  institution = {Massachusetts Institute of Technology},
  address     = {Cambridge, MA},
  year        = {1986},
}
% Mahajan, Leyffer and Kirches, QP-Diving preprint (Argonne, 2012).
% Entered as a technical report so that the institution and the preprint number
% are printed; the standard styles ignore `institution` on a misc entry.
@techreport{Mahajan_12,
  author      = {Ashutosh Mahajan and Sven Leyffer and Christian Kirches},
  title       = {Solving Mixed-Integer Nonlinear Programs by {QP-Diving}},
  type        = {Preprint},
  number      = {ANL/MCS-P2071-0312},
  institution = {Argonne National Laboratory},
  month       = mar,
  year        = {2012},
}
% Kirkpatrick, Gelatt and Vecchi, simulated annealing, Science 220(4598), 1983.
% The page range uses a double hyphen so that it is typeset as an en dash.
@article{SimAnneal,
  author  = {Kirkpatrick, S. and Gelatt, C. D. and Vecchi, M. P.},
  title   = {Optimization by Simulated Annealing},
  journal = {Science},
  volume  = {220},
  number  = {4598},
  pages   = {671--680},
  year    = {1983},
  doi     = {10.1126/science.220.4598.671},
}
% Raicu, Foster and Zhao, many-task computing overview, MTAGS 2008.
% Empty volume/number/ISSN placeholders were dropped, the month uses the
% predefined macro, and all authors use the "Last, First" name form.
@inproceedings{Raicu_MTAGS_08,
  author    = {Raicu, I. and Foster, I. T. and Zhao, Yong},
  title     = {Many-task computing for grids and supercomputers},
  booktitle = {1st Workshop Many-Task Computing on Grids and Supercomputers: {MTAGS} 2008},
  pages     = {1--11},
  month     = nov,
  year      = {2008},
  doi       = {10.1109/MTAGS.2008.4777912},
  keywords  = {file system operations;grid computing;high performance computing;high throughput computing;many task computing;message passing interface;supercomputers;file organisation;grid computing;message passing;parallel machines;},
}
% Al-Kiswany, Gharaibeh and Ripeanu, versatile storage system, SIGOPS OSR 44(1), 2010.
% The month uses the predefined macro so each style can format it.
@article{Al-Kiswany_2010,
  author     = {Al-Kiswany, Samer and Gharaibeh, Abdullah and Ripeanu, Matei},
  title      = {The case for a versatile storage system},
  journal    = {SIGOPS Oper. Sys. Rev.},
  volume     = {44},
  number     = {1},
  pages      = {10--14},
  month      = mar,
  year       = {2010},
  issn       = {0163-5980},
  doi        = {10.1145/1740390.1740394},
  publisher  = {ACM},
  address    = {New York, NY, USA},
  issue_date = {January 2010},
  numpages   = {5},
  acmid      = {1740394},
  keywords   = {dynamic deployment, high performance storage, storage system specialization, versatile storage system},
}
% Herlihy and Shavit, The Art of Multiprocessor Programming (2008).
@book{Herlihy_08,
  title     = {The Art of Multiprocessor Programming},
  author    = {Herlihy, Maurice and
               Shavit, Nir},
  publisher = {Morgan Kaufmann Publishers Inc.},
  address   = {San Francisco, CA, USA},
  year      = {2008},
  isbn      = {0123705916, 9780123705914},
}
% TIDeFlow execution model paper, DFM'11 workshop.
% Empty volume/number/keywords/ISSN placeholders were dropped and the month
% uses the predefined macro so each style can format it.
@inproceedings{Orozco_11,
  author    = {Orozco, Daniel and Garcia, Elkin and Pavel, Robert and
               Khan, Rishi and Gao, Guang},
  title     = {{TIDeFlow}: The Time Iterated Dependency Flow Execution Model},
  booktitle = {1st Workshop Data-Flow Execution Models for Extreme Scale Computing: DFM'11},
  pages     = {1--9},
  month     = oct,
  year      = {2011},
  doi       = {10.1109/DFM.2011.11},
}
% Cicotti, PhD thesis on the Tarragon programming model (2011).
@phdthesis{cicotti_11,
  title  = {Tarragon: a Programming Model for Latency-Hiding Scientific Computation},
  author = {Cicotti, Pietro},
  year   = {2011},
  school = {U. California, San Diego},
}
% Patterson, latency versus bandwidth article, Commun. ACM 47(10), 2004.
% Title spelling corrected: "Bandwith" is now "Bandwidth".
@article{latency,
  author     = {Patterson, David A.},
  title      = {Latency Lags Bandwidth},
  journal    = {Commun. ACM},
  volume     = {47},
  number     = {10},
  pages      = {71--75},
  month      = oct,
  year       = {2004},
  issn       = {0001-0782},
  doi        = {10.1145/1022594.1022596},
  url        = {http://doi.acm.org/10.1145/1022594.1022596},
  publisher  = {ACM},
  address    = {New York, NY, USA},
  issue_date = {October 2004},
  numpages   = {5},
  acmid      = {1022596},
}
% Babb, large-grain data flow techniques, Computer 17(7), 1984.
% The author is in "Last, Jr, First" form, so "II" is parsed as a suffix.
% The month uses the predefined macro so each style can format it.
@article{Babb_1984,
  author     = {Babb, II, R. G.},
  title      = {Parallel Processing with Large-Grain Data Flow Techniques},
  journal    = {Computer},
  volume     = {17},
  number     = {7},
  pages      = {55--61},
  month      = jul,
  year       = {1984},
  issn       = {0018-9162},
  doi        = {10.1109/MC.1984.1659186},
  publisher  = {IEEE Computer Society Press},
  address    = {Los Alamitos, CA, USA},
  issue_date = {July 1984},
  numpages   = {7},
  acmid      = {1319843},
}
% DAGuE distributed DAG engine, U. Tennessee report ICL-UT-10-01 (2010).
% The month field previously held the garbled value " 2012Apr.", which also
% conflicted with the 2010 year; it is now the predefined April macro.
% NOTE(review): confirm the April 2010 date against the report itself.
@techreport{Bosilca_10,
  author      = {Bosilca, George and Bouteiller, Aurelien and
                 Danalis, Anthony and Herault, Thomas and
                 Lemarinier, Pierre and Dongarra, Jack},
  title       = {{DAGuE}: A generic distributed {DAG} engine for high performance computing},
  number      = {ICL-UT-10-01},
  institution = {U. Tennessee},
  month       = apr,
  year        = {2010},
}
@inproceedings{Minnich_11,
author = {Minnich, Ronald G. and Janssen, Curtis L. and
Krishnamoorthy, Sriram and Marquez, Andres and
Gokhale, Maya and Sadayappan, P. and Van Hensbergen,
Eric and McKie, Jim and Appavoo, Jonathan},
title = {Fault Oblivious {eXascale} whitepaper},
booktitle = {Proc. 1st Int'l Workshop Runtime and Operating Systems
for Supercomputers: ROSS'11},
year = {2011},