-
Notifications
You must be signed in to change notification settings - Fork 0
/
many-core.bib
1432 lines (1337 loc) · 54.8 KB
/
many-core.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
% Process-in-Process address-space sharing techniques (HPDC'18).
@inproceedings{hori:hpdc2018,
  author    = {Hori, Atsushi and Si, Min and Gerofi, Balazs and Takagi, Masamichi and Dayal, Jai and Balaji, Pavan and Ishikawa, Yutaka},
  title     = {{Process-in-Process: Techniques for Practical Address-Space Sharing}},
  booktitle = {{The 27th International Symposium on High-Performance Parallel and Distributed Computing (HPDC'18)}},
  publisher = {ACM},
  year      = {2018},
  note      = {{(to appear)}},
}
% Locality-aware process mapping for collective MPI-IO on FEFS (European MPI Users' Group Meeting, 2014).
@inproceedings{tsujita:WS_EuroMPI2014,
  author    = {Yuichi Tsujita and Atsushi Hori and Yutaka Ishikawa},
  title     = {Locality-Aware Process Mapping for High Performance Collective {MPI-IO} on {FEFS} with {Tofu} Interconnect},
  booktitle = {Proceedings of the 21st European MPI Users' Group Meeting},
  pages     = {157--162},
  year      = {2014},
  publisher = {ACM},
  doi       = {10.1145/2642769.2642799},
  note      = {Challenges in Data-Centric Computing},
}
% Topology-aware stepwise data aggregation with I/O throttling for collective MPI-IO (HPC Asia 2018).
@inproceedings{tsujita:hpcasia18,
  author    = {Yuichi Tsujita and Atsushi Hori and Toyohisa Kameyama and Atsuya Uno and Fumiyoshi Shoji and Yutaka Ishikawa},
  title     = {Improving Collective {MPI-IO} Using Topology-Aware Stepwise Data Aggregation with {I/O} Throttling},
  booktitle = {Proceedings of the International Conference on High Performance Computing in Asia-Pacific Region},
  pages     = {12--23},
  year      = {2018},
  publisher = {ACM},
  doi       = {10.1145/3149457.3149464},
}
% Scalable consensus for pseudo-synchronous distributed systems (SC '15).
@inproceedings{Herault:2015:PSC:2807591.2807665,
  author    = {Herault, Thomas and Bouteiller, Aurelien and Bosilca, George and Gamell, Marc and Teranishi, Keita and Parashar, Manish and Dongarra, Jack},
  title     = {Practical Scalable Consensus for Pseudo-synchronous Distributed Systems},
  booktitle = {Proceedings of the International Conference for High Performance Computing, Networking, Storage and Analysis},
  series    = {SC '15},
  pages     = {31:1--31:12},
  articleno = {31},
  numpages  = {12},
  year      = {2015},
  location  = {Austin, Texas},
  publisher = {ACM},
  address   = {New York, NY, USA},
  isbn      = {978-1-4503-3723-6},
  doi       = {10.1145/2807591.2807665},
  url       = {http://doi.acm.org/10.1145/2807591.2807665},
  acmid     = {2807665},
  keywords  = {MPI, agreement, fault-tolerance},
}
% Interrupting ongoing MPI operations to support failure recovery (EuroMPI '15).
@inproceedings{Bouteiller:2015:PBI:2802658.2802668,
  author    = {Bouteiller, Aurelien and Bosilca, George and Dongarra, Jack J.},
  title     = {{Plan B}: Interruption of Ongoing {MPI} Operations to Support Failure Recovery},
  booktitle = {Proceedings of the 22nd European MPI Users' Group Meeting},
  series    = {EuroMPI '15},
  year      = {2015},
  isbn      = {978-1-4503-3795-3},
  location  = {Bordeaux, France},
  pages     = {11:1--11:9},
  articleno = {11},
  numpages  = {9},
  url       = {http://doi.acm.org/10.1145/2802658.2802668},
  doi       = {10.1145/2802658.2802668},
  acmid     = {2802668},
  publisher = {ACM},
  address   = {New York, NY, USA},
}
% Algorithm-based fault tolerance for dense matrix factorizations (ACM Trans. Parallel Comput., 2015).
@article{Bouteiller:2015:AFT:2737841.2686892,
  author     = {Bouteiller, Aurelien and Herault, Thomas and Bosilca, George and Du, Peng and Dongarra, Jack},
  title      = {Algorithm-Based Fault Tolerance for Dense Matrix Factorizations, Multiple Failures and Accuracy},
  journal    = {ACM Trans. Parallel Comput.},
  volume     = {1},
  number     = {2},
  pages      = {10:1--10:28},
  articleno  = {10},
  numpages   = {28},
  month      = feb,
  year       = {2015},
  issue_date = {January 2015},
  publisher  = {ACM},
  address    = {New York, NY, USA},
  issn       = {2329-4949},
  doi        = {10.1145/2686892},
  url        = {http://doi.acm.org/10.1145/2686892},
  acmid      = {2686892},
  keywords   = {ABFT, fault-tolerance, high performance computing, linear algebra},
}
% Design and rationale of MPI extensions for post-failure recovery of communication capability (IJHPCA, 2013).
@article{doi:10.1177/1094342013488238,
  author   = {Wesley Bland and Aurelien Bouteiller and Thomas Herault and George Bosilca and Jack Dongarra},
  title    = {Post-failure recovery of {MPI} communication capability: Design and rationale},
  journal  = {The International Journal of High Performance Computing Applications},
  volume   = {27},
  number   = {3},
  pages    = {244--254},
  year     = {2013},
  doi      = {10.1177/1094342013488238},
  url      = {https://doi.org/10.1177/1094342013488238},
  abstract = { As supercomputers are entering an era of massive parallelism where the frequency of faults is increasing, the MPI Standard remains distressingly vague on the consequence of failures on MPI communications. Advanced fault-tolerance techniques have the potential to prevent full-scale application restart and therefore lower the cost incurred for each failure, but they demand from MPI the capability to detect failures and resume communications afterward. In this paper, we present a set of extensions to MPI that allow communication capabilities to be restored, while maintaining the extreme level of performance to which MPI users have become accustomed. The motivation behind the design choices are weighted against alternatives, a task that requires simultaneously considering MPI from the viewpoint of both the user and the implementor. The usability of the interfaces for expressing advanced recovery techniques is then discussed, including the difficult issue of enabling separate software layers to coordinate their recovery. },
}
% PhD thesis (Keio University, 2017) on task models for intra-node communication in many-core environments.
@phdthesis{shimada-thesis,
  author = {Akio Shimada},
  title  = {{A Study on Task Models for High-performance and Efficient Intra-node Communication in Many-core Environments}},
  school = {{Keio University}},
  year   = {2017},
  note   = {(in Japanese)},
}
% Master's thesis (Tokyo University of Agriculture and Technology, 2014) on Multiple PVAS.
@mastersthesis{fukazawa-thesis,
  author = {Go Fukazawa},
  title  = {{Multiple PVAS: a systems software for HPC application programs on multi-core and many-core}},
  school = {{Tokyo University of Agriculture and Technology}},
  year   = {2014},
  note   = {(in Japanese)},
}
% PM/InfiniBand-FJ communication facility for large scale PC clusters (HPC Asia 2004).
@inproceedings{pm-infiniband-fj,
  author    = {S. Sumimoto and A. Naruse and K. Kumon and K. Hosoe and T. Shimizu},
  title     = {{PM/InfiniBand-FJ: a high performance communication facility using InfiniBand for large scale PC clusters}},
  booktitle = {Proceedings. Seventh International Conference on High Performance Computing and Grid in Asia Pacific Region, 2004.},
  pages     = {104--113},
  month     = jul,
  year      = {2004},
  doi       = {10.1109/HPCASIA.2004.1324023},
  keywords  = {multiprocessor interconnection networks;network operating systems;software performance evaluation;workstation clusters;Fujitsu PR1MERGY RX200 PC cluster;InfiniBand interconnect;NAS parallel benchmark;PM/InfiniBand-FJ;PM/MyrinetXP;SCore cluster system software;ServerWorks GC LE chipset;Xeon;communication facility;large scale PC clusters;Application software;Automobiles;Availability;Bandwidth;Computational modeling;High performance computing;Laboratories;Large-scale systems;Supercomputers;System software},
}
% Cluster-enabled OpenMP compiler for the SCASH software distributed shared memory system (Sci. Program., 2001).
@article{Sato:2001:COO:1239928.1239934,
  author     = {Sato, Mitsuhisa and Harada, Hiroshi and Hasegawa, Atsushi and Ishikawa, Yutaka},
  title      = {{Cluster-enabled OpenMP: An OpenMP Compiler for the SCASH Software Distributed Shared Memory System}},
  journal    = {Sci. Program.},
  issue_date = {August 2001},
  volume     = {9},
  number     = {2,3},
  month      = aug,
  year       = {2001},
  issn       = {1058-9244},
  pages      = {123--130},
  numpages   = {8},
  url        = {http://dl.acm.org/citation.cfm?id=1239928.1239934},
  acmid      = {1239934},
  publisher  = {IOS Press},
  address    = {Amsterdam, The Netherlands},
}
% Performance of SMP clusters running MPI programs (Future Generation Computer Systems, 2001).
@article{CAPPELLO2001711,
  author   = {Franck Cappello and Olivier Richard and Daniel Etiemble},
  title    = {{Understanding performance of SMP clusters running MPI programs}},
  journal  = {Future Generation Computer Systems},
  volume   = {17},
  number   = {6},
  pages    = {711--720},
  year     = {2001},
  note     = {I: PaCT. II: HPC applications},
  issn     = {0167-739X},
  doi      = {10.1016/S0167-739X(00)00054-6},
  url      = {http://www.sciencedirect.com/science/article/pii/S0167739X00000546},
  keywords = {Clusters of multiprocessors, SMP clusters, MPI programs},
}
% LiMIC: MPI intra-node communication support on Linux clusters (ICPP'05).
@inproceedings{1488614,
  author    = {H. W. Jin and S. Sur and L. Chai and D. K. Panda},
  title     = {{LiMIC: support for high-performance MPI intra-node communication on Linux cluster}},
  booktitle = {2005 International Conference on Parallel Processing (ICPP'05)},
  pages     = {184--191},
  month     = jun,
  year      = {2005},
  issn      = {0190-3918},
  doi       = {10.1109/ICPP.2005.48},
  keywords  = {Linux;message passing;multiprocessing systems;network operating systems;operating system kernels;performance evaluation;workstation clusters;8-node dual SMP InfiniBand cluster;LiMIC;Linux cluster;MPI friendly interface;MPI stack;MVAPICH;SMP workstation clusters;high-performance MPI intra-node communication;kernel module interface;open source MPI;point-to-point latency;Application software;Bandwidth;Computer science;Delay;Kernel;Linux;Local area networks;Message passing;Operating systems;Workstations},
}
% Nemesis message-passing communication subsystem (CCGRID 06).
@inproceedings{1630865,
  author    = {D. Buntinas and G. Mercier and W. Gropp},
  title     = {{Design and evaluation of Nemesis, a scalable, low-latency, message-passing communication subsystem}},
  booktitle = {Cluster Computing and the Grid, 2006. CCGRID 06. Sixth IEEE International Symposium on},
  volume    = {1},
  pages     = {521--530},
  month     = may,
  year      = {2006},
  doi       = {10.1109/CCGRID.2006.31},
  keywords  = {message passing;shared memory systems;MPI implementation;MPICH2 architecture;Nemesis;dedicated communication channel;high performance network;internode communication;intranode communication context;low-latency message passing;low-level communication subsystem;message passing communication subsystem;point-to-point benchmark;scalable message passing interface;shared memory systems;Communication channels;Computer architecture;Computer science;Concurrent computing;Context;Hardware;Laboratories;Mathematics;Message passing;Scalability},
}
% Network architecture of the Connection Machine CM-5 (J. Parallel Distrib. Comput., 1996).
@article{Leiserson:1996:NAC:226363.226368,
  author     = {Leiserson, Charles E. and Abuhamdeh, Zahi S. and Douglas, David C. and Feynman, Carl R. and Ganmukhi, Mahesh N. and Hill, Jeffrey V. and Hillis, W. Daniel and Kuszmaul, Bradley C. and St. Pierre, Margaret A. and Wells, David S. and Wong-Chan, Monica C. and Yang, Shaw-Wen and Zak, Robert},
  title      = {{The Network Architecture of the Connection Machine CM-5}},
  journal    = {J. Parallel Distrib. Comput.},
  issue_date = {March 15, 1996},
  volume     = {33},
  number     = {2},
  month      = mar,
  year       = {1996},
  issn       = {0743-7315},
  pages      = {145--158},
  numpages   = {14},
  url        = {http://dx.doi.org/10.1006/jpdc.1996.0033},
  doi        = {10.1006/jpdc.1996.0033},
  acmid      = {226368},
  publisher  = {Academic Press, Inc.},
  address    = {Orlando, FL, USA},
}
% U-Net user-level network interface (SIGOPS Oper. Syst. Rev., 1995).
@article{u-net,
  author    = {T. von Eicken and A. Basu and V. Buch and W. Vogels},
  title     = {{U-Net: a user-level network interface for parallel and distributed computing}},
  journal   = {SIGOPS Oper. Syst. Rev.},
  volume    = {29},
  number    = {5},
  month     = dec,
  year      = {1995},
  issn      = {0163-5980},
  pages     = {40--53},
  numpages  = {14},
  url       = {http://doi.acm.org/10.1145/224057.224061},
  doi       = {10.1145/224057.224061},
  acmid     = {224061},
  publisher = {ACM},
  address   = {New York, NY, USA},
}
% Active messages: integrated communication and computation (ISCA '92).
@inproceedings{AM,
  author    = {Thorsten von Eicken and David E. Culler and Seth Copen Goldstein and Klaus Erik Schauser},
  title     = {{Active messages: a mechanism for integrated communication and computation}},
  booktitle = {Proceedings of the 19th annual international symposium on Computer architecture},
  series    = {ISCA '92},
  year      = {1992},
  isbn      = {0-89791-509-7},
  location  = {Queensland, Australia},
  pages     = {256--266},
  numpages  = {11},
  url       = {http://doi.acm.org/10.1145/139669.140382},
  doi       = {10.1145/139669.140382},
  acmid     = {140382},
  publisher = {ACM},
  address   = {New York, NY, USA},
}
% Fast Messages communication layer for workstation clusters and MPPs (IEEE Parallel Distrib. Technol., 1997).
@article{FM,
  author    = {Scott Pakin and Vijay Karamcheti and Andrew A. Chien},
  title     = {{Fast Messages: Efficient, Portable Communication for Workstation Clusters and MPPs}},
  journal   = {IEEE Parallel Distrib. Technol.},
  volume    = {5},
  number    = {2},
  month     = apr,
  year      = {1997},
  issn      = {1063-6552},
  pages     = {60--73},
  numpages  = {14},
  url       = {http://dl.acm.org/citation.cfm?id=613783.614014},
  acmid     = {614014},
  publisher = {IEEE Computer Society Press},
  address   = {Los Alamitos, CA, USA},
}
% PM: operating system coordinated communication library (HPCN Europe '97).
@inproceedings{PM,
  author    = {Tezuka, Hiroshi and Hori, Atsushi and Ishikawa, Yutaka and Sato, Mitsuhisa},
  title     = {{PM: An Operating System Coordinated High Performance Communication Library}},
  booktitle = {Proceedings of the International Conference and Exhibition on High-Performance Computing and Networking},
  series    = {HPCN Europe '97},
  pages     = {708--717},
  numpages  = {10},
  year      = {1997},
  publisher = {Springer-Verlag},
  address   = {London, UK},
  isbn      = {3-540-62898-3},
  url       = {http://dl.acm.org/citation.cfm?id=645561.658906},
  acmid     = {658906},
}
% Myrinet gigabit-per-second local area network (IEEE Micro, 1995).
@article{boden95myrinet,
  author  = {Nanette J. Boden and Danny Cohen and Robert E. Felderman and Alan E. Kulawik and Charles L. Seitz and Jakov N. Seizovic and Wen-King Su},
  title   = {{Myrinet: A Gigabit-per-Second Local Area Network}},
  journal = {IEEE Micro},
  volume  = {15},
  number  = {1},
  pages   = {29--36},
  year    = {1995},
  url     = {http://citeseer.nj.nec.com/boden95myrinet.html},
}
% Beowulf parallel workstation (24th International Conference on Parallel Processing, 1995).
@inproceedings{Sterling95beowulf:a,
  author    = {Thomas Sterling and Donald J. Becker and Daniel Savarese and John E. Dorband and Udaya A. Ranawake and Charles V. Packer},
  title     = {{Beowulf: A Parallel Workstation For Scientific Computation}},
  booktitle = {Proceedings of the 24th International Conference on Parallel Processing},
  year      = {1995},
  pages     = {11--14},
  publisher = {CRC Press},
}
% Sliding substitution of failed nodes (EuroMPI '15).
@inproceedings{Hori:2015:SSF:2802658.2802670,
  author    = {Hori, Atsushi and Yoshinaga, Kazumi and Herault, Thomas and Bouteiller, Aur{\'e}lien and Bosilca, George and Ishikawa, Yutaka},
  title     = {{Sliding Substitution of Failed Nodes}},
  booktitle = {Proceedings of the 22nd European MPI Users' Group Meeting},
  series    = {EuroMPI '15},
  year      = {2015},
  isbn      = {978-1-4503-3795-3},
  location  = {Bordeaux, France},
  pages     = {14:1--14:10},
  articleno = {14},
  numpages  = {10},
  url       = {http://doi.acm.org/10.1145/2802658.2802670},
  doi       = {10.1145/2802658.2802670},
  acmid     = {2802670},
  publisher = {ACM},
  address   = {New York, NY, USA},
  keywords  = {communication performance, fault mitigation, fault tolerance, spare node, CREST Project},
}
% User-level process towards exascale systems (IPSJ, 2014).
% NOTE(review): this article entry has no journal field; the venue name is not recoverable from this file, so confirm and add it.
@article{110009850784,
  author    = {Akio Shimada and Atsushi Hori and Yutaka Ishikawa and Pavan Balaji},
  title     = {User-level Process towards Exascale Systems},
  publisher = {IPSJ},
  year      = {2014},
  month     = dec,
  volume    = {2014},
  number    = {22},
  pages     = {1--7},
  url       = {http://ci.nii.ac.jp/naid/110009850784/},
  keywords  = {CREST Project},
}
% Adaptive transport service selection for MPI over InfiniBand (ExaMPI '15).
@inproceedings{Takagi:2015:ATS:2831129.2831132,
  author    = {Takagi, Masamichi and Yamaguchi, Norio and Gerofi, Balazs and Hori, Atsushi and Ishikawa, Yutaka},
  title     = {{Adaptive Transport Service Selection for MPI with InfiniBand Network}},
  booktitle = {Proceedings of the 3rd Workshop on Exascale MPI},
  series    = {ExaMPI '15},
  pages     = {3:1--3:10},
  articleno = {3},
  numpages  = {10},
  year      = {2015},
  location  = {Austin, Texas},
  publisher = {ACM},
  address   = {New York, NY, USA},
  isbn      = {978-1-4503-3998-8},
  doi       = {10.1145/2831129.2831132},
  url       = {http://doi.acm.org/10.1145/2831129.2831132},
  acmid     = {2831132},
  keywords  = {CREST Project},
}
% Kernel-level blocking MPI implementation (Recent Advances in the Message Passing Interface, LNCS 7490, 2012).
% NOTE(review): the original entry had an empty citation key; confirm the key assigned here does not clash with another entry in this file.
@incollection{eurompi2012-hori,
  author    = {Hori, Atsushi and Kameyama, Toyohisa and Tsujita, Yuichi and Namiki, Mitaro and Ishikawa, Yutaka},
  title     = {{An Efficient Kernel-Level Blocking MPI Implementation}},
  booktitle = {Recent Advances in the Message Passing Interface},
  editor    = {Tr{\"a}ff, Jesper Larsson and Benkner, Siegfried and Dongarra, Jack J.},
  series    = {Lecture Notes in Computer Science},
  volume    = {7490},
  pages     = {153--162},
  year      = {2012},
  publisher = {Springer Berlin Heidelberg},
  isbn      = {978-3-642-33517-4},
  doi       = {10.1007/978-3-642-33518-1_20},
  url       = {http://dx.doi.org/10.1007/978-3-642-33518-1_20},
  keywords  = {CREST Project},
}
% Poster on distributed metadata management for an exascale parallel file system (SC Companion 2012).
@inproceedings{6496025,
  author    = {Yamamoto, Keiji and Hori, Atsushi and Ishikawa, Yutaka},
  title     = {{Poster: Distributed Metadata Management for Exascale Parallel File System}},
  booktitle = {High Performance Computing, Networking, Storage and Analysis (SCC), 2012 SC Companion:},
  year      = {2012},
  month     = nov,
  pages     = {1438},
  doi       = {10.1109/SC.Companion.2012.242},
  keywords  = {CREST Project},
}
% Poster on OS-assisted hierarchical memory management for heterogeneous architectures (SC Companion 2012).
@inproceedings{6495965,
  author    = {Gerofi, B. and Hori, A. and Shimada, A. and Ishikawa, Y.},
  title     = {{Poster: Toward Operating System Assisted Hierarchical Memory Management for Heterogeneous Architectures}},
  booktitle = {High Performance Computing, Networking, Storage and Analysis (SCC), 2012 SC Companion:},
  year      = {2012},
  month     = nov,
  pages     = {1352},
  doi       = {10.1109/SC.Companion.2012.182},
  keywords  = {coprocessors;operating systems (computers);parallel processing;peripheral interfaces;storage management;Intel MIC architecture;Intel many integrated core architecture;MMU;PCI DMA operation;PCI card;address mapping;coprocessor;heterogeneous architecture;hierarchical memory management;memory management unit;operating system;parallel workload processing;peripheral component interconnect;coprocessor;manycore;memory management;operating systems;CREST Project},
}
% clone_n(): parallel thread creation for many-core architectures (IEEE CLUSTER 2012).
@inproceedings{6337830,
  author    = {Gerofi, B. and Hori, A. and Ishikawa, Y.},
  title     = {{clone\_n(): Parallel Thread Creation for Upcoming Many-Core Architectures}},
  booktitle = {Cluster Computing (CLUSTER), 2012 IEEE International Conference on},
  year      = {2012},
  month     = sep,
  pages     = {592--596},
  doi       = {10.1109/CLUSTER.2012.85},
  keywords  = {application program interfaces;graphics processing units;multiprocessing systems;operating systems (computers);parallel architectures;processor scheduling;Intel many integrated core;NVIDIA GPU;OS API;clone_n();heterogeneous architectures;many-core architectures;multicore processor;operating system;parallel thread creation;parallel workloads;parallelism control;power-efficient cores;single-thread performance;software thread creation;software thread scheduling;system call;Cloning;Instruction sets;Kernel;Message systems;Multicore processing;coprocessor;manycore;operating systems;threading;CREST Project},
}
% Striping-layout-aware data aggregation for I/O on a Lustre file system (ISC High Performance 2015, LNCS 9137).
@inproceedings{tsujita:isc2015,
  author    = {Yuichi Tsujita and Atsushi Hori and Yutaka Ishikawa},
  title     = {Striping Layout Aware Data Aggregation for High Performance {I/O} on a {Lustre} File System},
  booktitle = {High Performance Computing, 30th International Conference, ISC High Performance 2015, Frankfurt, Germany, July 12-16, 2015, Proceedings},
  pages     = {282--290},
  year      = {2015},
  editor    = {Julian M. Kunkel and Thomas Ludwig},
  volume    = {9137},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer},
  keywords  = {AICS},
}
% Interface for Heterogeneous Kernels: framework for hybrid OS designs (HiPC 2014).
@inproceedings{shimosawa2014,
  author    = {T. Shimosawa and B. Gerofi and M. Takagi and T. Shirasawa and M. Shimizu and A. Hori and Y. Ishikawa},
  title     = {{Interface for Heterogeneous Kernels: A Framework to Enable Hybrid OS Designs Targeting High Performance Computing}},
  booktitle = {IEEE International Conference on High Performance Computing (HiPC)},
  location  = {Goa, India},
  year      = {2014},
  publisher = {IEEE},
  keywords  = {CREST Project},
}
% Design of Multiple PVAS on an InfiniBand cluster of many-core and multi-core nodes (EuroMPI/ASIA '14).
@inproceedings{Sato:2014:DMP:2642769.2642795,
  author    = {Sato, Mikiko and Fukazawa, Go and Shimada, Akio and Hori, Atsushi and Ishikawa, Yutaka and Namiki, Mitaro},
  title     = {Design of Multiple {PVAS} on {InfiniBand} Cluster System Consisting of Many-core and Multi-core},
  booktitle = {Proceedings of the 21st European MPI Users' Group Meeting},
  series    = {EuroMPI/ASIA '14},
  year      = {2014},
  isbn      = {978-1-4503-2875-3},
  location  = {Kyoto, Japan},
  pages     = {133:133--133:138},
  articleno = {133},
  numpages  = {6},
  url       = {http://doi.acm.org/10.1145/2642769.2642795},
  doi       = {10.1145/2642769.2642795},
  acmid     = {2642795},
  publisher = {ACM},
  address   = {New York, NY, USA},
  keywords  = {CREST Project},
}
% Eliminating process-boundary crossing costs from MPI intra-node communication (EuroMPI/ASIA '14).
@inproceedings{Shimada:2014:ECC:2642769.2642790,
  author    = {Shimada, Akio and Hori, Atsushi and Ishikawa, Yutaka},
  title     = {Eliminating Costs for Crossing Process Boundary from {MPI} Intra-node Communication},
  booktitle = {Proceedings of the 21st European MPI Users' Group Meeting},
  series    = {EuroMPI/ASIA '14},
  year      = {2014},
  isbn      = {978-1-4503-2875-3},
  location  = {Kyoto, Japan},
  pages     = {119:119--119:120},
  articleno = {119},
  numpages  = {2},
  url       = {http://doi.acm.org/10.1145/2642769.2642790},
  doi       = {10.1145/2642769.2642790},
  acmid     = {2642790},
  publisher = {ACM},
  address   = {New York, NY, USA},
  keywords  = {CREST Project},
}
% PGAS intra-node communication towards many-core architecture (PGAS'12).
@inproceedings{SHIMADA:PGAS12,
  author    = {Akio Shimada and Balazs Gerofi and Atsushi Hori and Yutaka Ishikawa},
  title     = {{PGAS} Intra-node Communication towards Many-Core Architecture},
  booktitle = {PGAS 2012: 6th Conference on Partitioned Global Address Space Programming Model},
  series    = {PGAS'12},
  year      = {2012},
  location  = {Santa Barbara, California, USA},
}
% CMCP page replacement policy for hierarchical memory management on many-cores (HPDC '14).
@inproceedings{Gerofi:2014:CNP:2600212.2600231,
  author    = {Gerofi, Balazs and Shimada, Akio and Hori, Atsushi and Takagi, Masamichi and Ishikawa, Yutaka},
  title     = {{CMCP}: A Novel Page Replacement Policy for System Level Hierarchical Memory Management on Many-cores},
  booktitle = {Proceedings of the 23rd International Symposium on High-performance Parallel and Distributed Computing},
  series    = {HPDC '14},
  year      = {2014},
  isbn      = {978-1-4503-2749-7},
  location  = {Vancouver, BC, Canada},
  pages     = {73--84},
  numpages  = {12},
  url       = {http://doi.acm.org/10.1145/2600212.2600231},
  doi       = {10.1145/2600212.2600231},
  acmid     = {2600231},
  publisher = {ACM},
  address   = {New York, NY, USA},
}
% Decoupling architecture for all-to-all computation (EuroMPI/ASIA '14).
@inproceedings{Hori:2014:DAA:2642769.2642801,
  author    = {Hori, Atsushi and Yoshinaga, Kazumi and Tokuhisa, Atsushi and Joti, Yasumasa and Okada, Kensuke and Sugimoto, Takashi and Yamaga, Mitsuhiro and Hatsui, Takaki and Yabashi, Makina and Sugita, Yuji and Ishikawa, Yutaka and Go, Nobuhiro},
  title     = {Decoupling Architecture for All-to-all Computation},
  booktitle = {Proceedings of the 21st European MPI Users' Group Meeting},
  series    = {EuroMPI/ASIA '14},
  pages     = {169:169--169:174},
  articleno = {169},
  numpages  = {6},
  year      = {2014},
  location  = {Kyoto, Japan},
  publisher = {ACM},
  address   = {New York, NY, USA},
  isbn      = {978-1-4503-2875-3},
  doi       = {10.1145/2642769.2642801},
  url       = {http://doi.acm.org/10.1145/2642769.2642801},
  acmid     = {2642801},
}
% Affinity-aware optimization of multithreaded two-phase I/O (HPCS 2014).
@inproceedings{hpcs2014,
  author    = {Yuichi Tsujita and Atsushi Hori and Yutaka Ishikawa},
  title     = {Affinity-Aware Optimization of Multithreaded Two-Phase {I/O} for High Throughput Collective {I/O}},
  booktitle = {Proceedings of International Conference on High Performance Computing {\&} Simulation, HPCS 2014, Bologna, Italy, July 21-25, 2014},
  pages     = {210--217},
  year      = {2014},
  publisher = {IEEE},
}
% Multithreaded two-phase I/O for collective MPI-IO on a Lustre file system (PDP2014).
@inproceedings{PDP2014,
  author    = {Yuichi Tsujita and Kazumi Yoshinaga and Atsushi Hori and Mikiko Sato and Mitaro Namiki and Yutaka Ishikawa},
  title     = {Multithreaded Two-Phase {I/O}: Improving Collective {MPI-IO} Performance on a {Lustre} File System},
  booktitle = {Proceedings of PDP2014, Turin, February 12-14, 2014},
  pages     = {232--235},
  year      = {2014},
  month     = feb,
  publisher = {IEEE CS},
}
% Revisiting persistent communication in MPI (Recent Advances in the Message Passing Interface, LNCS 7490, 2012).
@incollection{eurompi2012-ishikawa,
  author    = {Ishikawa, Yutaka and Nakajima, Kengo and Hori, Atsushi},
  title     = {Revisiting Persistent Communication in {MPI}},
  booktitle = {Recent Advances in the Message Passing Interface},
  editor    = {Tr{\"a}ff, Jesper Larsson and Benkner, Siegfried and Dongarra, Jack J.},
  series    = {Lecture Notes in Computer Science},
  volume    = {7490},
  pages     = {296--297},
  year      = {2012},
  publisher = {Springer Berlin Heidelberg},
  isbn      = {978-3-642-33517-4},
  doi       = {10.1007/978-3-642-33518-1_39},
  url       = {http://dx.doi.org/10.1007/978-3-642-33518-1_39},
}
% Classification of coherent X-ray diffraction patterns on the K computer (Journal of Synchrotron Radiation, 2013).
@article{Tokuhisa:ys5079,
  author  = {Tokuhisa, Atsushi and Arai, Junya and Joti, Yasumasa and Ohno, Yoshiyuki and Kameyama, Toyohisa and Yamamoto, Keiji and Hatanaka, Masayuki and Gerofi, Balazs and Shimada, Akio and Kurokawa, Motoyoshi and Shoji, Fumiyoshi and Okada, Kensuke and Sugimoto, Takashi and Yamaga, Mitsuhiro and Tanaka, Ryotaro and Yokokawa, Mitsuo and Hori, Atsushi and Ishikawa, Yutaka and Hatsui, Takaki and Go, Nobuhiro},
  title   = {{High-speed classification of coherent X-ray diffraction~patterns on the K computer for high-resolution single biomolecule imaging}},
  journal = {Journal of Synchrotron Radiation},
  year    = {2013},
  volume  = {20},
  number  = {6},
  pages   = {899--904},
  month   = nov,
  doi     = {10.1107/S0909049513022152},
  url     = {http://dx.doi.org/10.1107/S0909049513022152},
}
% Hybrid operating system for a computing node with multi-core and many-core processors (IJACSci, 2013).
% NOTE(review): the journal name was garbled in the original ("International Journal Advanced mputer Science"); confirm the spelling restored here.
@article{mikiko:2013,
  author  = {M. Sato and G. Fukazawa and K. Yoshinaga and Y. Tsujita and A. Hori and M. Namiki},
  title   = {A Hybrid Operating System for a Computing Node with Multi-Core and Many-Core Processors},
  journal = {International Journal of Advanced Computer Science (IJACSci)},
  volume  = {3},
  number  = {7},
  pages   = {368--377},
  month   = jul,
  year    = {2013},
}
% Optimization of MPI persistent communication (EuroMPI '13).
@inproceedings{Hatanaka:2013:OMP:2488551.2488566,
  author    = {Hatanaka, Masayuki and Hori, Atsushi and Ishikawa, Yutaka},
  title     = {Optimization of {MPI} Persistent Communication},
  booktitle = {Proceedings of the 20th European MPI Users' Group Meeting},
  series    = {EuroMPI '13},
  year      = {2013},
  isbn      = {978-1-4503-1903-4},
  location  = {Madrid, Spain},
  pages     = {79--84},
  numpages  = {6},
  url       = {http://doi.acm.org/10.1145/2488551.2488566},
  doi       = {10.1145/2488551.2488566},
  acmid     = {2488566},
  publisher = {ACM},
  address   = {New York, NY, USA},
}
% White paper on SACLA and the K computer (BDEC Fukuoka, 2014).
@misc{bdec2014,
  author       = {A. Hori and A. Tokuhisa and K. Yoshinaga and T. Kameyama and K. Okada and J. Arai and T. Sugimoto and M. Yamaga and R. Tanaka and Y. Joti and T. Hatsui and M. Yabashi and Y. Sugita and Y. Ishikawa and N. Go},
  title        = {{SACLA and the K Computer}},
  year         = {2014},
  howpublished = {{White Paper presented in BDEC Fukuoka, JAPAN}},
}
% Multithreaded two-phase I/O with processor affinity management (Parallel Processing and Applied Mathematics, LNCS 8384, 2014).
@incollection{tsujita-2014,
  author    = {Tsujita, Yuichi and Yoshinaga, Kazumi and Hori, Atsushi and Sato, Mikiko and Namiki, Mitaro and Ishikawa, Yutaka},
  title     = {Improving Parallel {I/O} Performance Using Multithreaded Two-Phase {I/O} with Processor Affinity Management},
  booktitle = {Parallel Processing and Applied Mathematics},
  editor    = {Wyrzykowski, Roman and Dongarra, Jack and Karczewski, Konrad and Wa{\'s}niewski, Jerzy},
  series    = {Lecture Notes in Computer Science},
  volume    = {8384},
  pages     = {714--723},
  year      = {2014},
  publisher = {Springer Berlin Heidelberg},
  isbn      = {978-3-642-55223-6},
  doi       = {10.1007/978-3-642-55224-3_67},
  url       = {http://dx.doi.org/10.1007/978-3-642-55224-3_67},
  language  = {English},
}
% Proposal of a new task model towards many-core architecture (MES '13).
@inproceedings{Shimada:2013:PNT:2489068.2489075,
  author    = {Shimada, Akio and Gerofi, Balazs and Hori, Atsushi and Ishikawa, Yutaka},
  title     = {Proposing a new task model towards many-core architecture},
  booktitle = {Proceedings of the First International Workshop on Many-core Embedded Systems},
  series    = {MES '13},
  pages     = {45--48},
  numpages  = {4},
  year      = {2013},
  location  = {Tel-Aviv, Israel},
  publisher = {ACM},
  address   = {New York, NY, USA},
  isbn      = {978-1-4503-2063-4},
  doi       = {10.1145/2489068.2489075},
  url       = {http://doi.acm.org/10.1145/2489068.2489075},
  acmid     = {2489075},
}
% Partially separated page tables for OS-assisted hierarchical memory management (CCGRID 2013).
@inproceedings{DBLP:conf/ccgrid/GerofiSHI13,
  author    = {Balazs Gerofi and Akio Shimada and Atsushi Hori and Yutaka Ishikawa},
  title     = {Partially Separated Page Tables for Efficient Operating System Assisted Hierarchical Memory Management on Heterogeneous Architectures},
  booktitle = {CCGRID},
  year      = {2013},
  pages     = {360--368},
  ee        = {http://doi.ieeecomputersociety.org/10.1109/CCGrid.2013.59},
  crossref  = {DBLP:conf/ccgrid/2013},
  bibsource = {DBLP, http://dblp.uni-trier.de},
}
% Hybrid operating system design for a parallel computer with multi-core and many-core processors (ROSS '12).
@inproceedings{Sato:2012:DHO:2318916.2318927,
  author    = {Sato, Mikiko and Fukazawa, Go and Nagamine, Kiyohiko and Sakamoto, Ryuichi and Namiki, Mitaro and Yoshinaga, Kazumi and Tsujita, Yuichi and Hori, Atsushi and Ishikawa, Yutaka},
  title     = {A design of hybrid operating system for a parallel computer with multi-core and many-core processors},
  booktitle = {Proceedings of the 2nd International Workshop on Runtime and Operating Systems for Supercomputers},
  series    = {ROSS '12},
  pages     = {9:1--9:8},
  articleno = {9},
  numpages  = {8},
  year      = {2012},
  location  = {Venice, Italy},
  publisher = {ACM},
  address   = {New York, NY, USA},
  isbn      = {978-1-4503-1460-2},
  doi       = {10.1145/2318916.2318927},
  url       = {http://doi.acm.org/10.1145/2318916.2318927},
  acmid     = {2318927},
}
@inproceedings{Yoshinaga:2013:DMM:2497369.2497589,
  author    = {Yoshinaga, Kazumi and
               Tsujita, Yuichi and
               Hori, Atsushi and
               Sato, Mikiko and
               Namiki, Mitaro and
               Ishikawa, Yutaka},
  title     = {A Delegation Mechanism on Many-Core Oriented Hybrid Parallel Computers for Scalability of Communicators and Communications in {MPI}},
  booktitle = {Proceedings of the 2013 21st Euromicro International Conference on Parallel, Distributed, and Network-Based Processing},
  series    = {PDP '13},
  pages     = {249--253},
  numpages  = {5},
  year      = {2013},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA},
  isbn      = {978-0-7695-4939-2},
  doi       = {10.1109/PDP.2013.43},
  url       = {http://dx.doi.org/10.1109/PDP.2013.43},
  acmid     = {2497589},
}
@incollection{Yoshinaga-2012,
  author    = {Yoshinaga, Kazumi and
               Tsujita, Yuichi and
               Hori, Atsushi and
               Sato, Mikiko and
               Namiki, Mitaro and
               Ishikawa, Yutaka},
  title     = {Delegation-Based {MPI} Communications for a Hybrid Parallel Computer with Many-Core Architecture},
  booktitle = {Recent Advances in the Message Passing Interface},
  editor    = {Tr{\"a}ff, Jesper Larsson and
               Benkner, Siegfried and
               Dongarra, Jack J.},
  series    = {Lecture Notes in Computer Science},
  volume    = {7490},
  pages     = {47--56},
  year      = {2012},
  publisher = {Springer Berlin Heidelberg},
  isbn      = {978-3-642-33517-4},
  doi       = {10.1007/978-3-642-33518-1_10},
  url       = {http://dx.doi.org/10.1007/978-3-642-33518-1_10},
}
@inproceedings{ohnofile,
  author    = {Ohno, Yoshiyuki and
               Hori, Atsushi and
               Ishikawa, Yutaka},
  title     = {File Composition Technique to Improve the Performance of Accessing a Number of Small Files},
  booktitle = {Proceedings of the International Conference on Parallel and Distributed Processing Techniques and Applications},
  volume    = {I},
  pages     = {395--400},
  year      = {2012},
}
@inproceedings{Hori:2011:PMF:2148600.2148613,
  author    = {Hori, Atsushi and
               Ishikawa, Yutaka},
  title     = {Poster: {MINT}: a fast and green synchronization technique},
  booktitle = {Proceedings of the 2011 companion on High Performance Computing Networking, Storage and Analysis Companion},
  series    = {SC '11 Companion},
  pages     = {23--24},
  numpages  = {2},
  year      = {2011},
  publisher = {ACM},
  address   = {New York, NY, USA},
  location  = {Seattle, Washington, USA},
  isbn      = {978-1-4503-1030-7},
  doi       = {10.1145/2148600.2148613},
  url       = {http://doi.acm.org/10.1145/2148600.2148613},
  acmid     = {2148613},
}
% NOTE(review): the exported volume (empty), number (0) and pages (" - ") were
% placeholders and have been dropped; add the real values once verified
% against the publisher record for the DOI below.
@article{Hori2012,
  author  = {Hori, Atsushi and
             Lee, Jinpil and
             Sato, Mitsuhisa},
  title   = {Audit: A new synchronization {API} for the {GET/PUT} protocol},
  journal = {Journal of Parallel and Distributed Computing},
  year    = {2012},
  issn    = {0743-7315},
  doi     = {10.1016/j.jpdc.2012.01.019},
  url     = {http://www.sciencedirect.com/science/article/pii/S0743731512000317},
}
@inproceedings{Hori-audit,
  author    = {Hori, Atsushi and
               Lee, Jinpil and
               Sato, Mitsuhisa},
  title     = {Audit: New Synchronization for the {GET/PUT} Protocol},
  booktitle = {The 1st Workshop on Communication Architecture for Scalable Systems},
  year      = {2011},
  month     = may,
}
@inproceedings{DBLP:conf/cluster/HoriKMOYSI09,
  author    = {Hori, Atsushi and
               Kamoshida, Yoshikazu and
               Matsuba, Hiroya and
               Ohta, Kazuki and
               Yasui, Takashi and
               Sumimoto, Shinji and
               Ishikawa, Yutaka},
  title     = {On-demand file staging system for {Linux} clusters},
  booktitle = {CLUSTER},
  year      = {2009},
  pages     = {1--10},
  doi       = {10.1109/CLUSTR.2009.5289189},
  ee        = {http://dx.doi.org/10.1109/CLUSTR.2009.5289189},
  crossref  = {DBLP:conf/cluster/2009},
  bibsource = {DBLP, http://dblp.uni-trier.de},
}
@inproceedings{Hori:2011:CCM:2117686.2118434,
  author    = {Hori, Atsushi and
               Yamamoto, Keiji and
               Ishikawa, Yutaka},
  title     = {{Catwalk-ROMIO}: A Cost-Effective {MPI-IO}},
  booktitle = {Proceedings of the 2011 IEEE 17th International Conference on Parallel and Distributed Systems},
  series    = {ICPADS '11},
  pages     = {120--126},
  numpages  = {7},
  year      = {2011},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA},
  isbn      = {978-0-7695-4576-9},
  doi       = {10.1109/ICPADS.2011.40},
  url       = {http://dx.doi.org/10.1109/ICPADS.2011.40},
  acmid     = {2118434},
  keywords  = {eScience Project},
}
@inproceedings{DBLP:conf/pvm/SumimotoNNKYKMHI09,
  author    = {Sumimoto, Shinji and
               Nakashima, Kohta and
               Naruse, Akira and
               Kumon, Kouichi and
               Yasui, Takashi and
               Kamoshida, Yoshikazu and
               Matsuba, Hiroya and
               Hori, Atsushi and
               Ishikawa, Yutaka},
  title     = {The Design of Seamless {MPI} Computing Environment for Commodity-Based
               Clusters},
  booktitle = {PVM/MPI},
  year      = {2009},
  pages     = {9--19},
  doi       = {10.1007/978-3-642-03770-2_8},
  ee        = {http://dx.doi.org/10.1007/978-3-642-03770-2_8},
  crossref  = {DBLP:conf/pvm/2009},
  bibsource = {DBLP, http://dblp.uni-trier.de},
  keywords  = {eScience Project},
}
@inproceedings{Sumimoto:2009:DSM:1612208.1612219,
  author    = {Sumimoto, Shinji and
               Nakashima, Kohta and
               Naruse, Akira and
               Kumon, Kouichi and
               Yasui, Takashi and
               Kamoshida, Yoshikazu and
               Matsuba, Hiroya and
               Hori, Atsushi and
               Ishikawa, Yutaka},
  title     = {The Design of Seamless {MPI} Computing Environment for Commodity-Based Clusters},
  booktitle = {Proceedings of the 16th European PVM/MPI Users' Group Meeting on Recent Advances in Parallel Virtual Machine and Message Passing Interface},
  pages     = {9--19},
  numpages  = {11},
  year      = {2009},
  publisher = {Springer-Verlag},
  address   = {Berlin, Heidelberg},
  location  = {Espoo, Finland},
  isbn      = {978-3-642-03769-6},
  doi       = {10.1007/978-3-642-03770-2_8},
  url       = {http://dx.doi.org/10.1007/978-3-642-03770-2_8},
  acmid     = {1612219},
  keywords  = {eScience Project},
}
@inproceedings{tezuka:96,
  author    = {Tezuka, Hiroshi and
               Hori, Atsushi and
               Ishikawa, Yutaka},
  title     = {{PM}: a high-performance communication library for multi-user parallel environments},
  booktitle = {Usenix'97},
  year      = {1997},
  url       = {http://citeseer.nj.nec.com/tezuka96pm.html},
}
@manual{pmx,
  author       = {Hori, Atsushi},
  title        = {{PMX} Specification --{DRAFT}--},
  organization = {Allinea Software},
  year         = {2009},
  url          = "http://www.pccluster.org/score\_doc/score-7.0.2/pdf/PMX-spec.pdf",
  keywords     = {Allinea Software},
}
@inproceedings{Hori:1998:HEG:509058.509100,
  author    = {Hori, Atsushi and
               Tezuka, Hiroshi and
               Ishikawa, Yutaka},
  title     = {Highly efficient gang scheduling implementation},
  booktitle = {Proceedings of the 1998 ACM/IEEE conference on Supercomputing (CDROM)},
  series    = {Supercomputing '98},
  pages     = {1--14},
  numpages  = {14},
  year      = {1998},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA},
  location  = {San Jose, CA},
  isbn      = {0-89791-984-X},
  url       = {http://dl.acm.org/citation.cfm?id=509058.509100},
  acmid     = {509100},
  keywords  = {RWCP Project},
}
@inproceedings{1998:PCV:876880.879528,
  author    = {Tezuka, Hiroshi and
               O'Carroll, Francis and
               Hori, Atsushi and
               Ishikawa, Yutaka},
  title     = {Pin-down Cache: A Virtual Memory Management Technique for Zero-copy Communication},
  booktitle = {Proceedings of the 12th International Parallel Processing Symposium},
  series    = {IPPS '98},
  pages     = {308--},
  year      = {1998},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA},
  url       = {http://dl.acm.org/citation.cfm?id=876880.879528},
  acmid     = {879528},
  keywords  = {RWCP Project},
}
@inproceedings{PM,
  author    = {Tezuka, Hiroshi and
               Hori, Atsushi and
               Ishikawa, Yutaka and
               Sato, Mitsuhisa},
  title     = {{PM}: An Operating System Coordinated High Performance Communication Library},
  booktitle = {Proceedings of the International Conference and Exhibition on High-Performance Computing and Networking},
  series    = {HPCN Europe '97},
  pages     = {708--717},
  numpages  = {10},
  year      = {1997},
  publisher = {Springer-Verlag},
  address   = {London, UK},
  isbn      = {3-540-62898-3},
  url       = {http://dl.acm.org/citation.cfm?id=645561.658906},
  acmid     = {658906},
  keywords  = {RWCP Project},
}
@inproceedings{DBLP:conf/cluster/Hori01,
  author    = {Hori, Atsushi},
  title     = {{SCore}: An Integrated Cluster System Software Package for
               High Performance Cluster Computing},
  booktitle = {CLUSTER},
  year      = {2001},
  pages     = {449--},
  ee        = {http://csdl.computer.org/comp/proceedings/cluster/2001/1116/00/11160449.pdf},
  crossref  = {DBLP:conf/cluster/2001},
  bibsource = {DBLP, http://dblp.uni-trier.de},
  keywords  = {RWCP Project},
}
@inproceedings{DBLP:conf/cluster/NishiokaHI00,
  author    = {Nishioka, Toshihiro and
               Hori, Atsushi and
               Ishikawa, Yutaka},
  title     = {Consistent Checkpointing for High Performance Clusters},
  booktitle = {CLUSTER},
  year      = {2000},
  pages     = {367--368},
  ee        = {http://doi.ieeecomputersociety.org/10.1109/CLUSTER.2000.10004},
  crossref  = {DBLP:conf/cluster/2000},
  bibsource = {DBLP, http://dblp.uni-trier.de},
  keywords  = {RWCP Project},
}
@inproceedings{DBLP:conf/hpdc/SumimotoTHHTI00,
  author    = {Sumimoto, Shinji and
               Tezuka, Hiroshi and
               Hori, Atsushi and
               Harada, Hiroshi and
               Takahashi, Toshiyuki and
               Ishikawa, Yutaka},
  title     = {High Performance Communication using a Commodity Network
               for Cluster Systems},
  booktitle = {HPDC},
  year      = {2000},
  pages     = {139--146},
  ee        = {http://computer.org/proceedings/hpdc/0783/07830139abs.htm},
  bibsource = {DBLP, http://dblp.uni-trier.de},
  keywords  = {RWCP Project},
}
@article{DBLP:journals/ngc/SumiotoTHHTI00,
  author    = {Sumimoto, Shinji and
               Tezuka, Hiroshi and
               Hori, Atsushi and
               Harada, Hiroshi and
               Takahashi, Toshiyuki and
               Ishikawa, Yutaka},
  title     = {{GigaE} {PM}: a High Performance Communication Facility using
               a {Gigabit Ethernet}},
  journal   = {New Generation Computing},
  volume    = {18},
  number    = {2},
  year      = {2000},
  pages     = {177--186},
  doi       = {10.1007/BF03037596},
  ee        = {http://dx.doi.org/10.1007/BF03037596},
  bibsource = {DBLP, http://dblp.uni-trier.de},
  keywords  = {RWCP Project},
}
@inproceedings{DBLP:conf/sc/TakahashiSHHI00,
  author    = {Takahashi, Toshiyuki and
               Sumimoto, Shinji and
               Hori, Atsushi and
               Harada, Hiroshi and
               Ishikawa, Yutaka},
  title     = {{PM2}: A High Performance Communication Middleware for Heterogeneous
               Network Environments},
  booktitle = {SC},
  year      = {2000},
  ee        = {http://www.supercomp.org/sc2000/Proceedings/techpapr/papers/pap205.pdf},
  bibsource = {DBLP, http://dblp.uni-trier.de},
  keywords  = {RWCP Project},
}
@inproceedings{DBLP:conf/hcw/IshikawaHTSTH99,
  author    = {Ishikawa, Yutaka and
               Hori, Atsushi and
               Tezuka, Hiroshi and
               Sumimoto, Shinji and
               Takahashi, Toshiyuki and
               Harada, Hiroshi},
  title     = {Parallel {C++} Programming System on Cluster of Heterogeneous
               Computers},
  booktitle = {Heterogeneous Computing Workshop},
  year      = {1999},
  pages     = {73--82},
  ee        = {http://computer.org/proceedings/hcw/0107/01070073abs.htm},
  bibsource = {DBLP, http://dblp.uni-trier.de},
  keywords  = {RWCP Project},
}
@inproceedings{DBLP:conf/ipps/TakahashiOTHSHIB99,
author = {Toshiyuki Takahashi and
Francis O'Carroll and
Hiroshi Tezuka and
Atsushi Hori and
Shinji Sumimoto and
Hiroshi Harada and
Yutaka Ishikawa and
Peter H. Beckman},
title = "{Implementation and Evaluation of MPI on an SMP Cluster}",
booktitle = {IPPS/SPDP Workshops},
year = {1999},
pages = {1178-1192},
ee = {http://dx.doi.org/10.1007/BFb0098001},
bibsource = {DBLP, http://dblp.uni-trier.de},