-
Notifications
You must be signed in to change notification settings - Fork 0
/
references.bib
185 lines (170 loc) · 7.66 KB
/
references.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
% Nikolopoulos et al. (2001): journal article on memory affinity in OpenMP.
% The acronym in the title is brace-protected so that sentence-casing
% bibliography styles do not lowercase it.
@article{nikolopoulos2001exploiting,
  author    = {Nikolopoulos, Dimitrios S. and Artiaga, Ernest and Ayguad{\'e}, Eduard and Labarta, Jes{\'u}s},
  title     = {Exploiting Memory Affinity in {OpenMP} through Schedule Reuse},
  journal   = {ACM SIGARCH Computer Architecture News},
  volume    = {29},
  number    = {5},
  pages     = {49--55},
  year      = {2001},
  publisher = {ACM}
}
% Su et al. (2011): workshop paper (PMBS '11) on thread placement for NUMA.
% "address" is the publisher's city; "location" is the workshop venue.
% The acronym in the title is brace-protected against sentence-casing styles.
@inproceedings{Su:2011,
  author    = {Su, ChunYi and Li, Dong and Nikolopoulos, Dimitrios and Grove, Matthew and Cameron, Kirk W. and de Supinski, Bronis R.},
  title     = {Critical Path-based Thread Placement for {NUMA} Systems},
  booktitle = {Proceedings of the Second International Workshop on Performance Modeling, Benchmarking and Simulation of High Performance Computing Systems},
  series    = {PMBS '11},
  year      = {2011},
  isbn      = {978-1-4503-1102-1},
  location  = {Seattle, Washington, USA},
  pages     = {19--20},
  numpages  = {2},
  url       = {http://doi.acm.org/10.1145/2088457.2088471},
  doi       = {10.1145/2088457.2088471},
  acmid     = {2088471},
  publisher = {ACM},
  address   = {New York, NY, USA},
  keywords  = {NUMA, critical path, multicore processors, openMP, shared resource contention, thread placement},
}
% Broquedis et al. (2009): paper in an edited LNCS volume (vol. 5568).
% Accented letters use LaTeX escapes in BibTeX "special character" form so the
% entry sorts and renders correctly under classic 8-bit BibTeX as well as Biber.
% Acronyms in the title are brace-protected against sentence-casing styles.
@incollection{Matthias:2009,
  author    = {Broquedis, Fran{\c{c}}ois and Furmento, Nathalie and Goglin, Brice and Namyst, Raymond and Wacrenier, Pierre-Andr{\'e}},
  editor    = {M{\"u}ller, Matthias S. and de Supinski, Bronis R. and Chapman, Barbara M.},
  title     = {Dynamic Task and Data Placement over {NUMA} Architectures: An {OpenMP} Runtime Perspective},
  booktitle = {Evolving {OpenMP} in an Age of Extreme Parallelism},
  series    = {Lecture Notes in Computer Science},
  volume    = {5568},
  pages     = {79--92},
  year      = {2009},
  publisher = {Springer Berlin Heidelberg},
  isbn      = {978-3-642-02284-5},
  doi       = {10.1007/978-3-642-02303-3_7},
  url       = {http://dx.doi.org/10.1007/978-3-642-02303-3_7},
  keywords  = {OpenMP; Memory; NUMA; Hierarchical Thread Scheduling; Multi-Core},
  language  = {English}
}
% Diener et al. (2010): HPCC 2010 conference paper on thread placement.
% "month" uses the predefined three-letter macro (unquoted) so the style can
% format and localise it; the page range uses an en-dash (double hyphen).
@inproceedings{5581451,
  author    = {Diener, M. and Madruga, F. L. and Rodrigues, E. R. and Alves, M. A. Z. and Schneider, J. and Navaux, P. O. A. and Heiss, H.-U.},
  title     = {Evaluating Thread Placement Based on Memory Access Patterns for Multi-core Processors},
  booktitle = {High Performance Computing and Communications (HPCC), 2010 12th IEEE International Conference on},
  year      = {2010},
  month     = sep,
  pages     = {491--496},
  keywords  = {message passing;multi-threading;parallel machines;shared memory systems;storage management;OpenMP;Pthreads;cluster computers;data sharing pattern;heterogeneous interconnect;implicit communication;memory access pattern;multicore processors;parallel machine;process placement;shared-memory environment;thread mapping;thread placement;memory access patterns;multi-core processor;process mapping;shared cache;thread placement},
  doi       = {10.1109/HPCC.2010.114},
}
% Wittmann and Hager (2011): arXiv preprint (CoRR abs/1101.0093), DBLP export.
% All acronyms in the title are brace-protected against sentence-casing styles.
% The arXiv identifier is also given in the eprint fields; styles that do not
% know these fields simply ignore them.
@article{DBLP:journals2011,
  author        = {Wittmann, Markus and Hager, Georg},
  title         = {Optimizing {ccNUMA} Locality for Task-Parallel Execution under {OpenMP} and {TBB} on Multicore-Based Systems},
  journal       = {CoRR},
  volume        = {abs/1101.0093},
  year          = {2011},
  eprint        = {1101.0093},
  archiveprefix = {arXiv},
  url           = {http://arxiv.org/abs/1101.0093},
  timestamp     = {Mon, 05 Dec 2011 18:05:15 +0100},
  biburl        = {http://dblp.uni-trier.de/rec/bib/journals/corr/abs-1101-0093},
  bibsource     = {dblp computer science bibliography, http://dblp.org}
}
% Bull and Johnson (2002): workshop paper on data placement for ccNUMA.
% The booktitle holds only the proceedings name: bibliography styles insert
% the leading "In" themselves, so it must not be hard-coded in the field.
@inproceedings{Bull02,
  author    = {Bull, J. Mark and Johnson, Chris},
  title     = {Data Distribution, Migration and Replication on a {ccNUMA} Architecture},
  booktitle = {Proceedings of the Fourth European Workshop on {OpenMP}},
  year      = {2002}
}
% Terboven et al. (2008): workshop paper (MAW '08) on data and thread affinity.
% "OpenMP" is spelled with its proper capitalisation and brace-protected so
% sentence-casing styles leave it intact.
@inproceedings{Terboven:2008,
  author    = {Terboven, Christian and an Mey, Dieter and Schmidl, Dirk and Jin, Henry and Reichstein, Thomas},
  title     = {Data and Thread Affinity in {OpenMP} Programs},
  booktitle = {Proceedings of the 2008 Workshop on Memory Access on Future Processors: A Solved Problem?},
  series    = {MAW '08},
  year      = {2008},
  isbn      = {978-1-60558-091-3},
  location  = {Ischia, Italy},
  pages     = {377--384},
  numpages  = {8},
  url       = {http://doi.acm.org/10.1145/1366219.1366222},
  doi       = {10.1145/1366219.1366222},
  acmid     = {1366222},
  publisher = {ACM},
  address   = {New York, NY, USA},
  keywords  = {affinity, binding, ccnuma, migration, openmp},
}
% Goglin and Furmento (2009): IPDPS '09 paper on memory migration on Linux.
% "Linux" is brace-protected so sentence-casing styles keep its capital;
% the ampersand in the booktitle is escaped and spaced as a normal word.
@inproceedings{Goglin:2009,
  author    = {Goglin, Brice and Furmento, Nathalie},
  title     = {Enabling High-performance Memory Migration for Multithreaded Applications on {Linux}},
  booktitle = {Proceedings of the 2009 {IEEE} International Symposium on Parallel \& Distributed Processing},
  series    = {IPDPS '09},
  year      = {2009},
  isbn      = {978-1-4244-3751-1},
  pages     = {1--9},
  numpages  = {9},
  url       = {http://dx.doi.org/10.1109/IPDPS.2009.5161101},
  doi       = {10.1109/IPDPS.2009.5161101},
  acmid     = {1587742},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA},
}
% Yang et al. (2008): I-SPAN 2008 paper on memory/thread placement effects.
% "month" uses the predefined three-letter macro (unquoted); the page range
% uses an en-dash; product and program names in the title are brace-protected
% so sentence-casing styles keep their capitalisation.
@inproceedings{4520191,
  author    = {Yang, R. and Antony, J. and Janes, P. P. and Rendell, A. P.},
  title     = {Memory and Thread Placement Effects as a Function of Cache Usage: A Study of the {Gaussian} Chemistry Code on the {SunFire} {X4600} {M2}},
  booktitle = {Parallel Architectures, Algorithms, and Networks, 2008. I-SPAN 2008. International Symposium on},
  year      = {2008},
  month     = may,
  pages     = {31--36},
  keywords  = {cache storage;chemistry computing;Gaussian 03 computational chemistry code;Sunfire X4600 M2;cache blocking;cache usage;memory-thread placement;multicore shared memory parallel system;Bandwidth;Central Processing Unit;Chemistry;Concurrent computing;Delay;Hafnium;Libraries;Multicore processing;Parallel architectures;Yarn},
  doi       = {10.1109/I-SPAN.2008.13},
  issn      = {1087-4089},
}
% Norden et al. (2008): paper in the edited IWOMP 2005/2006 proceedings volume.
% A separately authored contribution to an edited book is an incollection:
% "title" is the paper, "booktitle" is the volume, and the editors are printed.
% Acronyms in the title are brace-protected against sentence-casing styles.
@incollection{Norden:2008,
  author    = {Nord{\'e}n, Markus and L{\"o}f, Henrik and Rantakokko, Jarmo and Holmgren, Sverker},
  editor    = {Mueller, Matthias S. and Chapman, Barbara M. and de Supinski, Bronis R. and Malony, Allen D. and Voss, Michael},
  title     = {Geographical Locality and Dynamic Data Migration for {OpenMP} Implementations of Adaptive {PDE} Solvers},
  booktitle = {{OpenMP} Shared Memory Parallel Programming: International Workshops, {IWOMP} 2005 and {IWOMP} 2006, Eugene, OR, USA, June 1--4, 2005, Reims, France, June 12--15, 2006. Proceedings},
  year      = {2008},
  publisher = {Springer Berlin Heidelberg},
  address   = {Berlin, Heidelberg},
  pages     = {382--393},
  isbn      = {978-3-540-68555-5},
  doi       = {10.1007/978-3-540-68555-5_31},
  url       = {http://dx.doi.org/10.1007/978-3-540-68555-5_31}
}
% Smeds (2003): paper in the edited WOMPAT 2003 proceedings volume.
% A separately authored contribution to an edited book is an incollection:
% "title" is the paper, "booktitle" is the volume, and the editor is printed.
% The acronym in the title is brace-protected against sentence-casing styles.
@incollection{Smeds2003,
  author    = {Smeds, Nils},
  editor    = {Voss, Michael J.},
  title     = {{OpenMP} Application Tuning Using Hardware Performance Counters},
  booktitle = {{OpenMP} Shared Memory Parallel Programming: International Workshop on {OpenMP} Applications and Tools, {WOMPAT} 2003 Toronto, Canada, June 26--27, 2003 Proceedings},
  year      = {2003},
  publisher = {Springer Berlin Heidelberg},
  address   = {Berlin, Heidelberg},
  pages     = {260--270},
  isbn      = {978-3-540-45009-2},
  doi       = {10.1007/3-540-45009-2_20},
  url       = {http://dx.doi.org/10.1007/3-540-45009-2_20}
}
% Marathe and Mueller (2006): PPoPP '06 paper on automatic page placement.
% "address" is the publisher's city; "location" is the conference venue.
% The acronym in the title is brace-protected against sentence-casing styles.
@inproceedings{Marathe:2006,
  author    = {Marathe, Jaydeep and Mueller, Frank},
  title     = {Hardware Profile-guided Automatic Page Placement for {ccNUMA} Systems},
  booktitle = {Proceedings of the Eleventh {ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming},
  series    = {PPoPP '06},
  year      = {2006},
  isbn      = {1-59593-189-9},
  location  = {New York, New York, USA},
  pages     = {90--99},
  numpages  = {10},
  url       = {http://doi.acm.org/10.1145/1122971.1122987},
  doi       = {10.1145/1122971.1122987},
  acmid     = {1122987},
  publisher = {ACM},
  address   = {New York, NY, USA},
  keywords  = {NUMA, hardware performance monitoring, page placement, profile-guided optimization},
}
% Caldeira et al. (2014): IBM Redbooks technical overview, cited as a web
% resource with its access date. Product names in the title are
% brace-protected so sentence-casing styles keep their capitalisation.
@online{IBM_P8,
  author  = {Caldeira, Alexandre Bicas and Haug, Volker and Kahle, Marc-Eric and Maciel, Cesar Diniz and Sanchez, Monica},
  title   = {{IBM} Power Systems {S812L} and {S822L} Technical Overview and Introduction},
  year    = {2014},
  url     = {http://www.redbooks.ibm.com/Redbooks.nsf/RedbookAbstracts/redp5098.html?Open},
  urldate = {2016-03-17}
}