-
Notifications
You must be signed in to change notification settings - Fork 1
/
gpu_programming_bpg.bib
209 lines (201 loc) · 6.36 KB
/
gpu_programming_bpg.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
% General background web references: processor trend data, GPUs, TOP500/Green500 lists, and a Q&A thread.
@misc{microprocessor-trend-data,
  howpublished = {\url{https://github.com/karlrupp/microprocessor-trend-data}},
}

@misc{gpu_wiki,
  howpublished = {\url{https://en.wikipedia.org/wiki/Graphics_processing_unit}},
}

@misc{top500_1,
  howpublished = {\url{https://en.wikipedia.org/wiki/TOP500}},
}

@misc{top500_2,
  howpublished = {\url{https://www.top500.org/lists/top500/2023/06/}},
}

@misc{green500,
  howpublished = {\url{https://www.top500.org/lists/green500/}},
}

@misc{stackexchange,
  howpublished = {\url{https://scicomp.stackexchange.com/questions/943}},
}
% Journal article. Acronyms in the title are brace-protected so that styles which
% sentence-case titles keep them upper-case; author initials are separated so that
% abbreviating styles keep every initial; the journal is stored under its full name.
@article{barca2021faster,
  author  = {Barca, Giuseppe M. J. and Alkan, Melisa and Galvez-Vallejo, Jorge L. and Poole, David L. and Rendell, Alistair P. and Gordon, Mark S.},
  title   = {Faster self-consistent field ({SCF}) calculations on {GPU} clusters},
  journal = {Journal of Chemical Theory and Computation},
  volume  = {17},
  pages   = {7486--7503},
  year    = {2021},
}
% NVIDIA developer blog post. The acronym in the title is brace-protected so that
% styles which sentence-case titles do not print it as "cuda".
@misc{indexing,
  title        = {An Even Easier Introduction to {CUDA}},
  howpublished = {\url{https://developer.nvidia.com/blog/even-easier-introduction-cuda/}},
}
% NVIDIA HPC SDK and the developer blog posts on standard C++ / Fortran GPU acceleration.
@misc{NVIDIA_SDK,
  howpublished = {\url{https://developer.nvidia.com/hpc-sdk}},
}

@misc{guideline_gpu_cpp,
  howpublished = {\url{https://developer.nvidia.com/blog/accelerating-standard-c-with-gpus-using-stdpar/}},
}

@misc{guideline_gpu_fortran,
  howpublished = {\url{https://developer.nvidia.com/blog/accelerating-fortran-do-concurrent-with-gpus-and-the-nvidia-hpc-sdk/}},
}
% GPU programming models and portability layers (project home pages and repositories).
@misc{openacc,
  howpublished = {\url{https://www.openacc.org/}},
}

@misc{openmp,
  howpublished = {\url{https://www.openmp.org/}},
}

@misc{cuda,
  howpublished = {\url{https://developer.nvidia.com/cuda-toolkit}},
}

@misc{hip,
  howpublished = {\url{https://github.com/ROCm-Developer-Tools/HIP}},
}

@misc{alpaka,
  howpublished = {\url{https://alpaka.readthedocs.io/en/latest/}},
}

@misc{kokkos,
  howpublished = {\url{https://github.com/kokkos/kokkos}},
}

@misc{OpenCL,
  howpublished = {\url{https://www.khronos.org/opencl/}},
}

@misc{raja,
  howpublished = {\url{https://github.com/LLNL/RAJA}},
}

@misc{sycl,
  howpublished = {\url{https://www.khronos.org/sycl/}},
}
% Intel oneAPI DPC++ compiler page. The address is stored without any trailing
% share-tracking fragment, which also avoids an escaped hash sign inside \url.
@misc{oneapi-dpc,
  howpublished = {\url{https://www.intel.com/content/www/us/en/developer/tools/oneapi/dpc-compiler.html}},
}
% SYCL implementations and vendor plug-ins.
@misc{codeplay-oneapi,
  howpublished = {\url{https://codeplay.com/solutions/oneapi/}},
}

@misc{hipsycl,
  howpublished = {\url{https://github.com/OpenSYCL/OpenSYCL}},
}

@misc{trisycl,
  howpublished = {\url{https://github.com/triSYCL/triSYCL}},
}

@misc{computecpp,
  howpublished = {\url{https://developer.codeplay.com/products/computecpp/ce/home/}},
}
% Python GPU and data libraries, plus a reference page on JIT compilation.
@misc{cupy,
  howpublished = {\url{https://cupy.dev/}},
}

@misc{cudf,
  howpublished = {\url{https://github.com/rapidsai/cudf}},
}

@misc{rapids,
  howpublished = {\url{https://rapids.ai/}},
}

@misc{pycuda,
  howpublished = {\url{https://documen.tician.de/pycuda/}},
}

@misc{numba,
  howpublished = {\url{https://numba.pydata.org/}},
}

@misc{pandas,
  howpublished = {\url{https://pandas.pydata.org/}},
}

@misc{jit,
  howpublished = {\url{https://www.ibm.com/docs/en/sdk-java-technology/8?topic=reference-jit-compiler}},
}
% Julia language and its GPU back-end packages.
@misc{cudajl,
  howpublished = {\url{https://cuda.juliagpu.org/stable/}},
}

@misc{amdgpujl,
  howpublished = {\url{https://amdgpu.juliagpu.org/stable/}},
}

@misc{oneapijl,
  howpublished = {\url{https://github.com/JuliaGPU/oneAPI.jl}},
}

@misc{metaljl,
  howpublished = {\url{https://github.com/JuliaGPU/Metal.jl}},
}

@misc{julia,
  howpublished = {\url{https://julialang.org/}},
}
% Frameworks, numerical environments, driver downloads, and benchmarking tools.
@misc{pytorch,
  howpublished = {\url{https://pytorch.org/}},
}

@misc{matlab,
  howpublished = {\url{https://www.mathworks.com/products/matlab.html}},
}

@misc{tensorflow,
  howpublished = {\url{https://www.tensorflow.org/}},
}

@misc{rproject,
  howpublished = {\url{https://www.r-project.org/}},
}

@misc{nvidia_driver,
  howpublished = {\url{https://www.nvidia.com/Download/index.aspx}},
}

@misc{benchmarktools,
  howpublished = {\url{https://github.com/JuliaCI/BenchmarkTools.jl}},
}
% GPU-aware MPI, the OpenACC specification, GPUDirect RDMA, lesson examples, and GPU hardware pages.
@misc{gpu_aware_mpi,
  howpublished = {\url{https://docs.open-mpi.org/en/v5.0.0rc9/networking/cuda.html}},
}

@misc{openacc_u_device,
  howpublished = {\url{https://www.openacc.org/sites/default/files/inline-images/Specification/OpenACC-3.2-final.pdf}},
}

@misc{gpudirect-rdma,
  howpublished = {\url{https://docs.nvidia.com/cuda/gpudirect-rdma/index.html}},
}

@misc{gpu-programming-examples,
  howpublished = {\url{https://github.com/ENCCS/gpu-programming/tree/main/content/examples}},
}

@misc{nvidia_hopper,
  howpublished = {\url{https://www.nvidia.com/en-us/data-center/technologies/hopper-architecture/}},
}

@misc{amd_mi300,
  howpublished = {\url{https://www.semianalysis.com/p/amd-mi300-taming-the-hype-ai-performance}},
}
% Matrix transpose: definition and NVIDIA material on implementing it in CUDA.
@misc{matrix_transpose,
  howpublished = {\url{https://en.wikipedia.org/wiki/Transpose}},
}

@misc{matrix_transpose_efficient,
  howpublished = {\url{https://developer.nvidia.com/blog/efficient-matrix-transpose-cuda-cc/}},
}

@misc{matrix_transpose_advanced,
  howpublished = {\url{https://developer.download.nvidia.com/compute/DevZone/C/html_x64/6_Advanced/transpose/doc/MatrixTranspose.pdf}},
}
% Kokkos documentation, Khronos, the Intel oneAPI toolkit, HIPIFY, and the Clacc project.
@misc{kokkos_sandia,
  howpublished = {\url{https://www.sandia.gov/ccr/software/kokkos/}},
}

@misc{kokkos_compiling,
  howpublished = {\url{https://kokkos.github.io/kokkos-core-wiki/ProgrammingGuide/Compiling.html}},
}

@misc{khronos_group,
  howpublished = {\url{https://www.khronos.org/}},
}

@misc{intel_oneapi_base_toolkit,
  howpublished = {\url{https://www.intel.com/content/www/us/en/developer/tools/oneapi/base-toolkit.html}},
}

@misc{hipify,
  howpublished = {\url{https://github.com/ROCm-Developer-Tools/HIPIFY}},
}

@misc{clacc,
  howpublished = {\url{https://csmd.ornl.gov/project/clacc}},
}

@misc{llvm_project,
  howpublished = {\url{https://github.com/llvm-doe-org/llvm-project/tree/clacc/main}},
}
% PRACE best-practice guides and the Wikipedia article on high-performance computing.
@misc{prace-bpg,
  howpublished = {\url{https://prace-ri.eu/training-support/best-practice-guides/}},
}

@misc{modern-processors,
  howpublished = {\url{https://prace-ri.eu/training-support/best-practice-guides/modern-processors/}},
}

@misc{modern-accelerators,
  howpublished = {\url{https://prace-ri.eu/training-support/best-practice-guides/modern-accelerators/}},
}

@misc{gpgpu,
  howpublished = {\url{https://prace-ri.eu/training-support/best-practice-guides/best-practice-guide-gpgpu/}},
}

@misc{hpc,
  howpublished = {\url{https://en.wikipedia.org/wiki/High-performance_computing}},
}
@comment{
  Template for a new web reference (kept inert so it is never parsed as an entry).
  Copy the lines below, put an at-sign in front of misc, and replace KEY and URL.

  misc{KEY,
    howpublished = {\url{URL}},
  }
}