Skip to content

Commit 1a45887

Browse files
gsitaramalazzaro
authored and committed
Add Mi300 arch
1 parent 24f88ba commit 1a45887

File tree

5 files changed

+453
-2
lines changed

5 files changed

+453
-2
lines changed

CMakeLists.txt

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -107,7 +107,7 @@ set(SUPPORTED_CUDA_ARCHITECTURES
107107
V100
108108
A100
109109
H100)
110-
set(SUPPORTED_HIP_ARCHITECTURES Mi50 Mi100 Mi250)
110+
set(SUPPORTED_HIP_ARCHITECTURES Mi50 Mi100 Mi250 Mi300)
111111
set(WITH_GPU
112112
$<IF:$<STREQUAL:${USE_ACCEL},"opencl">,"","P100">
113113
CACHE
@@ -247,6 +247,7 @@ if (USE_ACCEL MATCHES "cuda|hip")
247247
set(GPU_ARCH_NUMBER_Mi50 gfx906)
248248
set(GPU_ARCH_NUMBER_Mi100 gfx908)
249249
set(GPU_ARCH_NUMBER_Mi250 gfx90a)
250+
set(GPU_ARCH_NUMBER_Mi300 gfx942)
250251
endif ()
251252

252253
if (USE_ACCEL MATCHES "cuda")

docs/guide/2-user-guide/1-installation/index.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -72,7 +72,7 @@ make
7272
-DWITH_HIP_PROFILING=<OFF|ON>
7373
-DWITH_C_API=<ON|OFF>
7474
-DWITH_EXAMPLES=<ON|OFF>
75-
-DWITH_GPU=<P100|K20X|K40|K80|V100|Mi50|Mi100|Mi250>
75+
-DWITH_GPU=<P100|K20X|K40|K80|V100|A100|H100|Mi50|Mi100|Mi250|Mi300>
7676
-DCMAKE_BUILD_TYPE=<Release|Debug|Coverage>
7777
-DBUILD_TESTING=<ON|OFF>
7878
-DTEST_MPI_RANKS=<2|auto|N>

src/acc/libsmm_acc/kernels/gpu_properties.json

Lines changed: 15 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -209,5 +209,20 @@
209209
"Stream_Multiprocessors": 13312,
210210
"Memory_Size_(GB)": 128,
211211
"Memory_Interface_(bits)": 8192
212+
},
213+
"gfx942" : {
214+
"GPU_Architecture": "CDNA3",
215+
"Product_Names": ["Instinct MI300"],
216+
"Threads_/_Warp" : 64,
217+
"Warps_/_Multiprocessor": 32,
218+
"Threads_/_Multiprocessor": 2048,
219+
"Thread_Blocks_/_Multiprocessor": 32,
220+
"Max_Thread_Block_Size": 1024,
221+
"Max_Shared_Memory_/_Block_(bytes)": 64000,
222+
"Shared_Memory_/_Multiprocessor_(bytes)": 64000,
223+
"Compute_Units": 304,
224+
"Stream_Multiprocessors": 19456,
225+
"Memory_Size_(GB)": 128,
226+
"Memory_Interface_(bits)": 8192
212227
}
213228
}

src/acc/libsmm_acc/kernels/smm_acc.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -64,6 +64,7 @@
6464
"parameters_Mi50.json": "gfx906",
6565
"parameters_Mi100.json": "gfx908",
6666
"parameters_Mi250.json": "gfx90a",
67+
"parameters_Mi300.json": "gfx942",
6768
}
6869

6970

0 commit comments

Comments
 (0)