Skip to content

Commit 34e4567

Browse files
gsitaramalazzaro
authored and committed
Add gfx950 (Mi350) GPU architecture support
- Add Mi350 to SUPPORTED_HIP_ARCHITECTURES in CMakeLists.txt
- Add GPU_ARCH_NUMBER_Mi350 mapping to gfx950
- Create parameters_Mi350.json parameter file
- Add gfx950 to gpu_architectures dictionary in smm_acc.py
- Add gfx950 GPU properties to gpu_properties.json (CDNA4, MI350X)
- Update installation documentation to include Mi350
1 parent 634c6e5 commit 34e4567

File tree

5 files changed

+457
-6
lines changed

5 files changed

+457
-6
lines changed

CMakeLists.txt

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -110,7 +110,7 @@ set(SUPPORTED_CUDA_ARCHITECTURES
110110
V100
111111
A100
112112
H100)
113-
set(SUPPORTED_HIP_ARCHITECTURES Mi50 Mi100 Mi250 Mi300)
113+
set(SUPPORTED_HIP_ARCHITECTURES Mi50 Mi100 Mi250 Mi300 Mi350)
114114
set(WITH_GPU
115115
$<IF:$<STREQUAL:${USE_ACCEL},"opencl">,"","P100">
116116
CACHE
@@ -272,6 +272,7 @@ if (USE_ACCEL MATCHES "cuda|hip")
272272
set(GPU_ARCH_NUMBER_Mi100 gfx908)
273273
set(GPU_ARCH_NUMBER_Mi250 gfx90a)
274274
set(GPU_ARCH_NUMBER_Mi300 gfx942)
275+
set(GPU_ARCH_NUMBER_Mi350 gfx950)
275276
endif ()
276277

277278
if (USE_ACCEL MATCHES "cuda")

docs/guide/2-user-guide/1-installation/index.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -72,7 +72,7 @@ make
7272
-DWITH_HIP_PROFILING=<OFF|ON>
7373
-DWITH_C_API=<ON|OFF>
7474
-DWITH_EXAMPLES=<ON|OFF>
75-
-DWITH_GPU=<P100|K20X|K40|K80|V100|Mi50|Mi100|Mi250|Mi300>
75+
-DWITH_GPU=<P100|K20X|K40|K80|V100|Mi50|Mi100|Mi250|Mi300|Mi350>
7676
-DCMAKE_BUILD_TYPE=<Release|Debug|Coverage>
7777
-DBUILD_TESTING=<ON|OFF>
7878
-DTEST_MPI_RANKS=<2|auto|N>

src/acc/libsmm_acc/kernels/gpu_properties.json

Lines changed: 19 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -211,18 +211,33 @@
211211
"Memory_Interface_(bits)": 8192
212212
},
213213
"gfx942" : {
214-
"GPU_Architecture": "CDNA2",
215-
"Product_Names": ["Instinct MI300"],
214+
"GPU_Architecture": "CDNA3",
215+
"Product_Names": ["Instinct MI300A"],
216216
"Threads_/_Warp" : 64,
217217
"Warps_/_Multiprocessor": 32,
218218
"Threads_/_Multiprocessor": 2048,
219219
"Thread_Blocks_/_Multiprocessor": 32,
220220
"Max_Thread_Block_Size": 1024,
221221
"Max_Shared_Memory_/_Block_(bytes)": 64000,
222222
"Shared_Memory_/_Multiprocessor_(bytes)": 64000,
223-
"Compute_Units": 304,
224-
"Stream_Multiprocessors": 304,
223+
"Compute_Units": 228,
224+
"Stream_Multiprocessors": 14592,
225225
"Memory_Size_(GB)": 128,
226226
"Memory_Interface_(bits)": 8192
227+
},
228+
"gfx950" : {
229+
"GPU_Architecture": "CDNA4",
230+
"Product_Names": ["Instinct MI350X"],
231+
"Threads_/_Warp" : 64,
232+
"Warps_/_Multiprocessor": 32,
233+
"Threads_/_Multiprocessor": 2048,
234+
"Thread_Blocks_/_Multiprocessor": 32,
235+
"Max_Thread_Block_Size": 1024,
236+
"Max_Shared_Memory_/_Block_(bytes)": 64000,
237+
"Shared_Memory_/_Multiprocessor_(bytes)": 64000,
238+
"Compute_Units": 256,
239+
"Stream_Multiprocessors": 16384,
240+
"Memory_Size_(GB)": 288,
241+
"Memory_Interface_(bits)": 8192
227242
}
228243
}

src/acc/libsmm_acc/kernels/smm_acc.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -65,6 +65,7 @@
6565
"parameters_Mi100.json": "gfx908",
6666
"parameters_Mi250.json": "gfx90a",
6767
"parameters_Mi300.json": "gfx942",
68+
"parameters_Mi350.json": "gfx950",
6869
}
6970

7071

0 commit comments

Comments
 (0)