Skip to content

Commit 7ad67ba

Browse files
authored
HIP: add cmake option to enable compiler output of kernel resource usage metrics (#15103)
1 parent 9a96389 commit 7ad67ba

File tree

2 files changed

+5
-0
lines changed

2 files changed

+5
-0
lines changed

ggml/CMakeLists.txt

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -176,6 +176,7 @@ option(GGML_HIP_NO_VMM "ggml: do not try to use HIP VMM"
176176
option(GGML_HIP_ROCWMMA_FATTN "ggml: enable rocWMMA for FlashAttention" OFF)
177177
option(GGML_HIP_FORCE_ROCWMMA_FATTN_GFX12 "ggml: enable rocWMMA FlashAttention on GFX12" OFF)
178178
option(GGML_HIP_MMQ_MFMA "ggml: enable MFMA MMA for CDNA in MMQ" ON)
179+
# Opt-in diagnostic switch (OFF by default). When ON, ggml/src/ggml-hip/CMakeLists.txt
# appends -Rpass-analysis=kernel-resource-usage and --save-temps to CMAKE_HIP_FLAGS.
option(GGML_HIP_EXPORT_METRICS "ggml: enable kernel perf metrics output" OFF)
179180
option(GGML_MUSA_GRAPHS "ggml: use MUSA graph, experimental, unstable" OFF)
180181
option(GGML_MUSA_MUDNN_COPY "ggml: enable muDNN for accelerated copy" OFF)
181182
option(GGML_VULKAN "ggml: use Vulkan" OFF)

ggml/src/ggml-hip/CMakeLists.txt

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -121,6 +121,10 @@ if (GGML_HIP_FORCE_ROCWMMA_FATTN_GFX12 OR ${hip_VERSION} VERSION_GREATER_EQUAL 7
121121
add_compile_definitions(GGML_HIP_ROCWMMA_FATTN_GFX12)
122122
endif()
123123

124+
if (GGML_HIP_EXPORT_METRICS)
125+
# Extend the existing HIP compile flags in place instead of rebuilding the whole string.
# NOTE(review): presumably -Rpass-analysis=kernel-resource-usage makes the compiler print
# per-kernel resource usage remarks and --save-temps keeps intermediate files - confirm
# against the ROCm/Clang documentation.
string(APPEND CMAKE_HIP_FLAGS " -Rpass-analysis=kernel-resource-usage --save-temps")
126+
endif()
127+
124128
if (NOT GGML_CUDA_FA)
125129
add_compile_definitions(GGML_CUDA_NO_FA)
126130
endif()

0 commit comments

Comments
 (0)