File tree Expand file tree Collapse file tree 2 files changed +5
-0
lines changed Expand file tree Collapse file tree 2 files changed +5
-0
lines changed Original file line number Diff line number Diff line change @@ -176,6 +176,7 @@ option(GGML_HIP_NO_VMM "ggml: do not try to use HIP VMM"
176
176
# Opt-in switch (default OFF): per its help text, enables rocWMMA for FlashAttention.
option(GGML_HIP_ROCWMMA_FATTN "ggml: enable rocWMMA for FlashAttention" OFF)
177
177
# Opt-in switch (default OFF): per its help text, enables rocWMMA FlashAttention on GFX12.
# NOTE(review): the HIP build file appears to test this option together with a
# hip_VERSION check before defining GGML_HIP_ROCWMMA_FATTN_GFX12 -- confirm there.
option(GGML_HIP_FORCE_ROCWMMA_FATTN_GFX12 "ggml: enable rocWMMA FlashAttention on GFX12" OFF)
178
178
# Enabled by default (ON): per its help text, turns on MFMA MMA for CDNA in MMQ.
option(GGML_HIP_MMQ_MFMA "ggml: enable MFMA MMA for CDNA in MMQ" ON)
179
# Opt-in switch (default OFF): per its help text, enables kernel perf metrics output.
# NOTE(review): the HIP build file appears to react to this by adding
# -Rpass-analysis=kernel-resource-usage and --save-temps to CMAKE_HIP_FLAGS -- confirm there.
option(GGML_HIP_EXPORT_METRICS "ggml: enable kernel perf metrics output" OFF)
179
180
# Opt-in switch (default OFF): use MUSA graphs. The help text itself marks this
# as experimental and unstable.
option(GGML_MUSA_GRAPHS "ggml: use MUSA graph, experimental, unstable" OFF)
180
181
# Opt-in switch (default OFF): per its help text, enables muDNN for accelerated copy.
option(GGML_MUSA_MUDNN_COPY "ggml: enable muDNN for accelerated copy" OFF)
181
182
# Opt-in switch (default OFF): per its help text, use Vulkan.
option(GGML_VULKAN "ggml: use Vulkan" OFF)
Original file line number Diff line number Diff line change @@ -121,6 +121,10 @@ if (GGML_HIP_FORCE_ROCWMMA_FATTN_GFX12 OR ${hip_VERSION} VERSION_GREATER_EQUAL 7
121
121
add_compile_definitions (GGML_HIP_ROCWMMA_FATTN_GFX12 )
122
122
endif ()
123
123
124
# Kernel metrics export: when GGML_HIP_EXPORT_METRICS is truthy, extend the HIP
# compiler flags with -Rpass-analysis=kernel-resource-usage and --save-temps.
# The leading space in the appended text keeps the new flags separated from
# whatever CMAKE_HIP_FLAGS already holds.
# NOTE(review): presumably the remark flag reports per-kernel resource usage and
# --save-temps keeps intermediate compiler outputs on disk -- confirm against
# the ROCm/Clang documentation.
if(GGML_HIP_EXPORT_METRICS)
    string(APPEND CMAKE_HIP_FLAGS " -Rpass-analysis=kernel-resource-usage --save-temps")
endif()
127
+
124
128
# When GGML_CUDA_FA is falsy (or unset), add the GGML_CUDA_NO_FA compile
# definition for the current directory scope.
# NOTE(review): presumably this compiles the FlashAttention kernels out -- verify
# against the sources that test GGML_CUDA_NO_FA.
if(NOT GGML_CUDA_FA)
    add_compile_definitions(GGML_CUDA_NO_FA)
endif()
You can’t perform that action at this time.
0 commit comments