File tree Expand file tree Collapse file tree 2 files changed +5
-0
lines changed Expand file tree Collapse file tree 2 files changed +5
-0
lines changed Original file line number Diff line number Diff line change @@ -176,6 +176,7 @@ option(GGML_HIP_NO_VMM                      "ggml: do not try to use HIP VMM"
176176option (GGML_HIP_ROCWMMA_FATTN               "ggml: enable rocWMMA for FlashAttention"          OFF )
177177option (GGML_HIP_FORCE_ROCWMMA_FATTN_GFX12   "ggml: enable rocWMMA FlashAttention on GFX12"     OFF )
178178option (GGML_HIP_MMQ_MFMA                    "ggml: enable MFMA MMA for CDNA in MMQ"            ON )
179+ option (GGML_HIP_EXPORT_METRICS              "ggml: enable kernel perf metrics output"          OFF )
179180option (GGML_MUSA_GRAPHS                     "ggml: use MUSA graph, experimental, unstable"     OFF )
180181option (GGML_MUSA_MUDNN_COPY                 "ggml: enable muDNN for accelerated copy"          OFF )
181182option (GGML_VULKAN                          "ggml: use Vulkan"                                 OFF )
Original file line number Diff line number Diff line change @@ -121,6 +121,10 @@ if (GGML_HIP_FORCE_ROCWMMA_FATTN_GFX12 OR ${hip_VERSION} VERSION_GREATER_EQUAL 7
121121    add_compile_definitions (GGML_HIP_ROCWMMA_FATTN_GFX12)
122122endif ()
123123
124+ if  (GGML_HIP_EXPORT_METRICS)
125+     set (CMAKE_HIP_FLAGS "${CMAKE_HIP_FLAGS}  -Rpass-analysis=kernel-resource-usage --save-temps" )
126+ endif ()
127+ 
124128if  (NOT  GGML_CUDA_FA)
125129    add_compile_definitions (GGML_CUDA_NO_FA)
126130endif ()
    
 
   
 
     
   
   
          
     
  
    
     
 
    
      
     
 
     
    You can’t perform that action at this time.
  
 
    
  
     
    
      
        
     
 
       
      
     
   
 
    
    
  
 
  
 
     
    
0 commit comments