uvos committed on
Commit
577f7e4
·
1 Parent(s): f84562e

HIP: add cmake option to enable compiler output of kernel resource usage metrics (llama/15103)

Browse files
ggml/CMakeLists.txt CHANGED
@@ -176,6 +176,7 @@ option(GGML_HIP_NO_VMM "ggml: do not try to use HIP VMM"
176
  option(GGML_HIP_ROCWMMA_FATTN "ggml: enable rocWMMA for FlashAttention" OFF)
177
  option(GGML_HIP_FORCE_ROCWMMA_FATTN_GFX12 "ggml: enable rocWMMA FlashAttention on GFX12" OFF)
178
  option(GGML_HIP_MMQ_MFMA "ggml: enable MFMA MMA for CDNA in MMQ" ON)
 
179
  option(GGML_MUSA_GRAPHS "ggml: use MUSA graph, experimental, unstable" OFF)
180
  option(GGML_MUSA_MUDNN_COPY "ggml: enable muDNN for accelerated copy" OFF)
181
  option(GGML_VULKAN "ggml: use Vulkan" OFF)
 
176
  option(GGML_HIP_ROCWMMA_FATTN "ggml: enable rocWMMA for FlashAttention" OFF)
177
  option(GGML_HIP_FORCE_ROCWMMA_FATTN_GFX12 "ggml: enable rocWMMA FlashAttention on GFX12" OFF)
178
  option(GGML_HIP_MMQ_MFMA "ggml: enable MFMA MMA for CDNA in MMQ" ON)
179
+ option(GGML_HIP_EXPORT_METRICS "ggml: enable kernel perf metrics output" OFF)
180
  option(GGML_MUSA_GRAPHS "ggml: use MUSA graph, experimental, unstable" OFF)
181
  option(GGML_MUSA_MUDNN_COPY "ggml: enable muDNN for accelerated copy" OFF)
182
  option(GGML_VULKAN "ggml: use Vulkan" OFF)
ggml/src/ggml-hip/CMakeLists.txt CHANGED
@@ -121,6 +121,10 @@ if (GGML_HIP_FORCE_ROCWMMA_FATTN_GFX12 OR ${hip_VERSION} VERSION_GREATER_EQUAL 7
121
  add_compile_definitions(GGML_HIP_ROCWMMA_FATTN_GFX12)
122
  endif()
123
 
 
 
 
 
124
  if (NOT GGML_CUDA_FA)
125
  add_compile_definitions(GGML_CUDA_NO_FA)
126
  endif()
 
121
  add_compile_definitions(GGML_HIP_ROCWMMA_FATTN_GFX12)
122
  endif()
123
 
124
+ if (GGML_HIP_EXPORT_METRICS)
125
+ set(CMAKE_HIP_FLAGS "${CMAKE_HIP_FLAGS} -Rpass-analysis=kernel-resource-usage --save-temps")
126
+ endif()
127
+
128
  if (NOT GGML_CUDA_FA)
129
  add_compile_definitions(GGML_CUDA_NO_FA)
130
  endif()