Skip to content

Commit d7580f2

Browse files
committed
CUDA: compress mode size
CUDA 12.8 added the option to specify stronger compression for binaries.
1 parent 36c258e commit d7580f2

File tree

1 file changed

+9
-0
lines changed

1 file changed

+9
-0
lines changed

ggml/src/ggml-cuda/CMakeLists.txt

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -98,6 +98,15 @@ if (CUDAToolkit_FOUND)
9898

9999
# Initialize the CUDA flag list with -use_fast_math; later statements append to it.
set(CUDA_FLAGS -use_fast_math)
100100

101+
if (CUDAToolkit_VERSION VERSION_GREATER_EQUAL "12.8")
102+
# CUDA 12.8 added the -compress-mode option for stronger compression of binaries. Options are:
103+
# - none (not recommended)
104+
# - speed (default)
105+
# - balance
106+
# - size (the mode selected below)
107+
list(APPEND CUDA_FLAGS -compress-mode=size)
108+
endif()
109+
101110
# When GGML_FATAL_WARNINGS is enabled, append "-Werror all-warnings" to the CUDA flags.
if (GGML_FATAL_WARNINGS)
102111
list(APPEND CUDA_FLAGS -Werror all-warnings)
103112
endif()

0 commit comments

Comments
 (0)