Skip to content

Commit 6086d52

Browse files
committed
Revert "Disable CUDA fusion by default for now (ikawrakow#903)"
This reverts commit 320fc60.
1 parent 46f1c50 commit 6086d52

File tree

1 file changed: 1 addition (+1) and 1 deletion (-1).

ggml/CMakeLists.txt

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -133,7 +133,7 @@ option(GGML_CUDA_NO_PEER_COPY "ggml: do not use peer to peer copie
133 133   option(GGML_CUDA_NO_VMM "ggml: do not try to use CUDA VMM" OFF)
134 134   option(GGML_CUDA_FA_ALL_QUANTS "ggml: compile all quants for FlashAttention" OFF)
135 135   option(GGML_CUDA_USE_GRAPHS "ggml: use CUDA graphs (llama.cpp only)" ON)
136     - set (GGML_CUDA_FUSION "0" CACHE STRING "ggml: enable/disable fusion")
    136 + set (GGML_CUDA_FUSION "1" CACHE STRING "ggml: enable/disable fusion")
137 137
138 138   option(GGML_IQK_FLASH_ATTENTION "ggml: enable the IQK FlashAttention CPU kernels" ON)
139 139   option(GGML_IQK_FA_ALL_QUANTS "ggml: compile all quants for IQK FlashAttention" OFF)

0 commit comments

Comments
 (0)