We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 92c0fad commit 4aa0153 — Copy full SHA for 4aa0153
.github/workflows/_build.yml
@@ -172,12 +172,12 @@ jobs:
172
173
export MAX_JOBS=$([ "$MATRIX_CUDA_VERSION" == "129" ] && echo 1 || echo 2)
174
export NVCC_THREADS=2
175
- export FLASH_DMATTN_FORCE_BUILD="TRUE"
176
- export FLASH_DMATTN_FORCE_CXX11_ABI=${{ inputs.cxx11_abi }}
+ export FLASH_SPARSE_ATTENTION_FORCE_BUILD="TRUE"
+ export FLASH_SPARSE_ATTENTION_FORCE_CXX11_ABI=${{ inputs.cxx11_abi }}
177
178
# If specified, limit to a single compute capability to speed up build
179
if [ -n "${MATRIX_ARCH}" ]; then
180
- export FLASH_DMATTN_CUDA_ARCHS="${MATRIX_ARCH}"
+ export FLASH_SPARSE_ATTENTION_CUDA_ARCHS="${MATRIX_ARCH}"
181
fi
182
183
# GH allows max 6h
0 commit comments