Skip to content

Commit 28dd5c5

Browse files
committed
Fix A800 not supporting the 'movmatrix' instruction
1 parent d7b31a9 commit 28dd5c5

File tree

2 files changed

+2
-1
lines changed

2 files changed

+2
-1
lines changed

ggml/src/ggml-cuda/common.cuh

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -47,6 +47,7 @@
4747
#define GGML_CUDA_CC_TURING 750
4848
#define GGML_CUDA_CC_AMPERE 800
4949
#define GGML_CUDA_CC_OFFSET_AMD 0x1000000
50+
#define GGML_CUDA_CC_HOPPER 900
5051

5152
// GCN/CDNA, wave size is 64
5253
#define GGML_CUDA_CC_GCN4 (GGML_CUDA_CC_OFFSET_AMD + 0x803) // Tonga, Fiji, Polaris, minimum for fast fp16

ggml/src/ggml-cuda/mma.cuh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -16,7 +16,7 @@
1616
#include "common.cuh"
1717

1818

19-
#if CUDART_VERSION >= 11080
19+
#if (CUDART_VERSION >= 11080) && (__CUDA_ARCH__ >= GGML_CUDA_CC_HOPPER)
2020

2121
static __device__ __forceinline__ int ggml_cuda_movmatrix(const int x) {
2222
int ret = 0;

0 commit comments

Comments
 (0)