Skip to content

Commit 274bff3

Browse files
committed
Address review comments
Signed-off-by: Xiaodong Ye <[email protected]>
1 parent f7ef983 commit 274bff3

File tree

1 file changed

+3
-3
lines changed

1 file changed

+3
-3
lines changed

ggml/src/ggml-cuda/common.cuh

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -199,9 +199,9 @@ typedef float2 dfloat2;
 #define FP16_AVAILABLE
 #endif // (defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__)) || __CUDA_ARCH__ >= GGML_CUDA_CC_PASCAL
 
-#if defined(FP16_AVAILABLE) && __CUDA_ARCH__ != GGML_CUDA_CC_DP4A
+#if defined(FP16_AVAILABLE) && __CUDA_ARCH__ != 610
 #define FAST_FP16_AVAILABLE
-#endif // defined(FP16_AVAILABLE) && __CUDA_ARCH__ != GGML_CUDA_CC_DP4A
+#endif // defined(FP16_AVAILABLE) && __CUDA_ARCH__ != 610
 
 #if !(defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__)) && __CUDA_ARCH__ >= GGML_CUDA_CC_VOLTA
 #define FP16_MMA_AVAILABLE
@@ -232,7 +232,7 @@ static bool fp16_available(const int cc) {
 }
 
 static bool fast_fp16_available(const int cc) {
-    return (GGML_CUDA_CC_IS_NVIDIA(cc) && fp16_available(cc) && cc != GGML_CUDA_CC_DP4A) || GGML_CUDA_CC_IS_AMD(cc);
+    return (GGML_CUDA_CC_IS_NVIDIA(cc) && fp16_available(cc) && cc != 610) || GGML_CUDA_CC_IS_AMD(cc);
 }
 
 // To be used for feature selection of external libraries, e.g. cuBLAS.

0 commit comments

Comments
 (0)