1 file changed: +3 -3 lines changed
Original file line number | Diff line number | Diff line change
@@ -199,9 +199,9 @@ typedef float2 dfloat2;
199199#define FP16_AVAILABLE
200200#endif // (defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__)) || __CUDA_ARCH__ >= GGML_CUDA_CC_PASCAL
201201
202- #if defined(FP16_AVAILABLE) && __CUDA_ARCH__ != GGML_CUDA_CC_DP4A
202+ #if defined(FP16_AVAILABLE) && __CUDA_ARCH__ != 610
203203#define FAST_FP16_AVAILABLE
204- #endif // defined(FP16_AVAILABLE) && __CUDA_ARCH__ != GGML_CUDA_CC_DP4A
204+ #endif // defined(FP16_AVAILABLE) && __CUDA_ARCH__ != 610
205205
206206#if !(defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__)) && __CUDA_ARCH__ >= GGML_CUDA_CC_VOLTA
207207#define FP16_MMA_AVAILABLE
@@ -232,7 +232,7 @@ static bool fp16_available(const int cc) {
232232}
233233
234234static bool fast_fp16_available (const int cc) {
235- return (GGML_CUDA_CC_IS_NVIDIA (cc) && fp16_available (cc) && cc != GGML_CUDA_CC_DP4A ) || GGML_CUDA_CC_IS_AMD (cc);
235+ return (GGML_CUDA_CC_IS_NVIDIA (cc) && fp16_available (cc) && cc != 610 ) || GGML_CUDA_CC_IS_AMD (cc);
236236}
237237
238238// To be used for feature selection of external libraries, e.g. cuBLAS.
You can’t perform that action at this time.
0 commit comments