We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents 0fa2a81 + 25ff6f7 commit 20208e9 Copy full SHA for 20208e9
ggml/src/ggml-cuda/common.cuh
@@ -312,11 +312,11 @@ static bool turing_mma_available(const int cc) {
312
}
313
314
static bool ampere_mma_available(const int cc) {
315
- return cc < GGML_CUDA_CC_OFFSET_AMD && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
+ return GGML_CUDA_CC_IS_NVIDIA(cc) && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
316
317
318
static bool cp_async_available(const int cc) {
319
320
321
322
static constexpr __device__ int ggml_cuda_get_physical_warp_size() {
0 commit comments