We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 3420909, commit 9a240e6 (Copy full SHA for 9a240e6)
ggml/src/ggml-impl.h
@@ -310,14 +310,14 @@ void ggml_aligned_free(void * ptr, size_t size);
310
// FP16 to FP32 conversion
311
312
#if defined(__ARM_NEON)
313
- #ifdef _MSC_VER
+ #if defined(_MSC_VER) || (defined(__CUDACC__) && __CUDACC_VER_MAJOR__ <= 11)
314
typedef uint16_t ggml_fp16_internal_t;
315
#else
316
typedef __fp16 ggml_fp16_internal_t;
317
#endif
318
319
320
-#if defined(__ARM_NEON) && !defined(_MSC_VER)
+#if defined(__ARM_NEON) && !defined(_MSC_VER) && !(defined(__CUDACC__) && __CUDACC_VER_MAJOR__ <= 11)
321
#define GGML_COMPUTE_FP16_TO_FP32(x) ggml_compute_fp16_to_fp32(x)
322
#define GGML_COMPUTE_FP32_TO_FP16(x) ggml_compute_fp32_to_fp16(x)
323
0 commit comments