We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 6bd7a3d, commit bd5017e (Copy full SHA for bd5017e)
ggml/src/ggml-cpu/llamafile/sgemm.cpp
@@ -63,6 +63,7 @@
63
#define NOINLINE __attribute__((__noinline__))
64
#endif
65
66
+#if defined(__ARM_NEON) || defined(__AVX512F__) || defined(__VXE__) || defined(__VXE2__)
67
#if defined(__ARM_NEON) || defined(__AVX512F__) || defined(__VXE__) || defined(__VXE2__)
68
#define VECTOR_REGISTERS 32
69
#else
@@ -253,7 +254,7 @@ template <> inline float32x4_t load(const ggml_fp16_t * p) {
253
254
float tmp[4];
255
256
for (int i = 0; i < 4; i++) {
- tmp[i] = GGML_CPU_FP16_TO_FP32(p[i]);
257
+ tmp[i] = GGML_FP16_TO_FP32(p[i]);
258
}
259
260
return vec_xl(0, (const float *)(tmp));
0 commit comments