Skip to content

Commit bd5017e

Browse files
taronaeo authored and Minh141120 committed
llamafile : support s390x SIMD instruction set (ggml-org#14273)
1 parent 6bd7a3d commit bd5017e

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

ggml/src/ggml-cpu/llamafile/sgemm.cpp

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -63,6 +63,7 @@
6363
#define NOINLINE __attribute__((__noinline__))
6464
#endif
6565

66+
#if defined(__ARM_NEON) || defined(__AVX512F__) || defined(__VXE__) || defined(__VXE2__)
6667
#if defined(__ARM_NEON) || defined(__AVX512F__) || defined(__VXE__) || defined(__VXE2__)
6768
#define VECTOR_REGISTERS 32
6869
#else
@@ -253,7 +254,7 @@ template <> inline float32x4_t load(const ggml_fp16_t * p) {
253254
float tmp[4];
254255

255256
for (int i = 0; i < 4; i++) {
256-
tmp[i] = GGML_CPU_FP16_TO_FP32(p[i]);
257+
tmp[i] = GGML_FP16_TO_FP32(p[i]);
257258
}
258259

259260
return vec_xl(0, (const float *)(tmp));

0 commit comments

Comments (0)