Skip to content

Commit c7c4d03

Browse files
committed
Fix merge
1 parent 6841888 commit c7c4d03

File tree

1 file changed

+7
-7
lines changed

1 file changed

+7
-7
lines changed

ggml/src/ggml-cpu/vec.h

Lines changed: 7 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -1425,19 +1425,19 @@ inline static void ggml_vec_geglu_erf_f32(const int n, float * y, const float *
1425 1425

1426 1426
inline static void ggml_vec_geglu_erf_f16(const int n, ggml_fp16_t * y, const ggml_fp16_t * x, const ggml_fp16_t * g) {
1427 1427
for (int i = 0; i < n; ++i) {
1428-
float xi = GGML_CPU_FP16_TO_FP32(x[i]);
1429-
float gi = GGML_CPU_FP16_TO_FP32(g[i]);
1430-
y[i] = GGML_CPU_FP32_TO_FP16(0.5f * xi * (1.0f + erff(xi*SQRT_2_INV)) * gi);
1428+
float xi = GGML_FP16_TO_FP32(x[i]);
1429+
float gi = GGML_FP16_TO_FP32(g[i]);
1430+
y[i] = GGML_FP32_TO_FP16(0.5f * xi * (1.0f + erff(xi*SQRT_2_INV)) * gi);
1431 1431
}
1432 1432
}
1433 1433

1434 1434
#ifdef GGML_GELU_QUICK_FP16
1435 1435
inline static void ggml_vec_geglu_quick_f32(const int n, float * y, const float * x, const float * g) {
1436 1436
uint16_t t;
1437 1437
for (int i = 0; i < n; ++i) {
1438-
ggml_fp16_t fp16 = GGML_CPU_FP32_TO_FP16(x[i]);
1438+
ggml_fp16_t fp16 = GGML_FP32_TO_FP16(x[i]);
1439 1439
memcpy(&t, &fp16, sizeof(uint16_t));
1440-
y[i] = GGML_CPU_FP16_TO_FP32(ggml_table_gelu_quick_f16[t]) * g[i];
1440+
y[i] = GGML_FP16_TO_FP32(ggml_table_gelu_quick_f16[t]) * g[i];
1441 1441
}
1442 1442
}
1443 1443
#else
@@ -1451,8 +1451,8 @@ inline static void ggml_vec_geglu_quick_f32(const int n, float * y, const float
1451 1451
inline static void ggml_vec_geglu_quick_f16(const int n, ggml_fp16_t * y, const ggml_fp16_t * x, const ggml_fp16_t * g) {
1452 1452
const uint16_t * i16 = (const uint16_t *) x;
1453 1453
for (int i = 0; i < n; ++i) {
1454-
float v = GGML_CPU_FP16_TO_FP32(g[i]);
1455-
y[i] = GGML_CPU_FP32_TO_FP16(GGML_CPU_FP16_TO_FP32(ggml_table_gelu_quick_f16[i16[i]]) * v);
1454+
float v = GGML_FP16_TO_FP32(g[i]);
1455+
y[i] = GGML_FP32_TO_FP16(GGML_FP16_TO_FP32(ggml_table_gelu_quick_f16[i16[i]]) * v);
1456 1456
}
1457 1457
}
1458 1458

0 commit comments

Comments
 (0)