@@ -1425,19 +1425,19 @@ inline static void ggml_vec_geglu_erf_f32(const int n, float * y, const float *
14251425
14261426inline static void ggml_vec_geglu_erf_f16 (const int n , ggml_fp16_t * y , const ggml_fp16_t * x , const ggml_fp16_t * g ) {
14271427 for (int i = 0 ; i < n ; ++ i ) {
1428- float xi = GGML_CPU_FP16_TO_FP32 (x [i ]);
1429- float gi = GGML_CPU_FP16_TO_FP32 (g [i ]);
1430- y [i ] = GGML_CPU_FP32_TO_FP16 (0.5f * xi * (1.0f + erff (xi * SQRT_2_INV )) * gi );
1428+ float xi = GGML_FP16_TO_FP32 (x [i ]);
1429+ float gi = GGML_FP16_TO_FP32 (g [i ]);
1430+ y [i ] = GGML_FP32_TO_FP16 (0.5f * xi * (1.0f + erff (xi * SQRT_2_INV )) * gi );
14311431 }
14321432}
14331433
14341434#ifdef GGML_GELU_QUICK_FP16
14351435inline static void ggml_vec_geglu_quick_f32 (const int n , float * y , const float * x , const float * g ) {
14361436 uint16_t t ;
14371437 for (int i = 0 ; i < n ; ++ i ) {
1438- ggml_fp16_t fp16 = GGML_CPU_FP32_TO_FP16 (x [i ]);
1438+ ggml_fp16_t fp16 = GGML_FP32_TO_FP16 (x [i ]);
14391439 memcpy (& t , & fp16 , sizeof (uint16_t ));
1440- y [i ] = GGML_CPU_FP16_TO_FP32 (ggml_table_gelu_quick_f16 [t ]) * g [i ];
1440+ y [i ] = GGML_FP16_TO_FP32 (ggml_table_gelu_quick_f16 [t ]) * g [i ];
14411441 }
14421442}
14431443#else
@@ -1451,8 +1451,8 @@ inline static void ggml_vec_geglu_quick_f32(const int n, float * y, const float
14511451inline static void ggml_vec_geglu_quick_f16 (const int n , ggml_fp16_t * y , const ggml_fp16_t * x , const ggml_fp16_t * g ) {
14521452 const uint16_t * i16 = (const uint16_t * ) x ;
14531453 for (int i = 0 ; i < n ; ++ i ) {
1454- float v = GGML_CPU_FP16_TO_FP32 (g [i ]);
1455- y [i ] = GGML_CPU_FP32_TO_FP16 ( GGML_CPU_FP16_TO_FP32 (ggml_table_gelu_quick_f16 [i16 [i ]]) * v );
1454+ float v = GGML_FP16_TO_FP32 (g [i ]);
1455+ y [i ] = GGML_FP32_TO_FP16 ( GGML_FP16_TO_FP32 (ggml_table_gelu_quick_f16 [i16 [i ]]) * v );
14561456 }
14571457}
14581458
0 commit comments