@@ -1386,19 +1386,19 @@ inline static void ggml_vec_geglu_erf_f32(const int n, float * y, const float *
13861386
13871387inline static void ggml_vec_geglu_erf_f16 (const int n , ggml_fp16_t * y , const ggml_fp16_t * x , const ggml_fp16_t * g ) {
13881388 for (int i = 0 ; i < n ; ++ i ) {
1389- float xi = GGML_CPU_FP16_TO_FP32 (x [i ]);
1390- float gi = GGML_CPU_FP16_TO_FP32 (g [i ]);
1391- y [i ] = GGML_CPU_FP32_TO_FP16 (0.5f * xi * (1.0f + erff (xi * SQRT_2_INV )) * gi );
1389+ float xi = GGML_FP16_TO_FP32 (x [i ]);
1390+ float gi = GGML_FP16_TO_FP32 (g [i ]);
1391+ y [i ] = GGML_FP32_TO_FP16 (0.5f * xi * (1.0f + erff (xi * SQRT_2_INV )) * gi );
13921392 }
13931393}
13941394
13951395#ifdef GGML_GELU_QUICK_FP16
13961396inline static void ggml_vec_geglu_quick_f32 (const int n , float * y , const float * x , const float * g ) {
13971397 uint16_t t ;
13981398 for (int i = 0 ; i < n ; ++ i ) {
1399- ggml_fp16_t fp16 = GGML_CPU_FP32_TO_FP16 (x [i ]);
1399+ ggml_fp16_t fp16 = GGML_FP32_TO_FP16 (x [i ]);
14001400 memcpy (& t , & fp16 , sizeof (uint16_t ));
1401- y [i ] = GGML_CPU_FP16_TO_FP32 (ggml_table_gelu_quick_f16 [t ]) * g [i ];
1401+ y [i ] = GGML_FP16_TO_FP32 (ggml_table_gelu_quick_f16 [t ]) * g [i ];
14021402 }
14031403}
14041404#else
@@ -1412,8 +1412,8 @@ inline static void ggml_vec_geglu_quick_f32(const int n, float * y, const float
14121412inline static void ggml_vec_geglu_quick_f16 (const int n , ggml_fp16_t * y , const ggml_fp16_t * x , const ggml_fp16_t * g ) {
14131413 const uint16_t * i16 = (const uint16_t * ) x ;
14141414 for (int i = 0 ; i < n ; ++ i ) {
1415- float v = GGML_CPU_FP16_TO_FP32 (g [i ]);
1416- y [i ] = GGML_CPU_FP32_TO_FP16 ( GGML_CPU_FP16_TO_FP32 (ggml_table_gelu_quick_f16 [i16 [i ]]) * v );
1415+ float v = GGML_FP16_TO_FP32 (g [i ]);
1416+ y [i ] = GGML_FP32_TO_FP16 ( GGML_FP16_TO_FP32 (ggml_table_gelu_quick_f16 [i16 [i ]]) * v );
14171417 }
14181418}
14191419
0 commit comments