ggml-org
diff --git a/ggml/src/ggml-cpu/ggml-cpu.c b/ggml/src/ggml-cpu/ggml-cpu.c
Lines changed: 1 addition & 1 deletion
diff --git a/ggml/src/ggml-cpu/unary-ops.cpp b/ggml/src/ggml-cpu/unary-ops.cpp
Lines changed: 0 additions & 3 deletions
diff --git a/ggml/src/ggml-cuda/ggml-cuda.cu b/ggml/src/ggml-cuda/ggml-cuda.cu
Lines changed: 3 additions & 0 deletions
@@ -2144,6 +2144,7 @@ static int ggml_get_n_tasks(struct ggml_tensor * node, int n_threads) {
         case GGML_OP_ADD_ID:
         case GGML_OP_ADD1:
         case GGML_OP_ACC:
+        case GGML_OP_XIELU:
             {
                 n_tasks = n_threads;
             } break;
@@ -2167,7 +2168,6 @@ static int ggml_get_n_tasks(struct ggml_tensor * node, int n_threads) {
         case GGML_OP_REPEAT:
         case GGML_OP_REPEAT_BACK:
         case GGML_OP_LEAKY_RELU:
-        case GGML_OP_XIELU:
             {
                 n_tasks = 1;
             } break;
 
@@ -207,9 +207,6 @@ void ggml_compute_forward_xielu(const ggml_compute_params * params, ggml_tensor
     const float beta = op_params[2];
     const float eps = op_params[3];
 
-//    alpha_p = softplus(alpha_p);
-//    alpha_n = beta + softplus(alpha_n);
-
     const auto xielu_op_params = [alpha_n, alpha_p, beta, eps](float f) {
         return op_xielu(f, alpha_n, alpha_p, beta, eps);
     };
 
@@ -2517,6 +2517,9 @@ static bool ggml_cuda_compute_forward(ggml_backend_cuda_context & ctx, struct gg
         case GGML_OP_OPT_STEP_SGD:
             ggml_cuda_opt_step_sgd(ctx, dst);
             break;
+        case GGML_OP_XIELU:
+            ggml_cuda_op_xielu(ctx, dst);
+            break;
         default:
             return false;
     }