Skip to content

Commit 8bf8519

Browse files
committed
Add a supports_op test for GGML_OP_FUSED_RMS_NORM
Similar to llama.cpp (LCPP) ggml-org#10111
1 parent e8dc308 commit 8bf8519

File tree

1 file changed

+2
-0
lines changed

1 file changed

+2
-0
lines changed

ggml/src/ggml-cuda.cu

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -3133,6 +3133,8 @@ static bool ggml_backend_cuda_device_supports_op(ggml_backend_dev_t dev, const g
31333133
case GGML_OP_MUL:
31343134
case GGML_OP_DIV:
31353135
case GGML_OP_FUSED_RMS_NORM:
3136+
return ggml_is_contiguous(op->src[0]) && op->ne[0] % WARP_SIZE == 0;
3137+
break;
31363138
case GGML_OP_SCALE:
31373139
case GGML_OP_SQR:
31383140
case GGML_OP_SQRT:

0 commit comments

Comments
 (0)