Skip to content

Commit ebc7744

Browse files
committed
Up Fused RMS Norm
Update ggml-cuda.cu; Update ggml-alloc.c
1 parent e88f28b commit ebc7744

File tree

2 files changed

+3
-0
lines changed

2 files changed

+3
-0
lines changed

ggml/src/ggml-alloc.c

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -53,6 +53,7 @@ static bool ggml_op_can_inplace(enum ggml_op op) {
53 53
case GGML_OP_UNARY:
54 54
case GGML_OP_ROPE:
55 55
case GGML_OP_RMS_NORM:
56+
case GGML_OP_FUSED_RMS_NORM:
56 57
case GGML_OP_SOFT_MAX:
57 58
return true;
58 59

ggml/src/ggml-cuda/ggml-cuda.cu

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -3141,6 +3141,8 @@ static bool ggml_backend_cuda_device_supports_op(ggml_backend_dev_t dev, const g
3141 3141
return ggml_is_contiguous(op->src[0]) && op->ne[0] % WARP_SIZE == 0;
3142 3142
break;
3143 3143
case GGML_OP_FUSED_RMS_NORM:
3144+
return ggml_is_contiguous(op->src[0]) && op->ne[0] % WARP_SIZE == 0;
3145+
break;
3144 3146
case GGML_OP_NONE:
3145 3147
case GGML_OP_RESHAPE:
3146 3148
case GGML_OP_VIEW:

0 commit comments

Comments
 (0)