Skip to content

Commit b0e95db

Browse files
committed
fix rms norm.
1 parent 9d262f4 commit b0e95db

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

ggml/src/ggml-cann/aclnn_ops.cpp

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -885,9 +885,10 @@ void ggml_cann_rms_norm(ggml_backend_cann_context& ctx, ggml_tensor* dst) {
     size_t zero_tensor_n_bytes =
         src->ne[1] * src->ne[2] * src->ne[3] * ggml_element_size(src);
     ggml_cann_pool_alloc zero_tensor_allocator(ctx.pool(), zero_tensor_n_bytes);
+    int64_t rstd_ne[GGML_MAX_DIMS] = {src->ne[1] , src->ne[2] , src->ne[3] , 1};
     aclTensor* acl_rstd =
         aclnn_zero(ctx, zero_tensor_allocator.get(), zero_tensor_n_bytes,
-                   src->ne, GGML_MAX_DIMS, ggml_cann_type_mapping(src->type),
+                   rstd_ne, 3, ggml_cann_type_mapping(src->type),
                    ggml_element_size(src));
     GGML_CANN_CALL_ACLNN_OP(ctx, RmsNorm, acl_src, acl_gamma, eps, acl_dst, acl_rstd);
     ggml_cann_release_resources(ctx, acl_src, acl_dst, acl_gamma, acl_rstd);

0 commit comments

Comments
 (0)