Skip to content

Commit 831021b

Browse files
Merge pull request #384 from InfiniTensor/issue/6/fix
issue/6/fix type conversion
2 parents 81a5f62 + 1529608 commit 831021b

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

src/infiniop/ops/rms_norm/cuda/kernel.cuh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,7 @@ __device__ void rmsnormBlock(
22 22   // Thread_0 computes RMS=1/sqrt(ss/dim+epsilon) and stores in shared memory
23 23   __shared__ Tcompute rms;
24 24   if (threadIdx.x == 0) {
25    - rms = Tdata(rsqrtf(ss / Tcompute(dim) + epsilon));
   25 + rms = Tcompute(rsqrtf(ss / Tcompute(dim) + epsilon));
26 26   }
27 27   __syncthreads();
28 28

0 commit comments

Comments
 (0)