Skip to content

Commit b9f430f

Browse files
authored
Fix mistake in grid initialization for the 2D mat transpose. (#275)
1 parent da41328 commit b9f430f

File tree

1 file changed: +1 −1 lines changed

kernels/mat-transpose/mat_transpose.cu

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -310,7 +310,7 @@ __global__ void mat_transpose_f32x4_shared_bcf_row2col2d_kernel(
310 | 310 |   const int N = x.size(1); \
311 | 311 |   dim3 block(WARP_SIZE_S, WARP_SIZE_S); \
312 | 312 |   dim3 grid((N + WARP_SIZE_S - 1) / (WARP_SIZE_S * n_element_col), \
313 |     | - (M + WARP_SIZE_S - 1) / (WARP_SIZE_S / n_element_row)); \
    | 313 | + (M + WARP_SIZE_S - 1) / (WARP_SIZE_S * n_element_row)); \
314 | 314 |   mat_transpose_##tag##2d_kernel <<<grid, block>>>( \
315 | 315 |   reinterpret_cast<element_type *>(x.data_ptr()), \
316 | 316 |   reinterpret_cast<element_type *>(y.data_ptr()), M, N); \

0 commit comments

Comments
 (0)