Skip to content

Commit 2e1c881

Browse files
committed
resolves @Green-Sky suggestions
1 parent e1ab1f0 commit 2e1c881

File tree

1 file changed

+2
-3
lines changed

1 file changed

+2
-3
lines changed

ggml/src/ggml-cuda/conv2d-tensor-core.cu

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -103,9 +103,8 @@ template <typename layout,
103 103   const uint32_t NUM_WARPS_NOHOW,
104 104   const uint32_t NUM_WARPS,
105 105   const uint32_t WG_SIZE>
106     - __global__ void __launch_bounds__(NUM_WARPS * WARP_SIZE) conv2d_tensor_cores_kernel(const float * __restrict__ IN,
107     - const half * __restrict__ IK,
108     - float * __restrict__ Out) {
    106 + __global__ void __launch_bounds__(NUM_WARPS * WARP_SIZE)
    107 + conv2d_tensor_cores_kernel(const float * __restrict__ IN, const half * __restrict__ IK, float * __restrict__ Out) {
109 108   const uint32_t warpId = threadIdx.y;
110 109   const uint32_t block_tid = threadIdx.y * blockDim.x + threadIdx.x;
111 110

0 commit comments

Comments
 (0)