Skip to content

Commit 3e32aa4

Browse files
committed
trailing whitespace removed
1 parent 0fbcf97 commit 3e32aa4

File tree

1 file changed

+4
-4
lines changed

1 file changed

+4
-4
lines changed

ggml/src/ggml-cuda/cpy.cu

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -12,13 +12,13 @@ static __global__ void cpy_contiguous(const T * cx, T * cdst_direct, const int n
1212
T ** cdst_indirect, int graph_cpynode_index) {
1313
const int64_t tid = blockDim.x * blockIdx.x + threadIdx.x;
1414
const int64_t stride = blockDim.x * gridDim.x;
15-
15+
1616
T * cdst = (cdst_indirect != nullptr) ? cdst_indirect[graph_cpynode_index] : cdst_direct;
17-
17+
1818
const int elements_per_thread = 4;
1919
for (int64_t base_idx = tid * elements_per_thread; base_idx < ne_elements; base_idx += stride * elements_per_thread) {
2020
const int64_t remaining = ne_elements - base_idx;
21-
21+
2222
if (remaining >= elements_per_thread) {
2323
if (base_idx % 4 == 0) {
2424
*((float4*)(cdst + base_idx)) = *((const float4*)(cx + base_idx));
@@ -178,7 +178,7 @@ static void ggml_cpy_contiguous_cuda(
178178
const int elements_per_thread = 4;
179179
const int threads_needed = (ne_elements + elements_per_thread - 1) / elements_per_thread;
180180
const int num_blocks = max(1, min(65535, (threads_needed + CUDA_CPY_BLOCK_SIZE - 1) / CUDA_CPY_BLOCK_SIZE));
181-
181+
182182
cpy_contiguous<T><<<num_blocks, CUDA_CPY_BLOCK_SIZE, 0, stream>>>
183183
(cx, cdst, ne_elements, cdst_indirect, graph_cpynode_index++);
184184
}

0 commit comments

Comments
 (0)