Skip to content

Commit c66ccb3

Browse files
Update ggml/src/ggml-cuda/cpy.cu
Co-authored-by: Johannes Gäßler <[email protected]>
1 parent 1482871 commit c66ccb3

File tree

1 file changed

+3
-4
lines changed

1 file changed

+3
-4
lines changed

ggml/src/ggml-cuda/cpy.cu

Lines changed: 3 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -603,12 +603,11 @@ void ggml_cuda_cpy(ggml_backend_cuda_context & ctx, const ggml_tensor * src0, gg
603 603   #ifdef GGML_USE_MUSA
604 604   if (src0->type == GGML_TYPE_F32 || src0->type == GGML_TYPE_F16) {
605 605   CUDA_CHECK(mudnnMemcpyAsync(ctx, src1, src0));
606     - } else {
    606 + } else
    607 + #endif // GGML_USE_MUSA
    608 + {
607 609   CUDA_CHECK(cudaMemcpyAsync(src1_ddc, src0_ddc, ggml_nbytes(src0), cudaMemcpyDeviceToDevice, main_stream));
608 610   }
609     - #else // GGML_USE_MUSA
610     - CUDA_CHECK(cudaMemcpyAsync(src1_ddc, src0_ddc, ggml_nbytes(src0), cudaMemcpyDeviceToDevice, main_stream));
611     - #endif // GGML_USE_MUSA
612 611   } else if (src0->type == GGML_TYPE_F32 && src1->type == GGML_TYPE_F32) {
613 612   ggml_cpy_f32_f32_cuda (src0_ddc, src1_ddc, ne, ne00, ne01, ne02, nb00, nb01, nb02, nb03, ne10, ne11, ne12, nb10, nb11, nb12, nb13, main_stream, dest_ptrs_d, graph_cpynode_index);
614 613   } else if (src0->type == GGML_TYPE_F32 && src1->type == GGML_TYPE_BF16) {

0 commit comments

Comments (0)