We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent e22e345, commit 2d24a9c (copy full SHA for 2d24a9c)
ggml/src/ggml-cuda/mmv.cu
@@ -19,9 +19,9 @@ static __global__ void mul_mat_vec(
19
20
constexpr int warp_size = ggml_cuda_get_physical_warp_size();
21
22
- x += sample_x *stride_sample_x + channel_x *stride_channel_x + row*stride_row;
23
- y += sample_y *stride_sample_y + channel_y *stride_channel_y;
24
- dst += sample_dst*stride_sample_dst + channel_dst*stride_channel_dst;
+ x += int64_t(sample_x) *stride_sample_x + channel_x *stride_channel_x + row*stride_row;
+ y += int64_t(sample_y) *stride_sample_y + channel_y *stride_channel_y;
+ dst += int64_t(sample_dst)*stride_sample_dst + channel_dst*stride_channel_dst;
25
26
const float2 * y2 = (const float2 *) y;
27
0 commit comments