@@ -1244,7 +1244,7 @@ static __global__ void dequantize_mul_mat_vec(const void * vx, const dfloat * y,
12441244}
12451245
12461246static __global__ void mul_mat_p021_f16_f32 (const void * vx, const float * y, float * dst, const int ncols_x, const int nrows_x, const int nchannels_x) {
1247- const half * x = (half *) vx;
1247+ const half * x = (const half *) vx;
12481248
12491249 const int row_x = blockDim .y *blockIdx .y + threadIdx .y ;
12501250 const int channel = blockDim .z *blockIdx .z + threadIdx .z ;
@@ -1294,7 +1294,7 @@ static __global__ void mul_mat_vec_nc_f16_f32( // nc == non-contiguous
12941294 const void * vx, const float * y, float * dst, const int ncols_x, const int nrows_x,
12951295 const int row_stride_x, const int nchannels_x, const int channel_stride_x) {
12961296
1297- const half * x = (half *) vx;
1297+ const half * x = (const half *) vx;
12981298
12991299 const int row_x = blockDim .y *blockIdx .y + threadIdx .y ;
13001300 const int channel = blockDim .z *blockIdx .z + threadIdx .z ;
@@ -1337,14 +1337,14 @@ static __global__ void mul_mat_vec_nc_f16_f32( // nc == non-contiguous
13371337}
13381338
// Copies one float element from cxi to cdsti.
//
// Both arguments arrive as byte pointers and are reinterpreted as float
// pointers before the copy.
//   cxi   - source bytes; read only, never written through.
//   cdsti - destination bytes; receives the copied float.
// NOTE(review): assumes both pointers are suitably aligned for float and
// refer to at least sizeof(float) valid bytes - confirm against callers.
static __device__ void cpy_1_f32_f32(const char * cxi, char * cdsti) {
    // Keep the const qualifier in the cast: the source is only read, and
    // casting to plain (float *) would silently discard constness.
    const float * xi   = (const float *) cxi;
    float       * dsti = (float *) cdsti;

    *dsti = *xi;
}
13451345
13461346static __device__ void cpy_1_f32_f16 (const char * cxi, char * cdsti) {
1347- const float * xi = (float *) cxi;
1347+ const float * xi = (const float *) cxi;
13481348 half * dsti = (half *) cdsti;
13491349
13501350 *dsti = __float2half (*xi);
0 commit comments