@@ -299,7 +299,6 @@ struct vk_device_struct {
299299    vk_pipeline pipeline_cpy_f32_f32, pipeline_cpy_f32_f16, pipeline_cpy_f16_f16;
300300    vk_pipeline pipeline_contig_cpy_f32_f32, pipeline_contig_cpy_f32_f16, pipeline_contig_cpy_f16_f16;
301301    vk_pipeline pipeline_cpy_f32_quant[GGML_TYPE_COUNT];
302-     vk_pipeline pipeline_cpy_f32_quant_rte[GGML_TYPE_COUNT];
303302    vk_pipeline pipeline_cpy_quant_f32[GGML_TYPE_COUNT];
304303    vk_pipeline pipeline_norm_f32;
305304    vk_pipeline pipeline_group_norm_f32;
@@ -2283,12 +2282,12 @@ static void ggml_vk_load_shaders(vk_device& device) {
22832282    ggml_vk_create_pipeline (device, device->pipeline_contig_cpy_f32_f16 , " contig_cpy_f32_f16" " main" 2 , sizeof (vk_op_unary_push_constants), {512 , 1 , 1 }, {}, 1 );
22842283    ggml_vk_create_pipeline (device, device->pipeline_contig_cpy_f16_f16 , " contig_cpy_f16_f16" " main" 2 , sizeof (vk_op_unary_push_constants), {512 , 1 , 1 }, {}, 1 );
22852284    if  (device->float_controls_rte_fp16 ) {
2286-         ggml_vk_create_pipeline (device, device->pipeline_cpy_f32_quant_rte [GGML_TYPE_Q4_0], " cpy_f32_q4_0" " main" 2 , sizeof (vk_op_unary_push_constants), {(uint32_t )ggml_blck_size (GGML_TYPE_Q4_0), 1 , 1 }, {}, 1 );
2287-         ggml_vk_create_pipeline (device, device->pipeline_cpy_f32_quant_rte [GGML_TYPE_Q4_1], " cpy_f32_q4_1" " main" 2 , sizeof (vk_op_unary_push_constants), {(uint32_t )ggml_blck_size (GGML_TYPE_Q4_1), 1 , 1 }, {}, 1 );
2288-         ggml_vk_create_pipeline (device, device->pipeline_cpy_f32_quant_rte [GGML_TYPE_Q5_0], " cpy_f32_q5_0" " main" 2 , sizeof (vk_op_unary_push_constants), {(uint32_t )ggml_blck_size (GGML_TYPE_Q5_0), 1 , 1 }, {}, 1 );
2289-         ggml_vk_create_pipeline (device, device->pipeline_cpy_f32_quant_rte [GGML_TYPE_Q5_1], " cpy_f32_q5_1" " main" 2 , sizeof (vk_op_unary_push_constants), {(uint32_t )ggml_blck_size (GGML_TYPE_Q5_1), 1 , 1 }, {}, 1 );
2290-         ggml_vk_create_pipeline (device, device->pipeline_cpy_f32_quant_rte [GGML_TYPE_Q8_0], " cpy_f32_q8_0" " main" 2 , sizeof (vk_op_unary_push_constants), {(uint32_t )ggml_blck_size (GGML_TYPE_Q8_0), 1 , 1 }, {}, 1 );
2291-         ggml_vk_create_pipeline (device, device->pipeline_cpy_f32_quant_rte [GGML_TYPE_IQ4_NL], " cpy_f32_iq4_nl" " main" 2 , sizeof (vk_op_unary_push_constants), {(uint32_t )ggml_blck_size (GGML_TYPE_IQ4_NL), 1 , 1 }, {}, 1 );
2285+         ggml_vk_create_pipeline (device, device->pipeline_cpy_f32_quant [GGML_TYPE_Q4_0], " cpy_f32_q4_0" " main" 2 , sizeof (vk_op_unary_push_constants), {(uint32_t )ggml_blck_size (GGML_TYPE_Q4_0), 1 , 1 }, {}, 1 );
2286+         ggml_vk_create_pipeline (device, device->pipeline_cpy_f32_quant [GGML_TYPE_Q4_1], " cpy_f32_q4_1" " main" 2 , sizeof (vk_op_unary_push_constants), {(uint32_t )ggml_blck_size (GGML_TYPE_Q4_1), 1 , 1 }, {}, 1 );
2287+         ggml_vk_create_pipeline (device, device->pipeline_cpy_f32_quant [GGML_TYPE_Q5_0], " cpy_f32_q5_0" " main" 2 , sizeof (vk_op_unary_push_constants), {(uint32_t )ggml_blck_size (GGML_TYPE_Q5_0), 1 , 1 }, {}, 1 );
2288+         ggml_vk_create_pipeline (device, device->pipeline_cpy_f32_quant [GGML_TYPE_Q5_1], " cpy_f32_q5_1" " main" 2 , sizeof (vk_op_unary_push_constants), {(uint32_t )ggml_blck_size (GGML_TYPE_Q5_1), 1 , 1 }, {}, 1 );
2289+         ggml_vk_create_pipeline (device, device->pipeline_cpy_f32_quant [GGML_TYPE_Q8_0], " cpy_f32_q8_0" " main" 2 , sizeof (vk_op_unary_push_constants), {(uint32_t )ggml_blck_size (GGML_TYPE_Q8_0), 1 , 1 }, {}, 1 );
2290+         ggml_vk_create_pipeline (device, device->pipeline_cpy_f32_quant [GGML_TYPE_IQ4_NL], " cpy_f32_iq4_nl" " main" 2 , sizeof (vk_op_unary_push_constants), {(uint32_t )ggml_blck_size (GGML_TYPE_IQ4_NL), 1 , 1 }, {}, 1 );
22922291    } else  {
22932292        ggml_vk_create_pipeline (device, device->pipeline_cpy_f32_quant [GGML_TYPE_Q4_0], " cpy_f32_q4_0" " main" 2 , sizeof (vk_op_unary_push_constants), {(uint32_t )ggml_blck_size (GGML_TYPE_Q4_0), 1 , 1 }, {}, 1 );
22942293        ggml_vk_create_pipeline (device, device->pipeline_cpy_f32_quant [GGML_TYPE_Q4_1], " cpy_f32_q4_1" " main" 2 , sizeof (vk_op_unary_push_constants), {(uint32_t )ggml_blck_size (GGML_TYPE_Q4_1), 1 , 1 }, {}, 1 );
@@ -4150,7 +4149,7 @@ static vk_pipeline ggml_vk_get_cpy_pipeline(ggml_backend_vk_context * ctx, const
41504149            case  GGML_TYPE_Q5_1:
41514150            case  GGML_TYPE_Q8_0:
41524151            case  GGML_TYPE_IQ4_NL:
4153-                 return  ctx->device ->pipeline_cpy_f32_quant_rte [to];
4152+                 return  ctx->device ->pipeline_cpy_f32_quant [to];
41544153            default :
41554154                break ;
41564155            }
0 commit comments