ggml-org
diff --git a/‎ggml/src/ggml-webgpu/ggml-webgpu.cpp‎
Lines changed: 22 additions & 2 deletions b/‎ggml/src/ggml-webgpu/ggml-webgpu.cpp‎
Lines changed: 22 additions & 2 deletions
@@ -129,7 +129,7 @@ struct webgpu_context_struct {
     webgpu_buf_pool set_rows_error_buf_pool;
 
     wgpu::ComputePipeline memset_pipeline;
-    wgpu::ComputePipeline mul_mat_pipeline[17][2];
+    wgpu::ComputePipeline mul_mat_pipeline[24][2];
     wgpu::ComputePipeline set_rows_pipeline;
     wgpu::ComputePipeline cpy_pipeline;
 
@@ -915,7 +915,7 @@ static void ggml_webgpu_init_memset_pipeline(webgpu_context & webgpu_ctx) {
 }
 
 static void ggml_webgpu_init_mul_mat_pipeline(webgpu_context & webgpu_ctx) {
-    webgpu_pipeline_info pipeline_infos[14] = {
+    webgpu_pipeline_info pipeline_infos[18] = {
         { .name        = "mul_mat_f32_f32",
          .shader_code = wgsl_mul_mat_f32_f32,
          .src0_type   = GGML_TYPE_F32,
@@ -971,6 +971,22 @@ static void ggml_webgpu_init_mul_mat_pipeline(webgpu_context & webgpu_ctx) {
          { .name        = "mul_mat_iq2_xxs_f32",
            .shader_code = wgsl_mul_mat_iq2_xxs_f32,
            .src0_type   = GGML_TYPE_IQ2_XXS,
+           .src1_type   = GGML_TYPE_F32 },
+         { .name        = "mul_mat_iq2_xs_f32",
+           .shader_code = wgsl_mul_mat_iq2_xs_f32,
+           .src0_type   = GGML_TYPE_IQ2_XS,
+           .src1_type   = GGML_TYPE_F32 },
+         { .name        = "mul_mat_iq2_s_f32",
+           .shader_code = wgsl_mul_mat_iq2_s_f32,
+           .src0_type   = GGML_TYPE_IQ2_S,
+           .src1_type   = GGML_TYPE_F32 },
+         { .name        = "mul_mat_iq3_xxs_f32",
+           .shader_code = wgsl_mul_mat_iq3_xxs_f32,
+           .src0_type   = GGML_TYPE_IQ3_XXS,
+           .src1_type   = GGML_TYPE_F32 },
+         { .name        = "mul_mat_iq3_s_f32",
+           .shader_code = wgsl_mul_mat_iq3_s_f32,
+           .src0_type   = GGML_TYPE_IQ3_S,
            .src1_type   = GGML_TYPE_F32 }
     };
 
@@ -1074,6 +1090,10 @@ static bool ggml_backend_webgpu_device_supports_op(ggml_backend_dev_t dev, const
                         case GGML_TYPE_Q5_K:
                         case GGML_TYPE_Q6_K:
                         case GGML_TYPE_IQ2_XXS:
+                        case GGML_TYPE_IQ2_XS:
+                        case GGML_TYPE_IQ2_S:
+                        case GGML_TYPE_IQ3_XXS:
+                        case GGML_TYPE_IQ3_S:
                             return true;
                         default:
                             return false;