
Commit 06ffc8c

ssjia committed
Update on "[ET-VK] Implement linear_dq8ta_q4gsw"

Title says it all! This builds upon the quantized linear support introduced in the previous diffs to enable dynamically quantized linear. Also included in this diff is a cleanup of the glslh files shared across the quantized linear implementations.

Differential Revision: [D81931060](https://our.internmc.facebook.com/intern/diff/D81931060/)

[ghstack-poisoned]
1 parent 994ca6d commit 06ffc8c
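The op name suggests the following semantics (my reading of the name, not something the diff spells out): activations are dynamically quantized to 8 bits per token ("dq8ta"), and weights are 4-bit group-symmetric ("q4gsw"). Below is a minimal NumPy reference sketch under that assumption. `linear_dq8ta_q4gsw_ref` and its signature are hypothetical illustrations, not the Vulkan implementation; `choose_qparams_per_row` merely mirrors the prototype name added in the CMakeLists diff further down.

```python
import numpy as np

def choose_qparams_per_row(x, qmin=-128, qmax=127):
    """Compute one (scale, zero_point) pair per row of x for 8-bit
    asymmetric quantization. 'Per row' corresponds to per-token when
    rows are tokens. Hypothetical helper, named after the prototype
    added in the CMake diff."""
    x_min = np.minimum(x.min(axis=1), 0.0)
    x_max = np.maximum(x.max(axis=1), 0.0)
    scale = (x_max - x_min) / (qmax - qmin)
    scale = np.where(scale == 0.0, 1.0, scale)  # avoid divide-by-zero
    zero_point = np.round(qmin - x_min / scale).astype(np.int32)
    return scale, zero_point

def linear_dq8ta_q4gsw_ref(x, w_q4, w_scales, group_size):
    """Reference sketch: dynamically quantize activations to int8 per
    token, then matmul against 4-bit group-symmetric weights (kept here
    as integer values in [-8, 7]), dequantizing group by group."""
    scale, zp = choose_qparams_per_row(x)
    x_q = np.clip(np.round(x / scale[:, None]) + zp[:, None], -128, 127)
    x_dq = (x_q - zp[:, None]) * scale[:, None]  # dequantized activations
    # Dequantize weights one group at a time along the input dimension;
    # each group of columns shares one per-output-channel scale.
    K = w_q4.shape[1]
    w_dq = np.empty_like(w_q4, dtype=np.float64)
    for g in range(K // group_size):
        cols = slice(g * group_size, (g + 1) * group_size)
        w_dq[:, cols] = w_q4[:, cols] * w_scales[:, g][:, None]
    return x_dq @ w_dq.T
```

The per-token ("dynamic") part is what distinguishes this from the statically quantized linear ops in the earlier diffs: the activation scales are computed at runtime from each row, rather than calibrated ahead of time.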

File tree

4 files changed (+2, −803 lines)


backends/vulkan/patterns/quantized_linear.py

Lines changed: 0 additions & 2 deletions
@@ -116,7 +116,6 @@ def __init__(self, mm_node: torch.fx.Node) -> None:
 
         # If input is not quantized, then we are done
         if self.quantize_input_node is None:
-            raise Exception("Input is not quantized")
             self.match_found = True
             return
 

@@ -478,7 +477,6 @@ def replace_quantized_linear_patterns(
             and match.is_weight_pergroup_quantized()
             and utils.is_in_4bit_range(weight_tensor)
         ):
-            raise Exception("Unsupported pattern")
             make_linear_q4gsw_op(
                 ep, graph_module, match, weight_tensor, weight_scales_tensor
             )

backends/vulkan/test/custom_ops/CMakeLists.txt

Lines changed: 2 additions & 2 deletions
@@ -92,7 +92,7 @@ if(TARGET vulkan_backend)
   # Define operator prototypes
   add_operator_prototype(add)
   add_operator_prototype(q8csw_linear)
-  add_operator_prototype(quantized_q4gaw_linear)
-  add_operator_prototype(quantized_int4_linear)
   add_operator_prototype(q8csw_conv2d)
+  add_operator_prototype(q4gsw_linear)
+  add_operator_prototype(choose_qparams_per_row)
 endif()

backends/vulkan/test/custom_ops/quantized_int4_linear.cpp

Lines changed: 0 additions & 366 deletions
This file was deleted.
