Update on "[ET-VK] Implement linear_dq8ta_q4gsw"

ssjia · ssjia · commit 45d9b43680b6 · 2025-09-08T12:32:38.000-07:00
Title says it all! Build upon the support for quantized linear introduced in the previous diffs to enable dynamically quantized linear. Also included in this diff is a cleanup of the glslh files used across quantized linear implementations. Differential Revision: [D81931060](https://our.internmc.facebook.com/intern/diff/D81931060/) [ghstack-poisoned]
diff --git a/backends/vulkan/patterns/quantized_linear.py b/backends/vulkan/patterns/quantized_linear.py
@@ -181,6 +181,9 @@ def is_input_dynamic_perchannel_quantized(self) -> bool:
         if self.quantize_input_node is None:
             return False
 
+        if not isinstance(self.input_scales_node, torch.fx.Node):
+            return False
+
         # For dynamic quantization, input scale node should be a getitem operator
         # retrieving the output of a choose_qparams op
         if self.input_scales_node.target != operator.getitem: