Qualcomm AI Engine Direct - Rope Fix (#14346)

pytorchbot · winskuo-quic · web-flow · commit b752a77fadb0 · 2025-09-17T13:15:57.000-07:00
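### Summary Fix the RoPE layer selection in static_llama.py: when `config.no_rope_layer_interval` is None, every layer now uses RoPE (the previous `and` expression evaluated to None, i.e. falsy, in that case). ### Test plan CI passes. cc: @haowhsu-quic Co-authored-by: winskuo-quic <143469905+winskuo-quic@users.noreply.github.com>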
diff --git a/examples/qualcomm/oss_scripts/llama/model/static_llama.py b/examples/qualcomm/oss_scripts/llama/model/static_llama.py
@@ -75,9 +75,10 @@ def __init__(self, layer_idx: int, config: ModelArgs, output_new_cache_only=Fals
         self.enable_masked_softmax = getattr(config, "enable_masked_softmax", False)
         self.use_qk_norm = config.use_qk_norm
         self.qk_norm_before_rope = config.qk_norm_before_rope
+        # None means every layer uses RoPE; otherwise every no_rope_layer_interval-th layer skips it
         self.use_rope = (
-            config.no_rope_layer_interval
-            and (layer_idx + 1) % config.no_rope_layer_interval
+            config.no_rope_layer_interval is None
+            or (layer_idx + 1) % config.no_rope_layer_interval
         )
 
         if self.use_qk_norm: