remove layer_idx

Sanggyu Lee · Sanggyu Lee · commit f97e9883122d · 2025-11-04T14:09:20.000+09:00
diff --git a/tico/serialize/operators/onert/op_attention.py b/tico/serialize/operators/onert/op_attention.py
@@ -41,8 +41,7 @@
     Tensor attention_mask,
     Tensor past_key,
     Tensor past_value,
-    Tensor cache_position,
-    int layer_idx
+    Tensor cache_position
 ) -> Tensor
 """
 )
@@ -63,8 +62,7 @@ def attention_llama(*args, **kwargs):
         attention_mask,
         past_key,
         past_value,
-        cache_position,
-        layer_idx,
+        cache_position
     ) = args
     return hidden_states
 
@@ -104,8 +102,7 @@ def llama_attention_forward_adapter(
             #    k_cache[0] | k_cache[1] | ...  | k_cache[n]
             key_cache[self.layer_idx],
             value_cache[self.layer_idx],  # Same to value_cache
-            cache_position,
-            self.layer_idx,
+            cache_position
         ),
         None,
     )
@@ -136,7 +133,6 @@ def define_node(
             past_key,
             past_value,
             cache_position,
-            layer_idx,
         ) = node.args
 
         op_index = get_op_index(
@@ -153,9 +149,6 @@ def define_node(
         operator.builtinOptionsType = (
             circle.BuiltinOptions.BuiltinOptions.AttentionOptions
         )
-        option = circle.AttentionOptions.AttentionOptionsT()
-        option.layer_idx = layer_idx
-
-        operator.builtinOptions = option
+        operator.builtinOptions = circle.AttentionOptions.AttentionOptionsT()
 
         return operator