@@ -25,31 +25,20 @@ def save_config_to_constant_methods(
 ):
     # Initialize metadata with values from model config
     metadata = {
-        "get_dtype": 5 if config.torch_dtype == torch.float16 else 6,
         "get_bos_id": getattr(config, "bos_token_id", None),
         "get_eos_id": getattr(config, "eos_token_id", None),
-        "get_head_dim": getattr(config, "head_dim", None),
-        "get_n_kv_heads": getattr(config, "num_key_value_heads", None),
-        "get_n_layers": getattr(config, "num_hidden_layers", None),
         "get_vocab_size": getattr(config, "vocab_size", None),
-        "get_max_batch_size": 1,
         "get_max_seq_len": getattr(config, "max_position_embeddings", None),
         "use_kv_cache": getattr(generation_config, "use_cache", None),
-        "sliding_window": getattr(config, "sliding_window", None),
-        "decoder_start_token_id": getattr(config, "decoder_start_token_id", None),
-        "use_sdpa_with_kv_cache": "custom_sdpa" in config._attn_implementation,
+        "use_sdpa_with_kv_cache": False,
     }

     # Safely access fields from generation_config if it exists
     if generation_config is not None:
         # Check for cache_config and its attributes
         cache_config = getattr(generation_config, "cache_config", None)
         if cache_config is not None:
-            max_batch_size = getattr(cache_config, "batch_size", None)
             max_seq_len = getattr(cache_config, "max_cache_len", None)
-
-            if max_batch_size is not None:
-                metadata["get_max_batch_size"] = max_batch_size
             if max_seq_len is not None:
                 metadata["get_max_seq_len"] = max_seq_len

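For reference, a minimal, self-contained sketch of what the trimmed-down metadata construction produces after this change. The SimpleNamespace objects below are hypothetical stand-ins for the Hugging Face model config and generation config, not part of this PR:

from types import SimpleNamespace

# Hypothetical stand-ins for a model config and generation config,
# used only to illustrate the metadata produced after this patch.
config = SimpleNamespace(
    bos_token_id=1,
    eos_token_id=2,
    vocab_size=32000,
    max_position_embeddings=4096,
)
generation_config = SimpleNamespace(
    use_cache=True,
    cache_config=SimpleNamespace(max_cache_len=2048),
)

# Mirrors the post-patch body of save_config_to_constant_methods
metadata = {
    "get_bos_id": getattr(config, "bos_token_id", None),
    "get_eos_id": getattr(config, "eos_token_id", None),
    "get_vocab_size": getattr(config, "vocab_size", None),
    "get_max_seq_len": getattr(config, "max_position_embeddings", None),
    "use_kv_cache": getattr(generation_config, "use_cache", None),
    "use_sdpa_with_kv_cache": False,
}
if generation_config is not None:
    cache_config = getattr(generation_config, "cache_config", None)
    if cache_config is not None:
        max_seq_len = getattr(cache_config, "max_cache_len", None)
        if max_seq_len is not None:
            # cache_config's max_cache_len overrides max_position_embeddings
            metadata["get_max_seq_len"] = max_seq_len

print(metadata["get_max_seq_len"])  # 2048, taken from cache_config

Note that with this patch, batch size is no longer recorded in metadata at all, and "get_max_seq_len" is the only entry that cache_config can still override.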