Remove trust_remote_code and move save to after generate

fynnsu · fynnsu · commit 3756f105a8d1 · 2025-09-26T12:07:21.000-04:00
Signed-off-by: Fynn Schmitt-Ulms <fschmitt@redhat.com>
diff --git a/examples/awq/qwen3_coder_moe_example.py b/examples/awq/qwen3_coder_moe_example.py
@@ -51,10 +51,8 @@ def preprocess(example):
 
 
 if __name__ == "__main__":
-    model = AutoModelForCausalLM.from_pretrained(
-        MODEL_ID, torch_dtype="auto", trust_remote_code=True
-    )
-    tokenizer = AutoTokenizer.from_pretrained(MODEL_ID, trust_remote_code=True)
+    model = AutoModelForCausalLM.from_pretrained(MODEL_ID, torch_dtype="auto")
+    tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
 
     ###
     ### Apply algorithms.
@@ -66,18 +64,18 @@ def preprocess(example):
         max_seq_length=MAX_SEQUENCE_LENGTH,
         num_calibration_samples=NUM_CALIBRATION_SAMPLES,
         log_dir=None,
-        trust_remote_code_model=True,
     )
 
-    model.save_pretrained(SAVE_DIR)
-    tokenizer.save_pretrained(SAVE_DIR)
-
     # Confirm generations of the quantized model look sane.
     print("========== SAMPLE GENERATION ==============")
     dispatch_for_generation(model)
     input_ids = tokenizer(
         "Write a binary search function", return_tensors="pt"
     ).input_ids.to(model.device)
-    output = model.generate(input_ids, max_new_tokens=100)
+    output = model.generate(input_ids, max_new_tokens=150)
     print(tokenizer.decode(output[0]))
     print("==========================================\n\n")
+
+    # Save model to disk
+    model.save_pretrained(SAVE_DIR)
+    tokenizer.save_pretrained(SAVE_DIR)