Skip to content

Commit 40c6211

Browse files
committed
update
1 parent a215aae commit 40c6211

File tree

2 files changed

+4
-2
lines changed

2 files changed

+4
-2
lines changed

examples/quantization_w4a4_fp4/qwen3_5_moe.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -5,6 +5,7 @@
55
import torch
66

77
MODEL_ID = "/raid/engine/dsikka/models--Qwen--Qwen3.5-397B-A17B/snapshots/7cad2bae11cb49ca79f7d6a0954de2e2756f4e27"
8+
MODEL_ID = "Qwen/Qwen3.5-122B-A10B"
89

910
# Load model.
1011
model = Qwen3_5MoeForConditionalGeneration.from_pretrained(MODEL_ID, dtype="auto")
@@ -82,6 +83,6 @@ def data_collator(batch):
8283
moe_calibrate_all_experts=True)
8384

8485
# Save to disk in compressed-tensors format.
85-
SAVE_DIR = "/raid/engine/dsikka/" + "Qwen3.5-397B-A17B" + "-NVFP4"
86+
SAVE_DIR = "/mnt/nvme_stripe/playground/dsikka/" + "Qwen3.5-122B-A10B" + "-NVFP4"
8687
model.save_pretrained(SAVE_DIR)
8788
processor.save_pretrained(SAVE_DIR)

examples/quantization_w8a8_fp8/qwen3_5_moe.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,6 +4,7 @@
44
from llmcompressor.modifiers.quantization import QuantizationModifier
55

66
MODEL_ID = "/raid/engine/dsikka/models--Qwen--Qwen3.5-397B-A17B/snapshots/7cad2bae11cb49ca79f7d6a0954de2e2756f4e27"
7+
MODEL_ID = "Qwen/Qwen3.5-122B-A10B"
78

89
# Load model.
910
model = Qwen3_5MoeForConditionalGeneration.from_pretrained(MODEL_ID, dtype="auto")
@@ -33,6 +34,6 @@
3334
oneshot(model=model, recipe=recipe)
3435

3536
# Save to disk in compressed-tensors format.
36-
SAVE_DIR = "/raid/engine/dsikka/" + "Qwen3.5-397B-A17B" + "-FP8-Dynamic-NoLinearAttn"
37+
SAVE_DIR = "/mnt/nvme_stripe/playground/dsikka/" + "Qwen3.5-122B-A10B" + "-FP8_DYNAMIC"
3738
model.save_pretrained(SAVE_DIR)
3839
processor.save_pretrained(SAVE_DIR)

0 commit comments

Comments
 (0)