Skip to content

Commit 96ace59

Browse files
authored
Update fp8_block_example.py (#1836)
- `device_map` should not be set to "auto"
1 parent 18eff29 commit 96ace59

File tree

1 file changed

+1
-3
lines changed

1 file changed

+1
-3
lines changed

examples/quantization_w8a8_fp8/fp8_block_example.py

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -7,9 +7,7 @@
 MODEL_ID = "Qwen/Qwen3-30B-A3B"
 
 # Load model.
-model = AutoModelForCausalLM.from_pretrained(
-    MODEL_ID, device_map="auto", torch_dtype="auto"
-)
+model = AutoModelForCausalLM.from_pretrained(MODEL_ID, torch_dtype="auto")
 tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
 
 # Configure the quantization algorithm and scheme.

0 commit comments

Comments
 (0)