We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent ecb7d93 commit 27e6f07Copy full SHA for 27e6f07
examples/quantization_w8a8_fp8/qwen3_vl_moe_fp8_block_example.py
@@ -5,8 +5,12 @@
5
from llmcompressor.modeling import replace_modules_for_calibration
6
from llmcompressor.modifiers.quantization import QuantizationModifier
7
8
+# NOTE: Qwen3-VL-MoE support is not in transformers<=4.56.2
9
+# you may need to install transformers from source
10
+
11
MODEL_ID = "Qwen/Qwen3-VL-235B-A22B-Instruct"
12
13
14
# Load model.
15
model = Qwen3VLMoeForConditionalGeneration.from_pretrained(MODEL_ID, torch_dtype="auto")
16
model = replace_modules_for_calibration(model)
0 commit comments