diff --git a/backends/cadence/aot/compiler.py b/backends/cadence/aot/compiler.py index 5ddcfcf414b..c19a4296f6a 100644 --- a/backends/cadence/aot/compiler.py +++ b/backends/cadence/aot/compiler.py @@ -131,7 +131,10 @@ def quantize_pt2( Prepare, convert and fuse the model using the given quantizer. Returns a GraphModule with the quantized model. """ - # Quantizer + # Put the model in inference mode by calling model.eval() + model.eval() + + # Fall back to a default CadenceQuantizer if no quantizer was supplied if not quantizer: quantizer = CadenceQuantizer()