|
52 | 52 | "import transformers\n", |
53 | 53 | "from pathlib import Path\n", |
54 | 54 | "from openvino.runtime import Core\n", |
55 | | - "from optimum.intel import OVStableDiffusionPipeline, OVWeightQuantizationConfig\n", |
| 55 | + "from optimum.intel import OVConfig, OVQuantizer, OVStableDiffusionPipeline, OVWeightQuantizationConfig\n", |
56 | 56 | "\n", |
57 | 57 | "transformers.logging.set_verbosity_error()\n", |
58 | 58 | "datasets.logging.set_verbosity_error()" |
|
198 | 198 | }, |
199 | 199 | "outputs": [], |
200 | 200 | "source": [ |
201 | | - "quantization_config = OVWeightQuantizationConfig(bits=8, dataset=calibration_dataset, num_samples=NUM_SAMPLES)\n", |
202 | | - "int8_pipe = OVStableDiffusionPipeline.from_pretrained(model_id=MODEL_ID, export=True, quantization_config=quantization_config)\n", |
203 | | - "int8_pipe.save_pretrained(int8_model_path)" |
| 201 | + "quantization_config = OVWeightQuantizationConfig(bits=8, num_samples=NUM_SAMPLES)\n", |
| 202 | + "int8_pipe = OVStableDiffusionPipeline.from_pretrained(model_id=MODEL_ID, export=True)\n", |
| 203 | + "quantizer = OVQuantizer(int8_pipe)\n", |
| 204 | + "quantizer.quantize(\n", |
| 205 | + " ov_config=OVConfig(quantization_config=quantization_config),\n", |
| 206 | + " calibration_dataset=calibration_dataset,\n", |
| 207 | + " save_directory=int8_model_path\n", |
| 208 | + ")" |
204 | 209 | ] |
205 | 210 | }, |
206 | 211 | { |
|
613 | 618 | "name": "python", |
614 | 619 | "nbconvert_exporter": "python", |
615 | 620 | "pygments_lexer": "ipython3", |
616 | | - "version": "3.11.7" |
| 621 | + "version": "3.8.10" |
617 | 622 | } |
618 | 623 | }, |
619 | 624 | "nbformat": 4, |
|
0 commit comments