|
52 | 52 | "import transformers\n",
|
53 | 53 | "from pathlib import Path\n",
|
54 | 54 | "from openvino.runtime import Core\n",
|
55 |
| - "from optimum.intel import OVStableDiffusionPipeline, OVWeightQuantizationConfig\n", |
| 55 | + "from optimum.intel import OVConfig, OVQuantizer, OVStableDiffusionPipeline, OVWeightQuantizationConfig\n", |
56 | 56 | "\n",
|
57 | 57 | "transformers.logging.set_verbosity_error()\n",
|
58 | 58 | "datasets.logging.set_verbosity_error()"
|
|
198 | 198 | },
|
199 | 199 | "outputs": [],
|
200 | 200 | "source": [
|
201 |
| - "quantization_config = OVWeightQuantizationConfig(bits=8, dataset=calibration_dataset, num_samples=NUM_SAMPLES)\n", |
202 |
| - "int8_pipe = OVStableDiffusionPipeline.from_pretrained(model_id=MODEL_ID, export=True, quantization_config=quantization_config)\n", |
203 |
| - "int8_pipe.save_pretrained(int8_model_path)" |
| 201 | + "quantization_config = OVWeightQuantizationConfig(bits=8, num_samples=NUM_SAMPLES)\n", |
| 202 | + "int8_pipe = OVStableDiffusionPipeline.from_pretrained(model_id=MODEL_ID, export=True)\n", |
| 203 | + "quantizer = OVQuantizer(int8_pipe)\n", |
| 204 | + "quantizer.quantize(\n", |
| 205 | + " ov_config=OVConfig(quantization_config=quantization_config),\n", |
| 206 | + " calibration_dataset=calibration_dataset,\n", |
| 207 | + " save_directory=int8_model_path\n", |
| 208 | + ")" |
204 | 209 | ]
|
205 | 210 | },
|
206 | 211 | {
|
|
613 | 618 | "name": "python",
|
614 | 619 | "nbconvert_exporter": "python",
|
615 | 620 | "pygments_lexer": "ipython3",
|
616 |
| - "version": "3.11.7" |
| 621 | + "version": "3.8.10" |
617 | 622 | }
|
618 | 623 | },
|
619 | 624 | "nbformat": 4,
|
|
0 commit comments