We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 814d96c, commit beaf849 (Copy full SHA for beaf849)
optimum/intel/openvino/modeling_decoder.py
@@ -761,6 +761,7 @@ def _from_pretrained(
761
config=config,
762
model_save_dir=model_cache_path.parent,
763
compile=enable_compilation,
764
+ quantization_config=quantization_config,
765
**kwargs,
766
)
767
@@ -782,7 +783,9 @@ def _from_pretrained(
782
783
quantizer = OVQuantizer(causal_model)
784
quantization_config_copy = copy.deepcopy(quantization_config)
785
quantization_config_copy.tokenizer = quantization_config.tokenizer or model_id
- quantizer.quantize(ov_config=OVConfig(quantization_config=quantization_config_copy))
786
+ ov_config = OVConfig(quantization_config=quantization_config_copy)
787
+ quantizer.quantize(ov_config=ov_config)
788
+
789
790
return causal_model
791
0 commit comments