Skip to content

Commit beaf849

Browse files
Bring back quantization_config parameter
1 parent 814d96c commit beaf849

File tree

1 file changed

+4
-1
lines changed

1 file changed

+4
-1
lines changed

optimum/intel/openvino/modeling_decoder.py

+4 -1
Original file line number | Diff line number | Diff line change
@@ -761,6 +761,7 @@ def _from_pretrained(
761761
config=config,
762762
model_save_dir=model_cache_path.parent,
763763
compile=enable_compilation,
764+
quantization_config=quantization_config,
764765
**kwargs,
765766
)
766767

@@ -782,7 +783,9 @@ def _from_pretrained(
782783
quantizer = OVQuantizer(causal_model)
783784
quantization_config_copy = copy.deepcopy(quantization_config)
784785
quantization_config_copy.tokenizer = quantization_config.tokenizer or model_id
785-
quantizer.quantize(ov_config=OVConfig(quantization_config=quantization_config_copy))
786+
ov_config = OVConfig(quantization_config=quantization_config_copy)
787+
quantizer.quantize(ov_config=ov_config)
788+
786789

787790
return causal_model
788791

0 commit comments

Comments
 (0)