Add docs

nikita-savelyevv · nikita-savelyevv · commit 65679a5627ff · 2025-02-27T16:19:55.000+01:00
diff --git a/docs/source/openvino/optimization.mdx b/docs/source/openvino/optimization.mdx
@@ -87,6 +87,8 @@ quantization_config = OVWeightQuantizationConfig(
 )
 ```
 
+Note: `OVWeightQuantizationConfig` also accepts keyword arguments that are not listed in its constructor. Any such arguments are passed directly to the `nncf.compress_weights()` call, which is useful for supplying additional parameters to the quantization algorithm.
+
 By default the quantization scheme will be [asymmetric](https://github.com/openvinotoolkit/nncf/blob/develop/docs/usage/training_time_compression/other_algorithms/LegacyQuantization.md#asymmetric-quantization), to make it [symmetric](https://github.com/openvinotoolkit/nncf/blob/develop/docs/usage/training_time_compression/other_algorithms/LegacyQuantization.md#symmetric-quantization) you can add `sym=True`.
 
 For 4-bit quantization you can also specify the following arguments in the quantization configuration :
diff --git a/optimum/intel/openvino/quantization.py b/optimum/intel/openvino/quantization.py
@@ -1044,6 +1044,7 @@ def _weight_only_quantization(
             f"by the ones given in _weight_only_quantization call kwargs: {kwargs_intersection}."
         )
     wc_kwargs.update(kwargs)
+    wc_kwargs.pop("weight_only", None)
 
     compressed_model = nncf.compress_weights(
         model,
@@ -1076,6 +1077,7 @@ def _full_quantization(
             f"by the ones given in _full_quantization call kwargs: {kwargs_intersection}."
         )
     q_kwargs.update(kwargs)
+    q_kwargs.pop("weight_only", None)
 
     quantized_model = nncf.quantize(model, calibration_dataset=calibration_dataset, **q_kwargs)
 

Original file line number	Diff line number	Diff line change
`@@ -87,6 +87,8 @@ quantization_config = OVWeightQuantizationConfig(`
`87`	`87`	`)`
`88`	`88`	```
`89`	`89`
	`90`	+Note: `OVWeightQuantizationConfig` also accepts keyword arguments that are not listed in its constructor. Any such arguments are passed directly to the `nncf.compress_weights()` call, which is useful for supplying additional parameters to the quantization algorithm.
	`91`	`+`
`90`	`92`	By default the quantization scheme will be [asymmetric](https://github.com/openvinotoolkit/nncf/blob/develop/docs/usage/training_time_compression/other_algorithms/LegacyQuantization.md#asymmetric-quantization), to make it [symmetric](https://github.com/openvinotoolkit/nncf/blob/develop/docs/usage/training_time_compression/other_algorithms/LegacyQuantization.md#symmetric-quantization) you can add `sym=True`.
`91`	`93`
`92`	`94`	`For 4-bit quantization you can also specify the following arguments in the quantization configuration :`
Original file line number	Diff line number	Diff line change
`@@ -1044,6 +1044,7 @@ def _weight_only_quantization(`
`1044`	`1044`	`f"by the ones given in _weight_only_quantization call kwargs: {kwargs_intersection}."`
`1045`	`1045`	`)`
`1046`	`1046`	`wc_kwargs.update(kwargs)`
	`1047`	`+ wc_kwargs.pop("weight_only", None)`
`1047`	`1048`
`1048`	`1049`	`compressed_model = nncf.compress_weights(`
`1049`	`1050`	`model,`
`@@ -1076,6 +1077,7 @@ def _full_quantization(`
`1076`	`1077`	`f"by the ones given in _full_quantization call kwargs: {kwargs_intersection}."`
`1077`	`1078`	`)`
`1078`	`1079`	`q_kwargs.update(kwargs)`
	`1080`	`+ q_kwargs.pop("weight_only", None)`
`1079`	`1081`
`1080`	`1082`	`quantized_model = nncf.quantize(model, calibration_dataset=calibration_dataset, **q_kwargs)`
`1081`	`1083`