Skip to content

Commit a06522c

Browse files
authored
Add dynamic quantization config (#661)
* add warning
* add model arch
* remove calibration dataset argument
* format
* remove comments
* replace preset with sym for compatibility between configs
* format
* add dynamic quantization
* add dynamic config
* remove test deprecated config parameter
* add bits and sym to base config
* add config test
* format
* add kv cache precision
* format
* add test
* move compilation step
* set kv cache precision for seq2seq models
1 parent 673b88b commit a06522c

10 files changed

+247
-260
lines changed

optimum/intel/__init__.py

+22-3
Original file line number | Diff line number | Diff line change
@@ -60,11 +60,23 @@
6060
raise OptionalDependencyNotAvailable()
6161
except OptionalDependencyNotAvailable:
6262
_import_structure["utils.dummy_openvino_and_nncf_objects"].extend(
63-
["OVQuantizer", "OVTrainingArguments", "OVQuantizationConfig", "OVWeightQuantizationConfig"]
63+
[
64+
"OVQuantizer",
65+
"OVTrainingArguments",
66+
"OVQuantizationConfig",
67+
"OVWeightQuantizationConfig",
68+
"OVDynamicQuantizationConfig",
69+
]
6470
)
6571
else:
6672
_import_structure["openvino"].extend(
67-
["OVQuantizer", "OVTrainingArguments", "OVQuantizationConfig", "OVWeightQuantizationConfig"]
73+
[
74+
"OVQuantizer",
75+
"OVTrainingArguments",
76+
"OVQuantizationConfig",
77+
"OVWeightQuantizationConfig",
78+
"OVDynamicQuantizationConfig",
79+
]
6880
)
6981

7082

@@ -192,13 +204,20 @@
192204
raise OptionalDependencyNotAvailable()
193205
except OptionalDependencyNotAvailable:
194206
from .utils.dummy_openvino_and_nncf_objects import (
207+
OVDynamicQuantizationConfig,
195208
OVQuantizationConfig,
196209
OVQuantizer,
197210
OVTrainingArguments,
198211
OVWeightQuantizationConfig,
199212
)
200213
else:
201-
from .openvino import OVQuantizationConfig, OVQuantizer, OVTrainingArguments, OVWeightQuantizationConfig
214+
from .openvino import (
215+
OVDynamicQuantizationConfig,
216+
OVQuantizationConfig,
217+
OVQuantizer,
218+
OVTrainingArguments,
219+
OVWeightQuantizationConfig,
220+
)
202221

203222
try:
204223
if not (is_openvino_available() and is_nncf_available() and is_accelerate_available()):

optimum/intel/openvino/__init__.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -43,7 +43,7 @@
4343
from .trainer import OVTrainer
4444

4545

46-
from .configuration import OVConfig, OVQuantizationConfig, OVWeightQuantizationConfig
46+
from .configuration import OVConfig, OVDynamicQuantizationConfig, OVQuantizationConfig, OVWeightQuantizationConfig
4747
from .modeling import (
4848
OVModelForAudioClassification,
4949
OVModelForAudioFrameClassification,

0 commit comments

Comments
 (0)