File tree 2 files changed +2
-6
lines changed
2 files changed +2
-6
lines changed Original file line number Diff line number Diff line change @@ -253,6 +253,8 @@ def _set_ov_config_parameters(self):
253
253
q_config = self ._openvino_config .quantization_config if self ._openvino_config else None
254
254
if isinstance (q_config , OVDynamicQuantizationConfig ):
255
255
self .ov_config ["DYNAMIC_QUANTIZATION_GROUP_SIZE" ] = str (q_config .activations_group_size )
256
+ if self .can_generate () and "KV_CACHE_PRECISION" not in self .ov_config :
257
+ self .ov_config ["KV_CACHE_PRECISION" ] = "u8"
256
258
257
259
@staticmethod
258
260
def _cached_file (
Original file line number Diff line number Diff line change @@ -328,12 +328,6 @@ def _make_stateful(self):
328
328
patch_stateful (self .config , self .model )
329
329
self .stateful = True
330
330
331
- def _set_ov_config_parameters (self ):
332
- super ()._set_ov_config_parameters ()
333
-
334
- if "DYNAMIC_QUANTIZATION_GROUP_SIZE" in self .ov_config and "KV_CACHE_PRECISION" not in self .ov_config :
335
- self .ov_config ["KV_CACHE_PRECISION" ] = "u8"
336
-
337
331
338
332
@add_start_docstrings (
339
333
"""
You can’t perform that action at this time.
0 commit comments