We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 35cf1d2, commit 1e519c7 (Copy full SHA for 1e519c7)
optimum/exporters/openvino/__main__.py
@@ -474,9 +474,6 @@ class StoreAttr(object):
474
from optimum.intel.openvino.quantization import _weight_only_quantization
475
476
_weight_only_quantization(submodel, quantization_config)
477
- if "text-generation" in task:
478
- submodel.set_rt_info("u8", ["runtime_options", "KV_CACHE_PRECISION"])
479
-
480
compressed_submodel_path = submodel_path.parent / f"{submodel_path.stem}_compressed.xml"
481
save_model(submodel, compressed_submodel_path, compress_to_fp16=False)
482
del submodel
0 commit comments