Skip to content

Commit e8a9f57

Browse files
committed
add default config for causal LM
1 parent 9cefecf commit e8a9f57

File tree

1 file changed

+4
-1
lines changed

1 file changed

+4
-1
lines changed

optimum/intel/openvino/modeling_decoder.py

+4 -1
Original file line number | Diff line number | Diff line change
@@ -34,7 +34,7 @@
34 34
from ...exporters.openvino.stateful import model_has_state
35 35
from ..utils.import_utils import is_nncf_available
36 36
from ..utils.modeling_utils import MULTI_QUERY_ATTN_MODELS
37 -
from .configuration import OVConfig, OVWeightQuantizationConfig, _check_default_4bit_configs
37 +
from .configuration import _DEFAULT_4BIT_CONFIGS, OVConfig, OVWeightQuantizationConfig, _check_default_4bit_configs
38 38
from .modeling import _TOKENIZER_FOR_DOC, INPUTS_DOCSTRING, MODEL_START_DOCSTRING, OVModel
39 39
from .utils import ONNX_WEIGHTS_NAME, OV_XML_FILE_NAME, STR_TO_OV_TYPE
40 40

@@ -581,6 +581,9 @@ def _from_pretrained(
581 581
quantization_config = quantization_config or {"bits": 8}
582 582

583 583
if isinstance(quantization_config, dict):
584 +
if quantization_config == {"bits": 4} and config.name_or_path in _DEFAULT_4BIT_CONFIGS:
585 +
quantization_config = _DEFAULT_4BIT_CONFIGS[config.name_or_path]
586 +
584 587
quantization_config = OVWeightQuantizationConfig.from_dict(quantization_config)
585 588

586 589
load_in_4bit = quantization_config.bits == 4 if quantization_config else False

0 commit comments

Comments
 (0)