diff --git a/optimum/exporters/openvino/utils.py b/optimum/exporters/openvino/utils.py index 1743dc59b1..e00708c8eb 100644 --- a/optimum/exporters/openvino/utils.py +++ b/optimum/exporters/openvino/utils.py @@ -295,6 +295,14 @@ def save_preprocessors( if is_transformers_version(">=", "4.45") and model_type == "phi3-v" and len(preprocessors) > 1: if not hasattr(preprocessors[1], "chat_template"): preprocessors[1].chat_template = getattr(preprocessors[0], "chat_template", None) + if ( + is_transformers_version(">=", "4.45") + and model_type in ["llava", "llava-next"] + and preprocessors is not None + ): + if getattr(preprocessors[1], "patch_size", None) is None: + preprocessors[1].patch_size = config.vision_config.patch_size + preprocessors[1].vision_feature_select_strategy = config.vision_feature_select_strategy for processor in preprocessors: try: processor.save_pretrained(output) diff --git a/optimum/intel/openvino/modeling_visual_language.py b/optimum/intel/openvino/modeling_visual_language.py index 435f656c60..4b2c5ee031 100644 --- a/optimum/intel/openvino/modeling_visual_language.py +++ b/optimum/intel/openvino/modeling_visual_language.py @@ -1021,7 +1021,7 @@ def preprocess_inputs( else: prompt = text - if getattr(processor, "patch_size", None) is None: + if is_transformers_version(">", "4.47.99") and getattr(processor, "patch_size", None) is None: if ( getattr(config, "vision_config", None) is not None and getattr(config.vision_config, "patch_size", None) is not None