Update optimum/intel/openvino/modeling_visual_language.py

eaidova · eaidova · commit 5e732dae9311 · 2025-03-05T13:56:00.000+04:00
diff --git a/optimum/intel/openvino/modeling_visual_language.py b/optimum/intel/openvino/modeling_visual_language.py
@@ -1426,15 +1426,17 @@ def load_image(image, input_size=448, max_num=12):
             pixel_values = [transform(image) for image in images]
             pixel_values = torch.stack(pixel_values)
             return pixel_values
-        
+
         if image is not None and "<image>" not in text:
             text = "<image>\n" + text
 
         if tokenizer.chat_template is not None:
-            text = tokenizer.apply_chat_template([{"role": "user", "content": text}], add_generation_prompt=True, tokenize=False)
-        
+            text = tokenizer.apply_chat_template(
+                [{"role": "user", "content": text}], add_generation_prompt=True, tokenize=False
+            )
+
         inputs = {}
-            
+
         if image is not None:
             if config is None:
                 raise ValueError("Config is required.")
@@ -1446,7 +1448,6 @@ def load_image(image, input_size=448, max_num=12):
             )
             image_tokens = IMG_START_TOKEN + IMG_CONTEXT_TOKEN * num_image_token * num_patches + IMG_END_TOKEN
             text = text.replace("<image>", image_tokens, 1)
-            logger.warn(text)
             inputs.update({"pixel_values": pixel_values})
         inputs.update(tokenizer(text, return_tensors="pt"))
         return inputs