Skip to content

Commit 3c39f4d

Browse files
committed
fix model compilation
1 parent c8e5149 commit 3c39f4d

File tree

1 file changed

+27
-9
lines changed

1 file changed

+27
-9
lines changed

optimum/intel/openvino/modeling_visual_language.py

+27 -9
Original file line number | Diff line number | Diff line change
@@ -43,25 +43,43 @@ def __init__(
4343
self.text_emb_model = text_embeds_model
4444
self.request = None
4545
self.text_emb_request = None
46+
self._device = device
4647
compile_only = kwargs.get("compile_only", False)
4748
if compile_only:
4849
self.text_emb_request = self.text_emb_model
4950
self.request = self.model.create_infer_request()
5051

5152
super().__init__(
52-
model, config, device, dynamic_shapes, ov_config, model_save_dir, quantization_config, **kwargs
53+
model=model,
54+
config=config,
55+
device=device,
56+
dynamic_shapes=dynamic_shapes,
57+
ov_config=ov_config,
58+
model_save_dir=model_save_dir,
59+
quantization_config=quantization_config,
60+
**kwargs,
5361
)
5462

5563
def compile(self):
5664
if self.request is None:
57-
logger.info(f"Compiling the Language model to {self._device} ...")
58-
self.request = core.compile_model(self.model, self._device, self.ov_config).create_infer_request()
65+
if self._compile_only:
66+
self.request = self.model.create_infer_request()
67+
else:
68+
logger.info(f"Compiling the Language model to {self._device} ...")
69+
self.request = self._compile_model(
70+
self.model, self._device, self.ov_config, self.model_save_dir
71+
).create_infer_request()
5972
self._compile_text_emb()
6073

6174
def _compile_text_emb(self):
6275
if self.text_emb_request is None:
63-
logger.info(f"Compiling the Text embeddings model to {self._device} ...")
64-
self.text_emb_request = core.compile_model(self.text_emb_model, self._device, self.ov_config)
76+
if self._compile_only:
77+
self.text_emb_request = self.text_emb_model
78+
else:
79+
logger.info(f"Compiling the Text embeddings model to {self._device} ...")
80+
self.text_emb_request = self._compile_model(
81+
self.text_emb_model, self._device, self.ov_config, self.model_save_dir
82+
)
6583

6684
def clear_requests(self):
6785
if self._compile_only:
@@ -258,14 +276,14 @@ def __init__(
258276
self._openvino_config = OVConfig(quantization_config=quantization_config)
259277
self._set_ov_config_parameters()
260278
self.language_model = OVModelWithEmbedForCausalLM(
261-
self.lm_model,
262-
self.text_embdings_model,
279+
model=self.lm_model,
280+
text_embeds_model=self.text_embdings_model,
263281
config=config,
264-
deivce=device,
282+
device=self._device,
265283
ov_config=ov_config,
266284
model_save_dir=model_save_dir,
267285
quantization_config=quantization_config,
268-
compile=not self._compile_only,
286+
compile=self._compile_only,
269287
compile_only=self._compile_only,
270288
)
271289
self.vision_embeddings = OVVisionEmbedding(self.vision_embeddings_model, self)

0 commit comments

Comments
 (0)