@@ -265,7 +265,8 @@ EncodedImage VisionEncoderPhi3V::encode(const ov::Tensor& image, const ov::AnyMa
265
265
encoder.set_input_tensor (pixel_values);
266
266
ov::Tensor res{ov::element::f32, encoder.get_output_tensor ().get_shape ()};
267
267
encoder.set_output_tensor (res);
268
- encoder.infer ();
268
+ encoder.start_async ();
269
+ encoder.wait ();
269
270
return {std::move (res), image_size};
270
271
}
271
272
@@ -410,7 +411,8 @@ ov::Tensor reshape_hd_patches_2x2merge(const ov::Tensor& image_features, size_t
410
411
hd_feature_transformer.set_input_tensor (1 , height);
411
412
ov::Tensor width{ov::element::i32, {}, &w_crop};
412
413
hd_feature_transformer.set_input_tensor (2 , width);
413
- hd_feature_transformer.infer ();
414
+ hd_feature_transformer.start_async ();
415
+ hd_feature_transformer.wait ();
414
416
return hd_feature_transformer.get_output_tensor ();
415
417
}
416
418
@@ -477,7 +479,8 @@ ov::Tensor hd_feature_transform(const EncodedImage& image_features, InferRequest
477
479
ov::Tensor sub_image_features_hd_newline = add_image_newline (sub_image_features_hd, sub_GN); // [1,h_crop*12*(w_crop*12+1), 4096]
478
480
ov::Tensor image_embeddings = concatenate_2d (sub_image_features_hd_newline, glb_GN, global_image_features_hd_newline); // [1,l,4096]
479
481
vision_projection.set_input_tensor (image_embeddings);
480
- vision_projection.infer ();
482
+ vision_projection.start_async ();
483
+ vision_projection.wait ();
481
484
ov::Tensor out = vision_projection.get_output_tensor ();
482
485
ov::Tensor res{out.get_element_type (), out.get_shape ()};
483
486
out.copy_to (res);
0 commit comments