@@ -265,7 +265,8 @@ EncodedImage VisionEncoderPhi3V::encode(const ov::Tensor& image, const ov::AnyMa
265265 encoder.set_input_tensor (pixel_values);
266266 ov::Tensor res{ov::element::f32 , encoder.get_output_tensor ().get_shape ()};
267267 encoder.set_output_tensor (res);
268- encoder.infer ();
268+ encoder.start_async ();
269+ encoder.wait ();
269270 return {std::move (res), image_size};
270271}
271272
@@ -410,7 +411,8 @@ ov::Tensor reshape_hd_patches_2x2merge(const ov::Tensor& image_features, size_t
410411 hd_feature_transformer.set_input_tensor (1 , height);
411412 ov::Tensor width{ov::element::i32 , {}, &w_crop};
412413 hd_feature_transformer.set_input_tensor (2 , width);
413- hd_feature_transformer.infer ();
414+ hd_feature_transformer.start_async ();
415+ hd_feature_transformer.wait ();
414416 return hd_feature_transformer.get_output_tensor ();
415417}
416418
@@ -477,7 +479,8 @@ ov::Tensor hd_feature_transform(const EncodedImage& image_features, InferRequest
477479 ov::Tensor sub_image_features_hd_newline = add_image_newline (sub_image_features_hd, sub_GN); // [1,h_crop*12*(w_crop*12+1), 4096]
478480 ov::Tensor image_embeddings = concatenate_2d (sub_image_features_hd_newline, glb_GN, global_image_features_hd_newline); // [1,l,4096]
479481 vision_projection.set_input_tensor (image_embeddings);
480- vision_projection.infer ();
482+ vision_projection.start_async ();
483+ vision_projection.wait ();
481484 ov::Tensor out = vision_projection.get_output_tensor ();
482485 ov::Tensor res{out.get_element_type (), out.get_shape ()};
483486 out.copy_to (res);
0 commit comments