Skip to content

Commit 47fe50c

Browse files
[GPU] 2.0 plugin api impl (openvinotoolkit#18920)
1 parent 8e0d8dd commit 47fe50c

File tree

90 files changed

+3416
-6316
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

90 files changed

+3416
-6316
lines changed

src/bindings/c/tests/ov_remote_context_test.cpp

+4-4
Original file line numberDiff line numberDiff line change
@@ -360,9 +360,9 @@ TEST_P(ov_remote_context_ocl, create_remote_tensor_nv12_from_ocl_image2D) {
360360
const int height = 480;
361361
const int width = 640;
362362
ov_shape_t shape_y = {0, nullptr};
363-
int64_t dims_y[4] = {1, 1, height, width};
363+
int64_t dims_y[4] = {1, height, width, 1};
364364
ov_shape_t shape_uv = {0, nullptr};
365-
int64_t dims_uv[4] = {1, 2, height / 2, width / 2};
365+
int64_t dims_uv[4] = {1, height / 2, width / 2, 2};
366366

367367
cl_int err;
368368
cl_image_format image_format;
@@ -555,9 +555,9 @@ TEST_P(ov_remote_context_ocl, remote_tensor_nv12_inference) {
555555
EXPECT_NE(nullptr, context);
556556

557557
ov_shape_t shape_y = {0, nullptr};
558-
int64_t dims_y[4] = {1, 1, height, width};
558+
int64_t dims_y[4] = {1, height, width, 1};
559559
ov_shape_t shape_uv = {0, nullptr};
560-
int64_t dims_uv[4] = {1, 2, height / 2, width / 2};
560+
int64_t dims_uv[4] = {1, height / 2, width / 2, 2};
561561

562562
cl_int err;
563563
cl_image_format image_format;

src/inference/dev_api/openvino/runtime/isync_infer_request.hpp

+1-1
Original file line numberDiff line numberDiff line change
@@ -151,12 +151,12 @@ class OPENVINO_RUNTIME_API ISyncInferRequest : public IInferRequest {
151151
const std::function<void(ov::SoPtr<ov::ITensor>& tensor)>& allocate_callback);
152152

153153
std::unordered_map<std::shared_ptr<ov::descriptor::Tensor>, std::vector<ov::SoPtr<ov::ITensor>>> m_batched_tensors;
154+
ov::SoPtr<ov::ITensor>& get_tensor_ptr(const ov::Output<const ov::Node>& port) const;
154155

155156
private:
156157
std::shared_ptr<const ov::ICompiledModel> m_compiled_model;
157158
// Mutable to return reference to ov::Tensor
158159
mutable std::unordered_map<std::shared_ptr<ov::descriptor::Tensor>, ov::SoPtr<ov::ITensor>> m_tensors;
159-
ov::SoPtr<ov::ITensor>& get_tensor_ptr(const ov::Output<const ov::Node>& port) const;
160160

161161
/**
162162
* @brief Finds input or output port

src/inference/dev_api/openvino/runtime/make_tensor.hpp

+1-1
Original file line numberDiff line numberDiff line change
@@ -67,7 +67,7 @@ OPENVINO_RUNTIME_API ov::SoPtr<ov::ITensor> get_tensor_impl(const ov::Tensor& te
6767

6868
IE_SUPPRESS_DEPRECATED_START
6969
/** @cond INTERNAL */
70-
ov::SoPtr<ITensor> make_tensor(const std::shared_ptr<InferenceEngine::Blob>& tensor);
70+
ov::SoPtr<ITensor> make_tensor(const std::shared_ptr<InferenceEngine::Blob>& tensor, bool unwrap = false);
7171
const InferenceEngine::Blob* get_hardware_blob(const InferenceEngine::Blob* blob);
7272
InferenceEngine::Blob* get_hardware_blob(InferenceEngine::Blob* blob);
7373

+184
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,184 @@
1+
// Copyright (C) 2018-2023 Intel Corporation
2+
// SPDX-License-Identifier: Apache-2.0
3+
//
4+
5+
#pragma once
6+
7+
#include "ie_ngraph_utils.hpp"
8+
#include "ie_remote_blob.hpp"
9+
#include "ie_remote_context.hpp"
10+
#include "openvino/runtime/iremote_context.hpp"
11+
12+
namespace ov {
13+
namespace legacy_convert {
14+
15+
INFERENCE_ENGINE_API_CPP(ov::SoPtr<ov::IRemoteContext>)
16+
convert_remote_context(const std::shared_ptr<InferenceEngine::RemoteContext>& context);
17+
INFERENCE_ENGINE_API_CPP(ie::Blob*) get_hardware_blob(ie::Blob* blob);
18+
19+
class INFERENCE_ENGINE_API_CLASS(TensorHolder) {
20+
public:
21+
TensorHolder(ov::SoPtr<ov::ITensor> tensor) : _tensor(tensor) {}
22+
23+
const ov::SoPtr<ov::ITensor>& get_tensor() const {
24+
return _tensor;
25+
}
26+
27+
private:
28+
ov::SoPtr<ov::ITensor> _tensor;
29+
};
30+
31+
} // namespace legacy_convert
32+
33+
/**
34+
 * @brief Tensor that contains an InferenceEngine::RemoteBlob inside
35+
* Blob owns the memory
36+
*/
37+
class INFERENCE_ENGINE_API_CLASS(RemoteBlobTensor) : public IRemoteTensor {
38+
mutable element::Type m_type;
39+
mutable Shape m_shape;
40+
mutable Strides m_strides;
41+
mutable ov::AnyMap m_properties;
42+
mutable std::string m_dev_name;
43+
44+
public:
45+
std::shared_ptr<ie::RemoteBlob> blob;
46+
47+
RemoteBlobTensor(const InferenceEngine::RemoteBlob::Ptr& blob) : blob{blob} {
48+
OPENVINO_ASSERT(blob);
49+
m_shape = blob->getTensorDesc().getBlockingDesc().getBlockDims();
50+
}
51+
52+
const element::Type& get_element_type() const override {
53+
m_type = InferenceEngine::details::convertPrecision(blob->getTensorDesc().getPrecision());
54+
return m_type;
55+
}
56+
57+
void set_shape(ov::Shape shape) override {
58+
blob->setShape({shape.begin(), shape.end()});
59+
}
60+
61+
const Shape& get_shape() const override {
62+
m_shape = blob->getTensorDesc().getBlockingDesc().getBlockDims();
63+
return m_shape;
64+
}
65+
66+
const Strides& get_strides() const override {
67+
OPENVINO_ASSERT(get_element_type().bitwidth() >= 8,
68+
"Could not get strides for types with bitwidths less then 8 bit. Tensor type: ",
69+
get_element_type());
70+
const auto& element_strides = blob->getTensorDesc().getBlockingDesc().getStrides();
71+
const size_t elem_size = get_element_type().size();
72+
m_strides.clear();
73+
m_strides.resize(element_strides.size());
74+
std::transform(element_strides.begin(), element_strides.end(), m_strides.begin(), [&elem_size](size_t stride) {
75+
return stride * elem_size;
76+
});
77+
return m_strides;
78+
}
79+
80+
size_t get_size() const override {
81+
return blob->size();
82+
}
83+
84+
size_t get_byte_size() const override {
85+
return blob->byteSize();
86+
}
87+
88+
const AnyMap& get_properties() const override {
89+
m_properties = blob->getParams();
90+
return m_properties;
91+
}
92+
93+
const std::string& get_device_name() const override {
94+
m_dev_name = blob->getDeviceName();
95+
return m_dev_name;
96+
}
97+
};
98+
99+
/**
100+
* @brief Create InferenceEngine::RemoteBlob from the Tensor
101+
*/
102+
class INFERENCE_ENGINE_API_CLASS(TensorRemoteBlob) : public ie::RemoteBlob, public ov::legacy_convert::TensorHolder {
103+
public:
104+
TensorRemoteBlob(const ov::SoPtr<ITensor>& tensor, ie::TensorDesc desc)
105+
: ie::RemoteBlob{desc},
106+
ov::legacy_convert::TensorHolder(tensor) {
107+
OPENVINO_ASSERT(this->get_tensor());
108+
}
109+
std::shared_ptr<ov::IRemoteTensor> cast_tensor() const {
110+
auto remote = std::dynamic_pointer_cast<ov::IRemoteTensor>(get_tensor()._ptr);
111+
OPENVINO_ASSERT(remote);
112+
return remote;
113+
}
114+
AnyMap getParams() const override {
115+
return cast_tensor()->get_properties();
116+
}
117+
std::string getDeviceName() const noexcept override {
118+
try {
119+
return cast_tensor()->get_device_name();
120+
} catch (...) {
121+
return {};
122+
}
123+
}
124+
std::shared_ptr<ie::RemoteContext> getContext() const noexcept override {
125+
return {};
126+
}
127+
128+
void allocate() noexcept override {}
129+
bool deallocate() noexcept override {
130+
return true;
131+
}
132+
ie::LockedMemory<void> buffer() noexcept override {
133+
return {nullptr, nullptr, 0};
134+
}
135+
ie::LockedMemory<const void> cbuffer() const noexcept override {
136+
return {nullptr, nullptr, 0};
137+
}
138+
ie::LockedMemory<void> rwmap() noexcept override {
139+
return {nullptr, nullptr, 0};
140+
}
141+
ie::LockedMemory<const void> rmap() const noexcept override {
142+
return {nullptr, nullptr, 0};
143+
}
144+
ie::LockedMemory<void> wmap() noexcept override {
145+
return {nullptr, nullptr, 0};
146+
}
147+
const std::shared_ptr<ie::IAllocator>& getAllocator() const noexcept override {
148+
return m_allocator;
149+
}
150+
void* getHandle() const noexcept override {
151+
return nullptr;
152+
}
153+
154+
using TensorHolder::get_tensor;
155+
156+
private:
157+
std::shared_ptr<ie::IAllocator> m_allocator;
158+
};
159+
160+
} // namespace ov
161+
162+
namespace InferenceEngine {
163+
164+
class INFERENCE_ENGINE_API_CLASS(IRemoteContextWrapper) : public ov::IRemoteContext {
165+
private:
166+
std::shared_ptr<InferenceEngine::RemoteContext> m_context;
167+
mutable std::string m_name;
168+
mutable ov::AnyMap m_params;
169+
170+
public:
171+
IRemoteContextWrapper(const std::shared_ptr<InferenceEngine::RemoteContext>& context) : m_context(context) {}
172+
virtual ~IRemoteContextWrapper() = default;
173+
const std::shared_ptr<InferenceEngine::RemoteContext>& get_context();
174+
const std::string& get_device_name() const override;
175+
176+
const ov::AnyMap& get_property() const override;
177+
178+
ov::SoPtr<ov::IRemoteTensor> create_tensor(const ov::element::Type& type,
179+
const ov::Shape& shape,
180+
const ov::AnyMap& params = {}) override;
181+
ov::SoPtr<ov::ITensor> create_host_tensor(const ov::element::Type type, const ov::Shape& shape) override;
182+
};
183+
184+
} // namespace InferenceEngine

src/inference/include/openvino/runtime/intel_gpu/ocl/dx.hpp

+1-1
Original file line numberDiff line numberDiff line change
@@ -139,7 +139,7 @@ class D3DContext : public ClContext {
139139
* @param target_tile_id Desired tile id within given context for multi-tile system. Default value (-1) means
140140
* that root device should be used
141141
*/
142-
D3DContext(Core& core, ID3D11Device* device, int target_tile_id = -1) : ClContext(core, (cl_context) nullptr) {
142+
D3DContext(Core& core, ID3D11Device* device, int target_tile_id = -1) : ClContext() {
143143
// clang-format off
144144
AnyMap context_params = {
145145
{ov::intel_gpu::context_type.name(), ov::intel_gpu::ContextType::VA_SHARED},

src/inference/include/openvino/runtime/intel_gpu/ocl/ocl.hpp

+5
Original file line numberDiff line numberDiff line change
@@ -177,6 +177,11 @@ class ClContext : public RemoteContext {
177177
*/
178178
static constexpr const char* device_name = "GPU";
179179

180+
/**
181+
* @brief Default constructor which can be used in derived classes to avoid multiple create_context() calls
182+
*/
183+
ClContext() = default;
184+
180185
public:
181186
// Needed to make create_tensor overloads from base class visible for user
182187
using RemoteContext::create_tensor;

src/inference/include/openvino/runtime/intel_gpu/ocl/va.hpp

+1-1
Original file line numberDiff line numberDiff line change
@@ -104,7 +104,7 @@ class VAContext : public ClContext {
104104
* @param target_tile_id Desired tile id within given context for multi-tile system. Default value (-1) means
105105
* that root device should be used
106106
*/
107-
VAContext(Core& core, VADisplay device, int target_tile_id = -1) : ClContext(core, (cl_context) nullptr) {
107+
VAContext(Core& core, VADisplay device, int target_tile_id = -1) : ClContext() {
108108
AnyMap context_params = {{ov::intel_gpu::context_type.name(), ov::intel_gpu::ContextType::VA_SHARED},
109109
{ov::intel_gpu::va_device.name(), static_cast<gpu_handle_param>(device)},
110110
{ov::intel_gpu::tile_id.name(), target_tile_id}};

src/inference/src/dev/converter_utils.cpp

+33-43
Original file line numberDiff line numberDiff line change
@@ -215,7 +215,7 @@ class IVariableStateInternalWrapper : public InferenceEngine::IVariableStateInte
215215
}
216216

217217
void SetState(const InferenceEngine::Blob::Ptr& newState) override {
218-
m_state->set_state(ov::make_tensor(newState));
218+
m_state->set_state(ov::make_tensor(newState, true));
219219
}
220220

221221
InferenceEngine::Blob::CPtr GetState() const override {
@@ -542,7 +542,7 @@ class IInferRequestInternalWrapper : public InferenceEngine::IInferRequestIntern
542542

543543
void SetBlob(const std::string& name, const InferenceEngine::Blob::Ptr& data) override {
544544
try {
545-
m_request->set_tensor(find_port(name), ov::make_tensor(data));
545+
m_request->set_tensor(find_port(name), ov::make_tensor(data, true));
546546
} catch (const ov::Exception& ex) {
547547
const std::string what = ex.what();
548548
if (what.find("Failed to set tensor") != std::string::npos) {
@@ -556,7 +556,7 @@ class IInferRequestInternalWrapper : public InferenceEngine::IInferRequestIntern
556556
try {
557557
std::vector<ov::SoPtr<ov::ITensor>> tensors;
558558
for (const auto& blob : blobs) {
559-
tensors.emplace_back(ov::make_tensor(blob));
559+
tensors.emplace_back(ov::make_tensor(blob, true));
560560
}
561561
m_request->set_tensors(find_port(name), tensors);
562562
} catch (const ov::Exception& ex) {
@@ -860,50 +860,40 @@ ov::SoPtr<::ov::IAsyncInferRequest> ov::legacy_convert::convert_infer_request(
860860
}
861861

862862
namespace InferenceEngine {
863+
const std::shared_ptr<InferenceEngine::RemoteContext>& IRemoteContextWrapper::get_context() {
864+
return m_context;
865+
}
863866

864-
class IRemoteContextWrapper : public ov::IRemoteContext {
865-
private:
866-
std::shared_ptr<InferenceEngine::RemoteContext> m_context;
867-
mutable std::string m_name;
868-
mutable ov::AnyMap m_params;
869-
870-
public:
871-
IRemoteContextWrapper(const std::shared_ptr<InferenceEngine::RemoteContext>& context) : m_context(context) {}
872-
virtual ~IRemoteContextWrapper() = default;
873-
const std::shared_ptr<InferenceEngine::RemoteContext>& get_context() {
874-
return m_context;
875-
}
876-
const std::string& get_device_name() const override {
877-
m_name = m_context->getDeviceName();
878-
return m_name;
879-
}
867+
const std::string& IRemoteContextWrapper::get_device_name() const {
868+
m_name = m_context->getDeviceName();
869+
return m_name;
870+
}
880871

881-
const ov::AnyMap& get_property() const override {
882-
m_params = m_context->getParams();
883-
return m_params;
884-
}
872+
const ov::AnyMap& IRemoteContextWrapper::get_property() const {
873+
m_params = m_context->getParams();
874+
return m_params;
875+
}
885876

886-
ov::SoPtr<ov::IRemoteTensor> create_tensor(const ov::element::Type& type,
887-
const ov::Shape& shape,
888-
const ov::AnyMap& params = {}) override {
889-
InferenceEngine::TensorDesc desc(InferenceEngine::details::convertPrecision(type),
890-
shape,
891-
InferenceEngine::TensorDesc::getLayoutByDims(shape));
892-
auto blob = m_context->CreateBlob(desc, params);
893-
blob->allocate();
894-
auto tensor = ov::make_tensor(blob);
895-
return {std::dynamic_pointer_cast<ov::IRemoteTensor>(tensor._ptr), tensor._so};
896-
}
877+
ov::SoPtr<ov::IRemoteTensor> IRemoteContextWrapper::create_tensor(const ov::element::Type& type,
878+
const ov::Shape& shape,
879+
const ov::AnyMap& params) {
880+
InferenceEngine::TensorDesc desc(InferenceEngine::details::convertPrecision(type),
881+
shape,
882+
InferenceEngine::TensorDesc::getLayoutByDims(shape));
883+
auto blob = m_context->CreateBlob(desc, params);
884+
blob->allocate();
885+
auto tensor = ov::make_tensor(blob);
886+
return {std::dynamic_pointer_cast<ov::IRemoteTensor>(tensor._ptr), tensor._so};
887+
}
897888

898-
ov::SoPtr<ov::ITensor> create_host_tensor(const ov::element::Type type, const ov::Shape& shape) override {
899-
InferenceEngine::TensorDesc desc(InferenceEngine::details::convertPrecision(type),
900-
shape,
901-
InferenceEngine::TensorDesc::getLayoutByDims(shape));
902-
auto blob = m_context->CreateHostBlob(desc);
903-
blob->allocate();
904-
return ov::make_tensor(blob);
905-
}
906-
};
889+
ov::SoPtr<ov::ITensor> IRemoteContextWrapper::create_host_tensor(const ov::element::Type type, const ov::Shape& shape) {
890+
InferenceEngine::TensorDesc desc(InferenceEngine::details::convertPrecision(type),
891+
shape,
892+
InferenceEngine::TensorDesc::getLayoutByDims(shape));
893+
auto blob = m_context->CreateHostBlob(desc);
894+
blob->allocate();
895+
return ov::make_tensor(blob);
896+
}
907897

908898
} // namespace InferenceEngine
909899

src/inference/src/dev/converter_utils.hpp

+1-2
Original file line numberDiff line numberDiff line change
@@ -15,6 +15,7 @@
1515
#include "openvino/runtime/icompiled_model.hpp"
1616
#include "openvino/runtime/iplugin.hpp"
1717
#include "openvino/runtime/iremote_context.hpp"
18+
#include "remote_utils.hpp"
1819

1920
namespace ov {
2021
namespace legacy_convert {
@@ -40,11 +41,9 @@ ov::SoPtr<::ov::IAsyncInferRequest> convert_infer_request(
4041
const std::string& plugin_name = "");
4142

4243
std::shared_ptr<InferenceEngine::RemoteContext> convert_remote_context(const ov::SoPtr<ov::IRemoteContext>& context);
43-
ov::SoPtr<ov::IRemoteContext> convert_remote_context(const std::shared_ptr<InferenceEngine::RemoteContext>& context);
4444

4545
std::vector<ov::Extension::Ptr> convert_extension(const std::vector<InferenceEngine::IExtensionPtr>& exts);
4646
std::vector<InferenceEngine::IExtensionPtr> convert_extension(const std::vector<ov::Extension::Ptr>& exts);
4747

4848
} // namespace legacy_convert
4949
} // namespace ov
50-

0 commit comments

Comments
 (0)