
Commit 409731b

Disable oneDNN cache cleanup

1 parent: 83e312f

2 files changed (+85 −66 lines)


samples/cpp/hello_classification/main.cpp (+82 −63)
@@ -22,98 +22,117 @@
  * @brief Main with support Unicode paths, wide strings
  */
 int tmain(int argc, tchar* argv[]) {
-    try {
+    {
         // -------- Get OpenVINO runtime version --------
         slog::info << ov::get_openvino_version() << slog::endl;
 
         // -------- Parsing and validation of input arguments --------
-        if (argc != 4) {
-            slog::info << "Usage : " << argv[0] << " <path_to_model> <path_to_image> <device_name>" << slog::endl;
-            return EXIT_FAILURE;
+        if (argc != 3) {
+            slog::info << "Usage : " << argv[0] << " <path_to_model> <device_name>" << slog::endl;
+            return EXIT_FAILURE;
         }
-
-        const std::string args = TSTRING2STRING(argv[0]);
+        //
+        //const std::string args = TSTRING2STRING(argv[0]);
         const std::string model_path = TSTRING2STRING(argv[1]);
-        const std::string image_path = TSTRING2STRING(argv[2]);
-        const std::string device_name = TSTRING2STRING(argv[3]);
+        // const std::string image_path = TSTRING2STRING(argv[2]);
+        const std::string device_name = TSTRING2STRING(argv[2]);
 
         // -------- Step 1. Initialize OpenVINO Runtime Core --------
         ov::Core core;
 
+        // std::vector<std::string> availableDevices = core.get_available_devices();
+        // for (auto&& device : availableDevices) {
+        //     slog::info << device << slog::endl;
+
+        //     // Query supported properties and print all of them
+        //     slog::info << "\tSUPPORTED_PROPERTIES: " << slog::endl;
+        //     auto supported_properties = core.get_property(device, ov::supported_properties);
+        //     for (auto&& property : supported_properties) {
+        //         if (property != ov::supported_properties.name()) {
+        //             slog::info << "\t\t" << (property.is_mutable() ? "Mutable: " : "Immutable: ") << property << " : "
+        //                        << slog::flush;
+
+        //         }
+        //     }
+
+        //     slog::info << slog::endl;
+        // }
+        //core.set_property(ov::cache_dir("C:\\Intel\\XeSDK"));
         // -------- Step 2. Read a model --------
-        slog::info << "Loading model files: " << model_path << slog::endl;
+        //slog::info << "Loading model files: " << model_path << slog::endl;
         std::shared_ptr<ov::Model> model = core.read_model(model_path);
-        printInputAndOutputsInfo(*model);
+        //printInputAndOutputsInfo(*model);
 
         OPENVINO_ASSERT(model->inputs().size() == 1, "Sample supports models with 1 input only");
-        OPENVINO_ASSERT(model->outputs().size() == 1, "Sample supports models with 1 output only");
+        //OPENVINO_ASSERT(model->outputs().size() == 1, "Sample supports models with 1 output only");
 
         // -------- Step 3. Set up input
 
         // Read input image to a tensor and set it to an infer request
         // without resize and layout conversions
-        FormatReader::ReaderPtr reader(image_path.c_str());
-        if (reader.get() == nullptr) {
-            std::stringstream ss;
-            ss << "Image " + image_path + " cannot be read!";
-            throw std::logic_error(ss.str());
-        }
-
-        ov::element::Type input_type = ov::element::u8;
-        ov::Shape input_shape = {1, reader->height(), reader->width(), 3};
-        std::shared_ptr<unsigned char> input_data = reader->getData();
-
-        // just wrap image data by ov::Tensor without allocating of new memory
-        ov::Tensor input_tensor = ov::Tensor(input_type, input_shape, input_data.get());
-
-        const ov::Layout tensor_layout{"NHWC"};
-
-        // -------- Step 4. Configure preprocessing --------
-
-        ov::preprocess::PrePostProcessor ppp(model);
-
-        // 1) Set input tensor information:
-        // - input() provides information about a single model input
-        // - reuse precision and shape from already available `input_tensor`
-        // - layout of data is 'NHWC'
-        ppp.input().tensor().set_shape(input_shape).set_element_type(input_type).set_layout(tensor_layout);
-        // 2) Adding explicit preprocessing steps:
-        // - convert layout to 'NCHW' (from 'NHWC' specified above at tensor layout)
-        // - apply linear resize from tensor spatial dims to model spatial dims
-        ppp.input().preprocess().resize(ov::preprocess::ResizeAlgorithm::RESIZE_LINEAR);
-        // 4) Here we suppose model has 'NCHW' layout for input
-        ppp.input().model().set_layout("NCHW");
-        // 5) Set output tensor information:
-        // - precision of tensor is supposed to be 'f32'
-        ppp.output().tensor().set_element_type(ov::element::f32);
-
-        // 6) Apply preprocessing modifying the original 'model'
-        model = ppp.build();
+        //FormatReader::ReaderPtr reader(image_path.c_str());
+        //if (reader.get() == nullptr) {
+        //    std::stringstream ss;
+        //    ss << "Image " + image_path + " cannot be read!";
+        //    throw std::logic_error(ss.str());
+        //}
+
+        //ov::element::Type input_type = ov::element::u8;
+        //ov::Shape input_shape = {1, reader->height(), reader->width(), 3};
+        //std::shared_ptr<unsigned char> input_data = reader->getData();
+        //
+        //// just wrap image data by ov::Tensor without allocating of new memory
+        //ov::Tensor input_tensor = ov::Tensor(input_type, input_shape, input_data.get());
+        //
+        //const ov::Layout tensor_layout{"NHWC"};
+        //
+        //// -------- Step 4. Configure preprocessing --------
+        //
+        //ov::preprocess::PrePostProcessor ppp(model);
+        //
+        //// 1) Set input tensor information:
+        //// - input() provides information about a single model input
+        //// - reuse precision and shape from already available `input_tensor`
+        //// - layout of data is 'NHWC'
+        //ppp.input().tensor().set_shape(input_shape).set_element_type(input_type).set_layout(tensor_layout);
+        //// 2) Adding explicit preprocessing steps:
+        //// - convert layout to 'NCHW' (from 'NHWC' specified above at tensor layout)
+        //// - apply linear resize from tensor spatial dims to model spatial dims
+        //ppp.input().preprocess().resize(ov::preprocess::ResizeAlgorithm::RESIZE_LINEAR);
+        //// 4) Here we suppose model has 'NCHW' layout for input
+        //ppp.input().model().set_layout("NCHW");
+        //// 5) Set output tensor information:
+        //// - precision of tensor is supposed to be 'f32'
+        //ppp.output().tensor().set_element_type(ov::element::f32);
+        //
+        //// 6) Apply preprocessing modifying the original 'model'
+        //model = ppp.build();
 
         // -------- Step 5. Loading a model to the device --------
         ov::CompiledModel compiled_model = core.compile_model(model, device_name);
 
         // -------- Step 6. Create an infer request --------
         ov::InferRequest infer_request = compiled_model.create_infer_request();
+
         // -----------------------------------------------------------------------------------------------------
 
         // -------- Step 7. Prepare input --------
-        infer_request.set_input_tensor(input_tensor);
-
-        // -------- Step 8. Do inference synchronously --------
-        infer_request.infer();
-
-        // -------- Step 9. Process output
-        const ov::Tensor& output_tensor = infer_request.get_output_tensor();
-
-        // Print classification results
-        ClassificationResult classification_result(output_tensor, {image_path});
-        classification_result.show();
+        //infer_request.set_input_tensor(input_tensor);
+        //
+        //// -------- Step 8. Do inference synchronously --------
+        //infer_request.infer();
+        //
+        //// -------- Step 9. Process output
+        //const ov::Tensor& output_tensor = infer_request.get_output_tensor();
+        //
+        //// Print classification results
+        //ClassificationResult classification_result(output_tensor, {image_path});
+        //classification_result.show();
         // -----------------------------------------------------------------------------------------------------
-    } catch (const std::exception& ex) {
-        std::cerr << ex.what() << std::endl;
-        return EXIT_FAILURE;
+    //} catch (const std::exception& ex) {
+    //    std::cerr << ex.what() << std::endl;
+    //    return EXIT_FAILURE;
     }
 
     return EXIT_SUCCESS;
-}
+}
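Net effect of the change: the sample no longer reads an image or runs inference. It now takes only <path_to_model> and <device_name>, reads the model, compiles it on the chosen device, creates an infer request, and returns, so the interesting work happens on the plugin teardown path at exit. A minimal standalone equivalent is sketched below; it assumes a standard OpenVINO 2.x install and uses plain main/std::string instead of the sample's tmain/tchar Unicode wrappers and slog helpers.

#include <cstdlib>
#include <iostream>
#include <memory>
#include <string>

#include <openvino/openvino.hpp>

// Sketch of what the trimmed sample now exercises: read a model,
// compile it for a device, create an infer request, then exit.
// No input setup, preprocessing, or inference call remains.
int main(int argc, char* argv[]) {
    if (argc != 3) {
        std::cerr << "Usage: " << argv[0] << " <path_to_model> <device_name>\n";
        return EXIT_FAILURE;
    }
    const std::string model_path = argv[1];
    const std::string device_name = argv[2];

    ov::Core core;
    std::shared_ptr<ov::Model> model = core.read_model(model_path);
    ov::CompiledModel compiled_model = core.compile_model(model, device_name);
    ov::InferRequest infer_request = compiled_model.create_infer_request();
    (void)infer_request;  // created but never used, matching the edited sample

    return EXIT_SUCCESS;  // core/plugin destructors run here, on the shutdown path being debugged
}

Note that the try/catch was also commented out (the function body is now a bare scope block), so any exception from read_model or compile_model terminates the process instead of printing a message and returning EXIT_FAILURE.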

src/plugins/intel_gpu/src/plugin/plugin.cpp (+3 −3)
@@ -165,13 +165,13 @@ Plugin::~Plugin() {
     // To prevent hanging during oneDNN's primitive cache desctruction,
     // trigger earlier cache cleanup by setting its capacity to 0.
     // Related ticket: 106154.
-    dnnl::set_primitive_cache_capacity(0);
+    // dnnl::set_primitive_cache_capacity(0);
 
     // In case of multiple ov::Core instances (and multiple GPU plugins) we need to restore original
     // cache capacity to prevent working with zero-capacity cache in other GPU Plugin instances, since
     // cache is shared between all of GPU Plugin instances and cache clean up affects all of them.
-    const int default_cache_capacity = 1024;
-    dnnl::set_primitive_cache_capacity(default_cache_capacity);
+    // const int default_cache_capacity = 1024;
+    // dnnl::set_primitive_cache_capacity(default_cache_capacity);
 #endif
 }
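With this change, Plugin::~Plugin() skips both the cache flush and the capacity restore, leaving the shared oneDNN primitive cache untouched at GPU plugin teardown; together with the trimmed sample above, this isolates whether the flush itself triggers the shutdown hang from ticket 106154. For reference, a minimal sketch of the flush-and-restore pattern being disabled is below. Saving the current capacity via dnnl::get_primitive_cache_capacity() rather than the plugin's hardcoded default_cache_capacity = 1024 is an illustrative assumption, not what the plugin does.

#include <dnnl.hpp>  // oneDNN public API

// Sketch: evict everything from the process-wide oneDNN primitive cache
// by shrinking it to zero, then restore the capacity so other plugin
// instances sharing the cache are not left with a zero-capacity cache.
void flush_onednn_primitive_cache() {
    const int saved_capacity = dnnl::get_primitive_cache_capacity();  // assumption: query instead of hardcoding 1024
    dnnl::set_primitive_cache_capacity(0);               // capacity 0 evicts all cached primitives
    dnnl::set_primitive_cache_capacity(saved_capacity);  // restore for other users of the shared cache
}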
