openvinotoolkit
diff --git a/‎client/e2e/resources.json
+3-3 b/‎client/e2e/resources.json
+3-3
diff --git a/‎client/e2e/src/accuracy-reports.e2e-spec.ts
+8-7 b/‎client/e2e/src/accuracy-reports.e2e-spec.ts
+8-7
diff --git a/‎client/e2e/src/gan.e2e-spec.ts
+1-1 b/‎client/e2e/src/gan.e2e-spec.ts
+1-1
diff --git a/‎client/e2e/src/inference-test-image.e2e-spec.ts
+1-1 b/‎client/e2e/src/inference-test-image.e2e-spec.ts
+1-1
diff --git a/‎client/e2e/src/int8-basic-cases.e2e-spec.ts
+10-7 b/‎client/e2e/src/int8-basic-cases.e2e-spec.ts
+10-7
diff --git a/‎client/e2e/src/model-visualization.e2e-spec.ts
+1-1 b/‎client/e2e/src/model-visualization.e2e-spec.ts
+1-1
diff --git a/‎client/e2e/src/not-annotated-model-visualization.e2e-spec.ts
+2-1 b/‎client/e2e/src/not-annotated-model-visualization.e2e-spec.ts
+2-1
diff --git a/‎client/e2e/src/parent-predictions-visualization.e2e-spec.ts
+3-2 b/‎client/e2e/src/parent-predictions-visualization.e2e-spec.ts
+3-2
diff --git a/‎client/e2e/src/semantic-segmentation.e2e-spec.ts
+1-1 b/‎client/e2e/src/semantic-segmentation.e2e-spec.ts
+1-1
diff --git a/‎client/e2e/src/upload-dataset.e2e-spec.ts
+2-1 b/‎client/e2e/src/upload-dataset.e2e-spec.ts
+2-1
diff --git a/‎config/constants.py
+1 b/‎config/constants.py
+1
diff --git a/‎docker/dockerfiles/Dockerfile
+3-1 b/‎docker/dockerfiles/Dockerfile
+3-1
diff --git a/‎requirements/requirements.txt
+2-1 b/‎requirements/requirements.txt
+2-1
diff --git a/‎wb/main/console_tool_wrapper/datumaro_tool/tool.py
+21-6 b/‎wb/main/console_tool_wrapper/datumaro_tool/tool.py
+21-6
diff --git a/‎wb/main/dataset_utils/dataset_adapters.py
+8-4 b/‎wb/main/dataset_utils/dataset_adapters.py
+8-4
diff --git a/‎wb/main/enumerates.py
+1 b/‎wb/main/enumerates.py
+1
diff --git a/‎wb/main/jobs/datasets/convert_dataset_job.py
+5-3 b/‎wb/main/jobs/datasets/convert_dataset_job.py
+5-3
@@ -2663,7 +2663,7 @@
     }
   },
   "cocoDataset": {
-    "path": "datasets/coco200.zip",
+    "path": "datasets_v2/coco200.zip",
     "name": "coco200Dataset",
     "format": "Coco",
     "type": "dataset",
@@ -2751,7 +2751,7 @@
     }
   },
   "LFWDataset": {
-    "path": "datasets/LFW.tar.gz",
+    "path": "datasets_v2/LFW.zip",
     "name": "LFWDataset",
     "type": "dataset",
     "accuracyData": {
@@ -2769,7 +2769,7 @@
     }
   },
   "WiderFaceDataset": {
-    "path": "datasets/WIDER_val.zip",
+    "path": "datasets_v2/WIDER_val.zip",
     "name": "WIDER FACE",
     "type": "dataset",
     "accuracyData": {
 
@@ -46,8 +46,9 @@ describe('UI tests on Accuracy Reports', () => {
     imageNetNotAnnotated.name = testUtils.helpers.generateName();
     await testUtils.uploadDataset(datasetFileVOC);
     await testUtils.uploadDataset(datasetFileImageNet);
-    await testUtils.uploadDataset(dataSetFileSemantic);
-    await testUtils.uploadDataset(imageNetNotAnnotated);
+    // TODO: 83042
+    // await testUtils.uploadDataset(dataSetFileSemantic);
+    // await testUtils.uploadDataset(imageNetNotAnnotated);
 
     if (browser.params.isDevCloud) {
       jasmine.DEFAULT_TIMEOUT_INTERVAL *= 2.5;
@@ -179,7 +180,7 @@ describe('UI tests on Accuracy Reports', () => {
     expect(await TestUtils.getAllElementsByDataTestId('predictions-table').count()).toBeGreaterThan(1);
   });
 
-  // 70558
+  // TODO: 70558
   xit(
     'should download a semantic segmentation model (deeplabv3), ' +
       'int8 calibration, check that predictions comparison is available and that tensor comparison is available, ' +
@@ -270,7 +271,7 @@ describe('UI tests on Accuracy Reports', () => {
     }
   );
 
-  // 70558
+  // TODO: 70558, 83248
   xit(
     'should download a semantic segmentation model (deeplabv3), not-annotated dataset' +
       'int8 calibration, check that predictions comparison is available and that tensor comparison is available, ' +
@@ -322,7 +323,7 @@ describe('UI tests on Accuracy Reports', () => {
     }
   );
 
-  // 73953
+  // TODO: 73953, 83248
   xit(
     'should create a project with a generic model, calibrate it, configure accuracy (OD), ' +
       'create accuracy report (predictions comparison)',
@@ -373,7 +374,7 @@ describe('UI tests on Accuracy Reports', () => {
     }
   );
 
-  // 73953
+  // TODO: 73953, 83248
   xit(
     'should create a project with a generic model and not-annotated dataset, calibrate, ' +
       'create another project with annotated dataset, ' +
@@ -447,7 +448,7 @@ describe('UI tests on Accuracy Reports', () => {
     }
   );
 
-  // 73953
+  // TODO: 73953, 83248
   xit(
     'should create a project with a classification model & ' +
       'not-annotated dataset, calibrate it, create accuracy report (predictions comparison), ' +
 
@@ -72,7 +72,7 @@ xdescribe('Instance segmentation tests', () => {
     await calibrationUtils.runCalibrationWithAccuracyCheck(modelFile, dataSetFileSuperRes, InferenceType.CPU, true);
   });
 
-  // 43320
+  // TODO: 43320
   xit('Upload GAN model (tensor_layer_srgan), check accuracy, run calibration', async () => {
     const modelFile = browser.params.precommit_scope.resources.ganModels.tensorLayerSrgan;
     modelFile.name = testUtils.helpers.generateName();
 
@@ -122,7 +122,7 @@ describe('UI tests on Running inference', () => {
     await visualizeInferenceResultPage.checkImageLabel(0.9);
   });
 
-  xit('should create project with Semantic Segmentation model, upload image, test, check for predictions', async () => {
+  it('should create project with Semantic Segmentation model, upload image, test, check for predictions', async () => {
     const model = { name: 'semantic-segmentation-adas-0001', framework: 'openvino' };
     const imageFile = browser.params.precommit_scope.resources.testImages.semanticSegmImage;
     const inferenceTarget = InferenceType.CPU;
 
@@ -16,7 +16,7 @@ describe('UI tests on Running Int8 Calibration', () => {
   const datasetFileImageNet = browser.params.precommit_scope.resources.smallImageNetDataset;
   const datasetWiderFace = browser.params.precommit_scope.resources.WiderFaceDataset;
   const notAnnotatedDataset = browser.params.precommit_scope.resources.imageNetNotAnnotated;
-  // 73948
+  // TODO: 73948
   // const datasetCityScapes = browser.params.precommit_scope.resources.CityscapesDataset;
 
   beforeAll(async () => {
@@ -35,8 +35,9 @@ describe('UI tests on Running Int8 Calibration', () => {
     await testUtils.uploadDataset(datasetFileVOC);
     await testUtils.uploadDataset(datasetFileImageNet);
     await testUtils.uploadDataset(datasetWiderFace);
-    await testUtils.uploadDataset(notAnnotatedDataset);
-    // 73948
+    // TODO: 83248
+    // await testUtils.uploadDataset(notAnnotatedDataset);
+    // TODO: 73948
     // await testUtils.uploadDataset(datasetCityScapes);
   });
 
@@ -46,14 +47,14 @@ describe('UI tests on Running Int8 Calibration', () => {
     await testUtils.modelManagerPage.goToModelManager();
   });
 
-  // 76569
+  // TODO: 76569
   xit('Upload FP32 Mobilenet SSD Lite V2, use VOC dataset, infer (CPU), int8 calibrate (batch 1), infer (CPU)', async () => {
     const modelFile = browser.params.precommit_scope.resources.ODModels.ssdliteMobileNetV2;
     const inferenceTarget = InferenceType.CPU;
     await calibrationUtils.runInt8PipelineThroughUpload(modelFile, datasetFileVOC, inferenceTarget);
   });
 
-  // 76569
+  // TODO: 76569, 83248
   xit(
     'Upload FP32 Mobilenet SSD Lite V2, use Not Annotated dataset, ' +
       'infer (CPU), int8 calibrate - Simplified Mode, infer (CPU)',
@@ -64,7 +65,8 @@ describe('UI tests on Running Int8 Calibration', () => {
     }
   );
 
-  it(
+  // TODO: 83248
+  xit(
     'Should upload original Caffe model, convert to IR V10, run inference, run Int-8 Tune with Not Annotated dataset, ' +
       'Simplified Mode',
     async () => {
@@ -74,7 +76,8 @@ describe('UI tests on Running Int8 Calibration', () => {
     }
   );
 
-  it(
+  // TODO: 83248
+  xit(
     'Select squeezenet1.1 from table + Not Annotated dataset, infer (CPU), int8 Simplified Mode, ' +
       'check wait message ',
     async () => {
 
@@ -137,7 +137,7 @@ describe('UI tests on Model visualization', () => {
     );
   });
 
-  // 75981
+  // TODO: 75981
   xit('should check visualization GAN single-image-super-resolution-1032 model', async () => {
     const model = { name: 'single-image-super-resolution-1032', framework: 'openvino' };
     const imageFile = browser.params.precommit_scope.resources.testImages.streetImage;
 
@@ -8,7 +8,8 @@ import { VisualizeInferenceResultPage } from './pages/inference-test-image.po';
 import { TargetMachines, DevCloudTargets } from './pages/target-machines.po';
 import { Helpers } from './pages/helpers';
 
-describe('UI tests on visualization for model with not annotated dataset', () => {
+// TODO: 83248
+xdescribe('UI tests on visualization for model with not annotated dataset', () => {
   const testUtils = new TestUtils();
   const inferenceUtils = new InferenceUtils(testUtils);
   const visualizeInferenceResultPage = new VisualizeInferenceResultPage();
 
@@ -47,7 +47,8 @@ describe('UI tests on parent predictions visualization', () => {
     dataSetFileSemantic.name = testUtils.helpers.generateName();
     await testUtils.uploadDataset(datasetFileVOC);
     await testUtils.uploadDataset(datasetFileImageNet);
-    await testUtils.uploadDataset(dataSetFileSemantic);
+    // TODO: 83248
+    // await testUtils.uploadDataset(dataSetFileSemantic);
   });
 
   beforeEach(async () => {
@@ -151,7 +152,7 @@ describe('UI tests on parent predictions visualization', () => {
     ).toBeTruthy();
   });
 
-  // 70558
+  // TODO: 70558
   xit(
     'should download an instance segmentation model (deeplabv3), ' +
       'int8 calibration, check that predictions comparison is not available and that tensor comparison is available',
 
@@ -67,7 +67,7 @@ xdescribe('Semantic segmentation tests', () => {
     console.log(`Accuracy check end: ${{ accuracy }}`);
   });
 
-  // 70558
+  // TODO: 70558
   xit('Upload instance segmentation model (deeplabv3), int8 calibration, check accuracy', async () => {
     const model = {
       name: 'deeplabv3',
 
@@ -109,7 +109,8 @@ describe('UI tests on Uploading Datasets', () => {
     }
   );
 
-  it(
+  // TODO: Rework test to expect an error
+  xit(
     'should import COCO dataset with unrelated files and folders inside, ' + 'check that it is uploaded and delete it',
     async () => {
       const datasetFile = browser.params.precommit_scope.resources.cocoWithUnrelatedFiles;
 
@@ -59,6 +59,7 @@
 VGGFACE2_BBOX_LENGTH = 5
 LNDREID_LANDMARK_LENGTH = 11
 ORIGINAL_FOLDER = 'original'
+DATASET_REPORTS_FOLDER = UPLOAD_FOLDER_DATASETS / 'reports'
 
 DEFAULT_LOG_FILE = os.path.join(ROOT_FOLDER, 'server.log') if SERVER_MODE == 'production' else None
 LOG_FILE = get_env_var(name='WB_LOG_FILE', default=DEFAULT_LOG_FILE)
 
@@ -84,7 +84,9 @@ RUN apt update && \
     # For E2E in non-headless mode
     xvfb \
     gnupg2 \
-    build-essential && \
+    build-essential  \
+    # for running packages from git commits \
+    git && \
     apt clean && \
     rm -rf /var/lib/apt/lists/*
 
 
@@ -9,7 +9,7 @@ cffi==1.15.0
 chardet==4.0.0
 click==8.0.0
 cryptography==3.4.8
-datumaro==0.2.1
+git+https://github.com/openvinotoolkit/datumaro.git@develop#egg=datumaro
 defusedxml==0.7.1
 distlib==0.3.2
 dnspython==1.16.0
@@ -32,6 +32,7 @@ lxml==4.6.5
 Mako==1.1.5
 MarkupSafe==2.0.1
 monotonic==1.6
+numpy==1.19.5
 packaging==21.3
 paramiko==2.7.2
 pg8000==1.21.1
 
@@ -35,11 +35,26 @@ def set_conversion(self, input_format: DatasetTypesEnum, output_format: DatasetT
         self.set_parameter('--input-format', input_format.value, ConsoleParametersTypes.dataset_format)
         self.set_parameter('--output-format', output_format.value, ConsoleParametersTypes.dataset_format)
 
-    def set_input_output_paths(self, input_path: str, output_path: Optional[str]):
-        self.set_parameter('--input-path', input_path, ConsoleParametersTypes.path)
-        if output_path:
-            self.set_parameter('--output-dir', output_path, ConsoleParametersTypes.path)
+    def _set_path(self, param_name: Optional[str], path: str):
+        self.set_parameter(param_name, path, ConsoleParametersTypes.path)
 
-    def enable_image_copy(self):
+    def set_input_path(self, path: str):
+        self._set_path('--input-path', path)
+
+    def set_output_path(self, path: str):
+        self._set_path('--output-dir', path)
+
+    def set_report_path(self, path: str):
+        self._set_path('--json-report', path)
+
+    def set_target(self, path: str):
+        self._set_path('', path)
+
+    def _set_flag(self, param_name: str):
+        self.set_parameter(f'--{param_name}', True, ConsoleParametersTypes.flag)
+
+    def enable_image_save(self):
+        self._set_flag('save-images')
+
+    def add_separator(self):
         self.set_parameter('--', True, ConsoleParametersTypes.flag)
-        self.set_parameter('--save-images', True, ConsoleParametersTypes.flag)
 
@@ -758,13 +758,17 @@ class VGGFace2LandmarkCustomAdapter(VGGFace2BaseAdapter):
 class WiderFaceBaseAdapter(BaseImageDatasetAdapter):
 
     def get_images_dir(self) -> Optional[Path]:
-        for item in self.dataset_path.iterdir():
-            if item.is_dir() and all(path.is_dir()
-                                     and all(subpath.suffix[1:] in ALLOWED_EXTENSIONS_IMG for subpath in path.iterdir())
-                                     for path in item.iterdir()):
+        dirs = self.dataset_path.glob('**/*')
+        for item in dirs:
+            if item.is_dir() and item.name == 'images' and all(self.is_event_class_dir(path)
+                                                               for path in item.iterdir()):
                 return item
         return None
 
+    @staticmethod
+    def is_event_class_dir(path: Path) -> bool:
+        return path.is_dir() and all(subpath.suffix[1:] in ALLOWED_EXTENSIONS_IMG for subpath in path.iterdir())
+
     def get_task_specific_constants(self) -> dict:
         raise NotImplementedError
 
 
@@ -664,6 +664,7 @@ class ModelShapeTypeEnum(enum.Enum):
 
 class DatumaroModesEnum(enum.Enum):
     convert = 'convert'
+    detect_format = 'detect-format'
 
 
 class TokenizerTypeEnum(enum.Enum):
 
@@ -87,14 +87,16 @@ def run_conversion(self, original_dataset: DatasetsModel,
                        dataset_format: DatasetTypesEnum):
         tool = DatumaroTool()
         tool.set_mode(DatumaroModesEnum.convert)
-        tool.set_input_output_paths(original_dataset.path, result_dataset.path)
+        tool.set_input_path(original_dataset.path)
+        tool.set_output_path(result_dataset.path)
         tool.set_conversion(dataset_format, self._format_conversion_map[dataset_format])
-        tool.enable_image_copy()
+        tool.add_separator()
+        tool.enable_image_save()
 
         runner = LocalRunner(tool)
         return_code, _ = runner.run_console_tool()
         if return_code:
-            raise DatumaroError('Error during Datumaro conversion.')
+            raise DatumaroError('Error during Datumaro conversion.', self.job_id)
 
         result_format = self._format_compatibility_map.get(self._format_conversion_map[dataset_format],
                                                            self._format_conversion_map[dataset_format])
Original file line number	Diff line number	Diff line change
`@@ -109,7 +109,8 @@ describe('UI tests on Uploading Datasets', () => {`
`109`	`109`	`}`
`110`	`110`	`);`
`111`	`111`
`112`		`- it(`
	`112`	`+ // TODO: Rework test to expect an error`
	`113`	`+ xit(`
`113`	`114`	`'should import COCO dataset with unrelated files and folders inside, ' + 'check that it is uploaded and delete it',`
`114`	`115`	`async () => {`
`115`	`116`	`const datasetFile = browser.params.precommit_scope.resources.cocoWithUnrelatedFiles;`