Skip to content
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.

Commit 412a10c

Browse files
committed Feb 28, 2024
Remove the need for real test data
1 parent f3a84a4 commit 412a10c

File tree

2 files changed

+9
-12
lines changed

2 files changed

+9
-12
lines changed
 

‎setup.py

-2
Original file line number | Diff line number | Diff line change
@@ -34,8 +34,6 @@
3434
"timm",
3535
"invisible-watermark>=0.2.0",
3636
"auto-gptq",
37-
"librosa",
38-
"soundfile",
3937
]
4038

4139
QUALITY_REQUIRE = ["black~=23.1", "ruff>=0.0.241"]

‎tests/openvino/test_quantization.py

+9 -10
Original file line number | Diff line number | Diff line change
@@ -18,7 +18,6 @@
1818
import unittest
1919
from collections import defaultdict
2020
from functools import partial
21-
from itertools import islice
2221

2322
import evaluate
2423
import numpy as np
@@ -599,27 +598,27 @@ def compute_metrics(p):
599598

600599
class InferRequestWrapperTest(unittest.TestCase):
601600
MODEL_ID = ("openai/whisper-tiny.en",)
602-
DATASET_ID = ("hf-internal-testing/librispeech_asr_dummy",)
603601

604602
@staticmethod
605-
def _extract_input_features(processor, sample):
603+
def _generate_random_audio_data(processor):
604+
t = np.linspace(0, 1.0, int(1000), endpoint=False)
605+
audio_data = 0.5 * np.sin((2 + np.random.random()) * np.pi * t)
606606
input_features = processor(
607-
sample["audio"]["array"],
608-
sampling_rate=sample["audio"]["sampling_rate"],
607+
audio_data,
608+
sampling_rate=16000,
609609
return_tensors="pt",
610610
).input_features
611611
return input_features
612612

613-
@parameterized.expand(zip(MODEL_ID, DATASET_ID))
614-
def test_calibration_data_uniqueness(self, model_id, dataset_id):
613+
@parameterized.expand(MODEL_ID)
614+
def test_calibration_data_uniqueness(self, model_id):
615615
ov_model = OVModelForSpeechSeq2Seq.from_pretrained(model_id, export=True, compile=True)
616616
processor = AutoProcessor.from_pretrained(model_id)
617617

618-
dataset = load_dataset(dataset_id, "clean", split="validation")
619618
calibration_data = []
620619
ov_model.decoder_with_past.request = InferRequestWrapper(ov_model.decoder_with_past.request, calibration_data)
621-
for data in islice(dataset, 2):
622-
input_features = self._extract_input_features(processor, data)
620+
for _ in range(2):
621+
input_features = self._generate_random_audio_data(processor)
623622
ov_model.generate(input_features)
624623

625624
data_hashes_per_key = defaultdict(list)

0 commit comments

Comments
 (0)
Please sign in to comment.