Skip to content

Commit d1dedd1

Browse files
Add quantization tests for llava_next_video
1 parent 3fbd0b1 commit d1dedd1

File tree

3 files changed

+38
-0
lines changed

3 files changed

+38
-0
lines changed

tests/openvino/test_exporters_cli.py

+13
Original file line number | Diff line number | Diff line change
@@ -341,6 +341,19 @@ class OVCLIExportTestCase(unittest.TestCase):
341341
]
342342
)
343343

344+
if is_transformers_version(">=", "4.42.0"):
345+
TEST_4BIT_CONFIGURATIONS.extend(
346+
[
347+
(
348+
"image-text-to-text",
349+
"llava_next_video",
350+
'int4 --group-size 16 --ratio 0.8 --sensitivity-metric "hessian_input_activation" '
351+
"--dataset contextual --num-samples 1",
352+
[{"int8": 6, "int4": 24}, {"int8": 1}, {"int8": 7}, {}, {"int8": 2}],
353+
),
354+
]
355+
)
356+
344357
if is_transformers_version(">=", "4.45.0"):
345358
TEST_4BIT_CONFIGURATIONS.extend(
346359
[

tests/openvino/test_quantization.py

+24
Original file line number | Diff line number | Diff line change
@@ -581,6 +581,27 @@ class OVWeightCompressionTest(unittest.TestCase):
581581
]
582582
)
583583

584+
if is_transformers_version(">=", "4.42.0"):
585+
LOAD_IN_4_BITS_SCOPE.extend(
586+
[
587+
(
588+
OVModelForVisualCausalLM,
589+
"llava_next_video",
590+
False,
591+
dict(
592+
bits=4,
593+
group_size=16,
594+
dataset="contextual",
595+
ratio=0.8,
596+
sensitivity_metric="hessian_input_activation",
597+
num_samples=1,
598+
processor=MODEL_NAMES["llava_next"],
599+
),
600+
[{"int8": 6, "int4": 24}, {"int8": 1}, {"int8": 7}, {}, {"int8": 2}],
601+
),
602+
]
603+
)
604+
584605
if is_transformers_version(">=", "4.45.0"):
585606
LOAD_IN_4_BITS_SCOPE.extend(
586607
[
@@ -668,6 +689,9 @@ class OVWeightCompressionTest(unittest.TestCase):
668689
if is_transformers_version(">=", "4.40.0"):
669690
SUPPORTED_ARCHITECTURES_WITH_AUTO_COMPRESSION.append((OVModelForVisualCausalLM, "nanollava", True))
670691

692+
if is_transformers_version(">=", "4.42.0"):
693+
SUPPORTED_ARCHITECTURES_WITH_AUTO_COMPRESSION.append((OVModelForVisualCausalLM, "llava_next_video", False))
694+
671695
if is_transformers_version(">=", "4.45.0"):
672696
SUPPORTED_ARCHITECTURES_WITH_AUTO_COMPRESSION.append((OVModelForVisualCausalLM, "minicpmv", True))
673697
SUPPORTED_ARCHITECTURES_WITH_AUTO_COMPRESSION.append((OVModelForVisualCausalLM, "qwen2_vl", False))

tests/openvino/utils_tests.py

+1
Original file line number | Diff line number | Diff line change
@@ -202,6 +202,7 @@
202202
"flux-fill": (56, 28, 24, 64, 64),
203203
"llava": (30, 1, 9),
204204
"llava_next": (30, 1, 9),
205+
"llava_next_video": (30, 1, 7, 0, 2),
205206
"minicpmv": (30, 1, 26, 6),
206207
"nanollava": (30, 1, 15),
207208
"qwen2_vl": (30, 1, 1, 10),

0 commit comments

Comments
 (0)