From 312f5556a189cdb149e642071d9f5b2f29bc3a63 Mon Sep 17 00:00:00 2001
From: Nikita Savelyev
Date: Tue, 18 Feb 2025 18:37:31 +0100
Subject: [PATCH] Add default int4 configurations for DeepSeek-R1-Distill-Qwen models

---
 optimum/intel/openvino/configuration.py | 18 ++++++++++++++++++
 1 file changed, 18 insertions(+)

diff --git a/optimum/intel/openvino/configuration.py b/optimum/intel/openvino/configuration.py
index 9c443d37c5..0b92f4ee5e 100644
--- a/optimum/intel/openvino/configuration.py
+++ b/optimum/intel/openvino/configuration.py
@@ -210,6 +210,24 @@ class OVQuantizationMethod(str, Enum):
         "quant_method": OVQuantizationMethod.AWQ,
         "scale_estimation": True,
     },
+    "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": {
+        "bits": 4,
+        "sym": False,
+        "group_size": 32,
+        "ratio": 0.7,
+        "dataset": "wikitext2",
+        "quant_method": OVQuantizationMethod.AWQ,
+        "scale_estimation": True,
+    },
+    "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B": {
+        "bits": 4,
+        "sym": False,
+        "group_size": 128,
+        "ratio": 1.0,
+        "dataset": "wikitext2",
+        "quant_method": OVQuantizationMethod.AWQ,
+        "scale_estimation": True,
+    },
     "deepseek-ai/DeepSeek-R1-Distill-Llama-8B": {
         "bits": 4,
         "sym": False,