From 1d8e174f1ee180877b7225269048df202cc318ca Mon Sep 17 00:00:00 2001 From: Nikita Savelyev Date: Wed, 12 Feb 2025 17:20:05 +0100 Subject: [PATCH] Add default int4 config for DeepSeek-R1-Distill-Llama-8B --- optimum/intel/openvino/configuration.py | 8 ++++++++ 1 file changed, 8 insertions(+) diff --git a/optimum/intel/openvino/configuration.py b/optimum/intel/openvino/configuration.py index 966ab57c51..06fbe2109e 100644 --- a/optimum/intel/openvino/configuration.py +++ b/optimum/intel/openvino/configuration.py @@ -210,6 +210,14 @@ class OVQuantizationMethod(str, Enum): "quant_method": OVQuantizationMethod.AWQ, "scale_estimation": True, }, + "deepseek-ai/DeepSeek-R1-Distill-Llama-8B": { + "bits": 4, + "sym": False, + "group_size": 64, + "ratio": 0.8, + "dataset": "wikitext2", + "quant_method": OVQuantizationMethod.AWQ, + }, } _DEFAULT_4BIT_CONFIG = {