Skip to content

Commit f423b30

Browse files
Add AWQ
1 parent 30c5496 commit f423b30

File tree

1 file changed

+8
-1
lines changed

1 file changed

+8
-1
lines changed

optimum/intel/openvino/configuration.py

+8 -1
Original file line number | Diff line number | Diff line change
@@ -77,7 +77,14 @@ class OVQuantizationMethod(str, Enum):
77 | 77
"THUDM/chatglm2-6b": {"bits": 4, "sym": True, "group_size": 128, "ratio": 0.72},
78 | 78
"Qwen/Qwen-7B-Chat": {"bits": 4, "sym": True, "group_size": 128, "ratio": 0.6},
79 | 79
"openlm-research/open_llama_3b": {"bits": 4, "sym": False, "group_size": 64, "all_layers": True},
80-
"openlm-research/open_llama_3b_v2": {"bits": 4, "sym": False, "group_size": 64},
80+
"openlm-research/open_llama_3b_v2": {
81+
"bits": 4,
82+
"sym": False,
83+
"group_size": 64,
84+
"ratio": 1.0,
85+
"dataset": "wikitext2",
86+
"quant_method": OVQuantizationMethod.AWQ,
87+
},
81 | 88
"tiiuae/falcon-7b-instruct": {"bits": 4, "sym": True, "group_size": 64, "all_layers": True},
82 | 89
"psmathur/orca_mini_3b": {
83 | 90
"bits": 4,

0 commit comments

Comments
 (0)