@@ -38,15 +38,16 @@ def get_compressed_path(output_dir: str, base_precision, option: str):
38
38
"opt-6.7b" : {"mode" : nncf .CompressWeightsMode .INT4_ASYM , "group_size" : 64 , "ratio" : 0.8 },
39
39
"bloomz-7b1" : {"mode" : nncf .CompressWeightsMode .INT4_ASYM , "group_size" : 32 , "ratio" : 0.6 },
40
40
"red-pajama-incite-7b-instruct" : {"mode" : nncf .CompressWeightsMode .INT4_ASYM , "group_size" : 128 },
41
- "zephyr-7b-beta" : {"mode" : nncf .CompressWeightsMode .INT4_SYM , "group_size" : 64 , "ratio" : 0.6 },
41
+ "zephyr-7b-beta" : {"mode" : nncf .CompressWeightsMode .INT4_SYM , "group_size" : 128 , "ratio" : 0.8 ,
42
+ "dataset" : {"name" : "wikitext,wikitext-2-v1,train[:1000],text" , "awq" : True }},
42
43
"llama-2-7b" : {"mode" : nncf .CompressWeightsMode .INT4_SYM , "group_size" : 128 , "ratio" : 0.6 },
43
44
"llama-2-7b-chat" : {"mode" : nncf .CompressWeightsMode .INT4_SYM , "group_size" : 128 , "ratio" : 0.8 },
44
45
"llama-2-13b-chat" : {"mode" : nncf .CompressWeightsMode .INT4_SYM , "group_size" : 64 , "ratio" : 0.8 },
45
46
"stablelm-3b-4e1t" : {"mode" : nncf .CompressWeightsMode .INT4_SYM , "group_size" : 64 , "ratio" : 0.8 ,
46
47
"dataset" : {"name" : "wikitext,wikitext-2-v1,train[:1000],text" , "awq" : True }},
47
48
"stablelm-epoch-3b-preview" : {"mode" : nncf .CompressWeightsMode .INT4_SYM , "group_size" : 64 , "ratio" : 0.8 ,
48
49
"dataset" : {"name" : "wikitext,wikitext-2-v1,train[:1000],text" , "awq" : True }},
49
- "stable-zephyr-3b-dpo" : {"mode" : nncf .CompressWeightsMode .INT4_ASYM , "group_size" : 64 , "ratio" : 0.8 ,
50
+ "stable-zephyr-3b-dpo" : {"mode" : nncf .CompressWeightsMode .INT4_ASYM , "group_size" : 128 , "ratio" : 1.0 ,
50
51
"dataset" : {"name" : "wikitext,wikitext-2-v1,train[:1000],text" , "awq" : True }},
51
52
"stable-code-3b" : {"mode" : nncf .CompressWeightsMode .INT4_SYM , "group_size" : 64 , "ratio" : 0.8 },
52
53
"rocket-3b" : {"mode" : nncf .CompressWeightsMode .INT4_SYM , "group_size" : 128 , "ratio" : 0.8 },
@@ -59,4 +60,8 @@ def get_compressed_path(output_dir: str, base_precision, option: str):
59
60
"bloomz-560m" : {"mode" : nncf .CompressWeightsMode .INT4_SYM , "group_size" : 64 , "ratio" : 0.8 ,
60
61
"dataset" : {"name" : "wikitext,wikitext-2-v1,train[:1000],text" , "awq" : True }},
61
62
"mixtral-8x7b-v0.1" : {"mode" : nncf .CompressWeightsMode .INT4_SYM , "group_size" : 128 , "ratio" : 0.8 },
63
+ "baichuan2-7b-chat" : {"mode" : nncf .CompressWeightsMode .INT4_SYM , "group_size" : 128 , "ratio" : 0.8 ,
64
+ "dataset" : {"name" : "wikitext,wikitext-2-v1,train[:1000],text" , "awq" : True }},
65
+ "mistral-7b-v0.1" : {"mode" : nncf .CompressWeightsMode .INT4_SYM , "group_size" : 128 , "ratio" : 0.9 },
66
+ "llama-7b" : {"mode" : nncf .CompressWeightsMode .INT4_SYM , "group_size" : 128 , "ratio" : 0.7 },
62
67
}
0 commit comments