Skip to content

Commit 2ec2a54

Browse files
committed
Style
1 parent 54f8fe0 commit 2ec2a54

File tree

2 files changed

+28
-3
lines changed

2 files changed

+28
-3
lines changed

optimum/intel/openvino/weight_quantization.py

+3 -1
Original file line number | Diff line number | Diff line change
@@ -96,6 +96,7 @@ def post_init(self):
9696
['wikitext2','c4','c4-new','ptb','ptb-new'], but we found {self.dataset}"""
9797
)
9898

99+
99100
DEFAULT_4BIT_CONFIGS = {
100101
"dolly-v2-3b": {"mode": nncf.CompressWeightsMode.INT4_ASYM, "group_size": 32, "ratio": 0.5},
101102
"gpt-j-6b": {"mode": nncf.CompressWeightsMode.INT4_ASYM, "group_size": 64},
@@ -114,6 +115,7 @@ def post_init(self):
114115
"qwen-7b-chat": {"mode": nncf.CompressWeightsMode.INT4_SYM, "group_size": 128, "ratio": 0.6},
115116
}
116117

118+
117119
def _check_default_4bit_configs(config: PretrainedConfig):
118120
return DEFAULT_4BIT_CONFIGS.get(config.name_or_path, None)
119121

@@ -150,7 +152,7 @@ def compress_decoder_weights(model, quantization_config: Union[OVWeightQuantizat
150152
group_size=config.group_size,
151153
all_layers=config.all_layers,
152154
sensitivity_metric=config.sensitivity_metric,
153-
awq = config.awq,
155+
awq=config.awq,
154156
ignored_scope=config.ignored_scope,
155157
dataset=dataset,
156158
)

tests/openvino/test_quantization.py

+25 -2
Original file line number | Diff line number | Diff line change
@@ -181,8 +181,31 @@ class OVWeightCompressionTest(unittest.TestCase):
181181
dict(mode=nncf.CompressWeightsMode.INT4_ASYM, group_size=-1, ratio=0.8, all_layers=True),
182182
22,
183183
),
184-
# TODO: uncomment after fix
185-
# (OVModelForCausalLM, "hf-internal-testing/tiny-random-gpt2", dict(mode=nncf.CompressWeightsMode.INT4_SYM, group_size=-1, ratio=0.8, sensitivity_metric=nncf.SensitivityMetric.MEAN_ACTIVATION_MAGNITUDE, dataset="ptb"), 16),
184+
(
185+
OVModelForCausalLM,
186+
"hf-internal-testing/tiny-random-gpt2",
187+
dict(
188+
mode=nncf.CompressWeightsMode.INT4_SYM,
189+
group_size=-1,
190+
ratio=0.8,
191+
sensitivity_metric=nncf.SensitivityMetric.MEAN_ACTIVATION_MAGNITUDE,
192+
dataset="ptb",
193+
),
194+
16,
195+
),
196+
(
197+
OVModelForCausalLM,
198+
"hf-internal-testing/tiny-random-gpt2",
199+
dict(
200+
mode=nncf.CompressWeightsMode.INT4_SYM,
201+
group_size=-1,
202+
ratio=0.8,
203+
sensitivity_metric=nncf.SensitivityMetric.MEAN_ACTIVATION_MAGNITUDE,
204+
dataset="ptb",
205+
awq=True,
206+
),
207+
16,
208+
),
186209
)
187210

188211
SUPPORTED_ARCHITECTURES_WITH_AUTO_COMPRESSION = (

0 commit comments

Comments
 (0)