Skip to content

Commit 42c4b05

Browse files
committed Feb 15, 2024
[CPU] Enabled dynamic quantization by default
1 parent d247233 commit 42c4b05

File tree

2 files changed

+2
-2
lines changed

2 files changed

+2
-2
lines changed
 

‎src/plugins/intel_cpu/src/config.h

+1-1
Original file line number | Diff line number | Diff line change
@@ -55,7 +55,7 @@ struct Config {
5555
std::string dumpToDot = {};
5656
std::string device_id = {};
5757
float fcSparseWeiDecompressionRate = 1.0f;
58-
uint64_t fcDynamicQuantizationGroupSize = 0;
58+
uint64_t fcDynamicQuantizationGroupSize = 32;
5959
ov::element::Type kvCachePrecision = ov::element::f16;
6060
#if defined(OPENVINO_ARCH_X86_64)
6161
size_t rtCacheCapacity = 5000ul;

‎src/plugins/intel_cpu/src/transformations/transformation_pipeline.cpp

+1-1
Original file line number | Diff line number | Diff line change
@@ -289,7 +289,7 @@ void Transformations::PreLpt(const std::vector<ov::element::Type>& defaultPrecis
289289
ov::element::i4,
290290
ov::element::nf4};
291291
CPU_REGISTER_PASS_X64(decompression_handling_manager, ov::pass::MarkDequantizationSubgraph, decompression_precisions,
292-
config.fcDynamicQuantizationGroupSize != 0);
292+
config.fcDynamicQuantizationGroupSize == 0);
293293
CPU_SET_CALLBACK_X64(decompression_handling_manager, [&](const_node_ptr &node) -> bool {
294294
return !is_decompression_multiply(node);
295295
}, ov::pass::MarkDequantizationSubgraph);

0 commit comments

Comments
 (0)