|
12 | 12 | #include "openvino/runtime/properties.hpp"
|
13 | 13 | #include "utils/debug_capabilities.h"
|
14 | 14 | #include "utils/precision_support.h"
|
| 15 | +#include "utils/cpu_utils.hpp" |
15 | 16 |
|
16 | 17 | #include <algorithm>
|
17 | 18 | #include <map>
|
@@ -215,12 +216,12 @@ void Config::readProperties(const ov::AnyMap& prop, const ModelType modelType) {
|
215 | 216 | } else {
|
216 | 217 | fcSparseWeiDecompressionRate = val_f;
|
217 | 218 | }
|
218 |
| - } else if (key == ov::dynamic_quantization_group_size.name()) { |
| 219 | + } else if (key == ov::hint::dynamic_quantization_group_size.name()) { |
219 | 220 | try {
|
220 | 221 | fcDynamicQuantizationGroupSize = val.as<uint64_t>();
|
221 | 222 | } catch (const ov::Exception&) {
|
222 | 223 | OPENVINO_THROW("Wrong value for property key ",
|
223 |
| - ov::dynamic_quantization_group_size.name(), |
| 224 | + ov::hint::dynamic_quantization_group_size.name(), |
224 | 225 | ". Expected only unsinged integer numbers");
|
225 | 226 | }
|
226 | 227 | } else if (key == ov::enable_profiling.name()) {
|
@@ -341,6 +342,21 @@ void Config::readProperties(const ov::AnyMap& prop, const ModelType modelType) {
|
341 | 342 | ov::hint::execution_mode.name(),
|
342 | 343 | ". Supported values: ov::hint::ExecutionMode::PERFORMANCE/ACCURACY");
|
343 | 344 | }
|
| 345 | + } else if (key == ov::hint::kv_cache_precision.name()) { |
| 346 | + try { |
| 347 | + auto const prec = val.as<ov::element::Type>(); |
| 348 | + if (one_of(prec, ov::element::f32, ov::element::f16, ov::element::bf16, ov::element::u8)) { |
| 349 | + kvCachePrecision = prec; |
| 350 | + } else { |
| 351 | + OPENVINO_THROW("invalid value"); |
| 352 | + } |
| 353 | + } catch (ov::Exception&) { |
| 354 | + OPENVINO_THROW("Wrong value ", |
| 355 | + val.as<std::string>(), |
| 356 | + " for property key ", |
| 357 | + ov::hint::kv_cache_precision.name(), |
| 358 | + ". Supported values: s8, bf16, f16, f32"); |
| 359 | + } |
344 | 360 | } else {
|
345 | 361 | OPENVINO_THROW("NotFound: Unsupported property ", key, " by CPU plugin.");
|
346 | 362 | }
|
|
0 commit comments