Skip to content

Commit 8bf2b6c

Browse files
dynamic quant for first token
1 parent ae63629 commit 8bf2b6c

File tree

2 files changed

+2
-2
lines changed

2 files changed

+2
-2
lines changed

src/plugins/intel_cpu/tests/functional/subgraph_tests/src/matmul_weights_decompression.cpp

+1 -1
Original file line number | Diff line number | Diff line change
@@ -366,7 +366,7 @@ const std::vector<ov::test::ElementType> weights_precisions = {//ov::element::u8
366366
const std::vector<ShapeParams> input_shapes_basic = {
367367
// {{{-1, -1, -1}, {{1, 4, 16}, {10, 16, 16}}}, {16, 32}},
368368
// {{{}, {{1, 8, 16}}}, {16, 32}, 4ul},
369-
{{{}, {{1, 16, 256}}}, {1, 256, 128}},
369+
{{{}, {{1, 64, 32}}}, {1, 32, 8}},
370370
{{{}, {{1, 8, 256}}}, {1, 256, 512}},
371371
{{{}, {{1, 3, 4096}}}, {4096, 4096}, 128},
372372
{{{}, {{1, 3, 4096}}}, {4096, 11008}, 128},

0 commit comments

Comments
 (0)