Skip to content

Commit 9ede790

Browse files
authored
fix int8 pipeline init on arm (#2837)
CVS-164848
1 parent 9b3cc65 commit 9ede790

File tree

2 files changed

+4
-1
lines changed

2 files changed

+4
-1
lines changed

notebooks/grammar-correction/grammar-correction.ipynb

+1
Original file line number | Diff line number | Diff line change
@@ -981,6 +981,7 @@
981981
" quantized_model_path,\n",
982982
" device.value,\n",
983983
" calibration_dataset_size=CALIBRATION_DATASET_SIZE,\n",
984+
" additional_args=additional_args\n",
984985
" )"
985986
]
986987
},

notebooks/grammar-correction/utils.py

+3 -1
Original file line number | Diff line number | Diff line change
@@ -87,6 +87,7 @@ def get_quantized_pipeline(
8787
quantized_model_path: Path,
8888
device: str,
8989
calibration_dataset_size=CALIBRATION_DATASET_SIZE,
90+
additional_args=None,
9091
):
9192
# Get quantized OV model
9293
quantized_model = quantize(grammar_corrector_pipe, core, quantized_model_path, calibration_dataset_size)
@@ -96,7 +97,8 @@ def get_quantized_pipeline(
9697
grammar_corrector_model_int8.decoder.model = quantized_model
9798
grammar_corrector_model_int8.decoder.request = None
9899
grammar_corrector_model_int8.decoder._compile()
99-
grammar_corrector_pipe_int8 = pipeline("text2text-generation", model=grammar_corrector_model_int8, tokenizer=grammar_corrector_tokenizer)
100+
additional_args = additional_args or {}
101+
grammar_corrector_pipe_int8 = pipeline("text2text-generation", model=grammar_corrector_model_int8, tokenizer=grammar_corrector_tokenizer, **additional_args)
100102

101103
return grammar_corrector_pipe_int8
102104

0 commit comments

Comments
 (0)