@@ -102,23 +102,19 @@ StatefulLLMPipeline::StatefulLLMPipeline(
102
102
): StatefulLLMPipeline(
103
103
genai::utils::singleton_core ().read_model(models_path / " openvino_model.xml" , {}, config),
104
104
tokenizer, config,
105
- utils::from_config_json_if_exists(models_path),
106
- models_path
105
+ utils::from_config_json_if_exists(models_path)
107
106
) {
108
107
}
109
108
110
109
StatefulLLMPipeline::StatefulLLMPipeline (
111
110
const std::shared_ptr<ov::Model>& model,
112
111
const ov::genai::Tokenizer& tokenizer,
113
112
const ov::AnyMap& properties,
114
- const ov::genai::GenerationConfig& generation_config,
115
- const std::filesystem::path& models_path
113
+ const ov::genai::GenerationConfig& generation_config
116
114
) : LLMPipelineImplBase(tokenizer, generation_config),
117
115
m_sampler(m_tokenizer) {
118
116
auto kv_pos = ov::genai::utils::get_kv_axes_pos (model);
119
- auto [compiled, kv_desc] = utils::compile_decoder_for_npu (
120
- model, properties, kv_pos, models_path / " openvino_model.xml"
121
- );
117
+ auto [compiled, kv_desc] = utils::compile_decoder_for_npu (model, properties, kv_pos);
122
118
m_max_prompt_len = kv_desc.max_prompt_len ;
123
119
m_kvcache_total = kv_desc.max_prompt_len + kv_desc.min_response_len ;
124
120
m_request = compiled.create_infer_request ();
@@ -358,16 +354,14 @@ LLMPipelineFactory::create(const std::filesystem::path& models_path,
358
354
// Factory overload that builds a static LLM pipeline implementation from a
// model object, a tokenizer, a property map and a generation config.
//
// The pipeline kind is read from the property map and only the STATEFUL kind
// is handled here; any other kind falls through to the assertion at the end.
//
// Reading this diff view: lines prefixed with `-` are removed by the patch and
// lines prefixed with `+` are added. The patch drops the trailing
// `models_path` parameter from this overload and stops forwarding it to the
// StatefulLLMPipeline constructor. Bare numbers on their own lines are old/new
// line-number residue from the diff rendering, not code.
//
// NOTE(review): the leading spaces inside the string literals below
// (" STATIC_PIPELINE", " STATEFUL") look like extraction artifacts of this
// diff rendering -- confirm against the real source file before relying on them.
std::unique_ptr<LLMPipelineImplBase> LLMPipelineFactory::create (const std::shared_ptr<ov::Model>& model,
359
355
const ov::genai::Tokenizer& tokenizer,
360
356
const ov::AnyMap& properties,
361
- const ov::genai::GenerationConfig& generation_config,
362
- const std::filesystem::path& models_path) {
357
+ const ov::genai::GenerationConfig& generation_config) {
363
358
// Work on a private copy: `properties` is a const reference, and the lookup
// below takes the map by name `pop_or_default`, which presumably removes the
// key it reads -- TODO confirm against utils::pop_or_default.
auto properties_copy = properties;
364
359
// Pipeline kind comes from the property map, with "STATEFUL" as the fallback
// value passed to pop_or_default.
const auto pipeline_mode = str_to_pipeline (utils::pop_or_default (properties_copy, " STATIC_PIPELINE" , std::string (" STATEFUL" )));
365
360
if (pipeline_mode == StaticPipelineKind::STATEFUL) {
366
361
// The copied map (not the caller's original) is what gets forwarded.
return std::make_unique<ov::genai::static_llm::StatefulLLMPipeline>(model,
367
362
tokenizer,
368
363
properties_copy,
369
- generation_config,
370
- models_path);
364
+ generation_config);
371
365
}
372
366
// No other pipeline kind is handled in this function; reaching this point is
// treated as an error (presumably OPENVINO_ASSERT throws -- verify).
OPENVINO_ASSERT (false );
373
367
}
0 commit comments