@@ -54,28 +54,29 @@ LlamaCppModel::LlamaCppModel(const std::string& gguf_fname, const std::shared_pt
54
54
55
55
ov::ParameterVector inputs{input_ids};
56
56
57
- std::vector<std::pair<std::string, ov::element::Type_t>> unused_names_in_order = {
58
- {" attention_mask" , ov::element::Type_t::i64},
59
- {" position_ids" , ov::element::Type_t::i64},
60
- {" beam_idx" , ov::element::Type_t::i32}};
61
- for (const auto & descr : unused_names_in_order) {
62
- auto unused_inp = std::make_shared<ov::opset13::Parameter>(descr.second , ov::PartialShape ({-1 , -1 }));
57
+ std::vector<std::tuple<std::string, ov::element::Type_t, ov::PartialShape>> additional_inputs_in_order = {
58
+ {" attention_mask" , ov::element::Type_t::i64, {-1 , -1 }},
59
+ {" position_ids" , ov::element::Type_t::i64, {-1 , -1 }},
60
+ {" beam_idx" , ov::element::Type_t::i32, {-1 , -1 }}};
61
+
62
+ for (const auto & descr : additional_inputs_in_order) {
63
+ auto unused_inp = std::make_shared<ov::opset13::Parameter>(std::get<1 >(descr), std::get<2 >(descr));
63
64
inputs.push_back (unused_inp);
64
65
}
65
66
66
- m_model = std::make_shared<ov::Model>(logits, inputs, " fake_ov_model_for_io_specification" );
67
+ m_fake_model = std::make_shared<ov::Model>(logits, inputs, " fake_ov_model_for_io_specification" );
67
68
68
- m_model ->inputs ()[0 ].set_names ({" input_ids" });
69
- for (size_t i = 0 ; i < unused_names_in_order .size (); i++) {
70
- m_model ->inputs ()[i + 1 ].set_names ({unused_names_in_order [i]. first });
69
+ m_fake_model ->inputs ()[0 ].set_names ({" input_ids" });
70
+ for (size_t i = 0 ; i < additional_inputs_in_order .size (); i++) {
71
+ m_fake_model ->inputs ()[i + 1 ].set_names ({std::get< 0 >(additional_inputs_in_order [i]) });
71
72
}
72
73
73
- m_model ->outputs ()[0 ].set_names ({" logits" });
74
+ m_fake_model ->outputs ()[0 ].set_names ({" logits" });
74
75
75
- for (auto input : m_model ->inputs ()) {
76
+ for (auto input : m_fake_model ->inputs ()) {
76
77
m_fake_inputs.emplace_back (input);
77
78
}
78
- for (auto output : m_model ->outputs ()) {
79
+ for (auto output : m_fake_model ->outputs ()) {
79
80
m_fake_outputs.emplace_back (output);
80
81
}
81
82
}
0 commit comments