File tree 3 files changed +4
-5
lines changed
3 files changed +4
-5
lines changed Original file line number Diff line number Diff line change @@ -209,7 +209,7 @@ class ModelRunner {
209
209
sequence_group->get_prompt_ids ()[position_id] :
210
210
sequence->get_generated_ids ()[position_id - prompt_len];
211
211
} else if (sequence_group_type == SequenceGroupType::EMBEDDINGS) {
212
- auto generated_embeds = sequence->get_generated_ids_embeds ();
212
+ const auto & generated_embeds = sequence->get_generated_ids_embeds ();
213
213
const float * src = position_id < prompt_len ? sequence_group->get_input_embeds ()[position_id].data () : generated_embeds[position_id - prompt_len].data ();
214
214
std::copy_n (src, hidden_size, inputs_embeds_data + token_id * hidden_size);
215
215
} else {
@@ -340,7 +340,7 @@ class ModelRunner {
340
340
size_t seq_group_id = scheduler_output.m_scheduled_sequence_groups_ids [i];
341
341
SequenceGroup::CPtr sequence_group = sequence_groups[seq_group_id];
342
342
for (auto seq: sequence_group->get_running_sequences ()) {
343
- auto generated_ids = seq->get_generated_ids ();
343
+ const auto & generated_ids = seq->get_generated_ids ();
344
344
for (size_t token_idx = seq->get_generated_ids_embeds ().size (); token_idx < generated_ids.size (); token_idx++) {
345
345
generated_ids_data[pos] = generated_ids[token_idx];
346
346
pos++;
Original file line number Diff line number Diff line change @@ -40,7 +40,7 @@ size_t Sequence::_make_hash(size_t content_length) {
40
40
size = content.size () * sizeof (content[0 ]);
41
41
}
42
42
else if (sequence_group->get_sequence_group_type () == SequenceGroupType::EMBEDDINGS) {
43
- const auto input_embeds = sequence_group->get_input_embeds ();
43
+ const auto & input_embeds = sequence_group->get_input_embeds ();
44
44
const auto generated_embeds = m_generated_ids_embeds;
45
45
OPENVINO_ASSERT (content_length <= input_embeds.size () + generated_embeds.size ());
46
46
std::vector<float > content_float;
@@ -49,7 +49,6 @@ size_t Sequence::_make_hash(size_t content_length) {
49
49
if (block_start_idx < input_embeds.size ()) {
50
50
for (size_t idx = block_start_idx; idx < std::min (input_embeds.size (), content_length); idx++) {
51
51
auto embed = _reduce_embedding (input_embeds[idx]);
52
- const char * embed_char = reinterpret_cast <const char *>(embed.data ());
53
52
content_float.insert (content_float.end (), embed.begin (), embed.end ());
54
53
}
55
54
}
Original file line number Diff line number Diff line change @@ -202,7 +202,7 @@ class Sequence {
202
202
m_sequence_group = sequence_group;
203
203
}
204
204
205
- std::vector<std::vector<float >> get_generated_ids_embeds () const {
205
+ const std::vector<std::vector<float >>& get_generated_ids_embeds () const {
206
206
OPENVINO_ASSERT (m_type == ov::genai::SequenceGroupType::EMBEDDINGS);
207
207
return m_generated_ids_embeds;
208
208
}
You can’t perform that action at this time.
0 commit comments