Skip to content

Commit e6ec494

Browse files
Apply suggestions from code review
Co-authored-by: Ilya Lavrenov <ilya.lavrenov@intel.com>
1 parent d053feb commit e6ec494

File tree

3 files changed

+4
-5
lines changed

3 files changed

+4
-5
lines changed

src/cpp/src/model_runner.hpp

+2-2
Original file line number | Diff line number | Diff line change
@@ -209,7 +209,7 @@ class ModelRunner {
209209
sequence_group->get_prompt_ids()[position_id] :
210210
sequence->get_generated_ids()[position_id - prompt_len];
211211
} else if (sequence_group_type == SequenceGroupType::EMBEDDINGS) {
212-
auto generated_embeds = sequence->get_generated_ids_embeds();
212+
const auto& generated_embeds = sequence->get_generated_ids_embeds();
213213
const float* src = position_id < prompt_len ? sequence_group->get_input_embeds()[position_id].data() : generated_embeds[position_id - prompt_len].data();
214214
std::copy_n(src, hidden_size, inputs_embeds_data + token_id * hidden_size);
215215
} else {
@@ -340,7 +340,7 @@ class ModelRunner {
340340
size_t seq_group_id = scheduler_output.m_scheduled_sequence_groups_ids[i];
341341
SequenceGroup::CPtr sequence_group = sequence_groups[seq_group_id];
342342
for (auto seq: sequence_group->get_running_sequences()) {
343-
auto generated_ids = seq->get_generated_ids();
343+
const auto& generated_ids = seq->get_generated_ids();
344344
for (size_t token_idx = seq->get_generated_ids_embeds().size(); token_idx < generated_ids.size(); token_idx++) {
345345
generated_ids_data[pos] = generated_ids[token_idx];
346346
pos++;

src/cpp/src/sequence_group.cpp

+1-2
Original file line number | Diff line number | Diff line change
@@ -40,7 +40,7 @@ size_t Sequence::_make_hash(size_t content_length) {
4040
size = content.size() * sizeof(content[0]);
4141
}
4242
else if (sequence_group->get_sequence_group_type() == SequenceGroupType::EMBEDDINGS) {
43-
const auto input_embeds = sequence_group->get_input_embeds();
43+
const auto& input_embeds = sequence_group->get_input_embeds();
4444
const auto generated_embeds = m_generated_ids_embeds;
4545
OPENVINO_ASSERT(content_length <= input_embeds.size() + generated_embeds.size());
4646
std::vector<float> content_float;
@@ -49,7 +49,6 @@ size_t Sequence::_make_hash(size_t content_length) {
4949
if (block_start_idx < input_embeds.size()) {
5050
for (size_t idx = block_start_idx; idx < std::min(input_embeds.size(), content_length); idx++) {
5151
auto embed = _reduce_embedding(input_embeds[idx]);
52-
const char* embed_char = reinterpret_cast<const char*>(embed.data());
5352
content_float.insert(content_float.end(), embed.begin(), embed.end());
5453
}
5554
}

src/cpp/src/sequence_group.hpp

+1-1
Original file line number | Diff line number | Diff line change
@@ -202,7 +202,7 @@ class Sequence {
202202
m_sequence_group = sequence_group;
203203
}
204204

205-
std::vector<std::vector<float>> get_generated_ids_embeds() const{
205+
const std::vector<std::vector<float>>& get_generated_ids_embeds() const {
206206
OPENVINO_ASSERT(m_type == ov::genai::SequenceGroupType::EMBEDDINGS);
207207
return m_generated_ids_embeds;
208208
}

0 commit comments

Comments
 (0)