@@ -121,6 +121,7 @@ Dataset filtered_dataset(const std::string& models_path, const std::string& data
121
121
122
122
ov::genai::GenerationConfig greedy_search = ov::genai::greedy ();
123
123
greedy_search.max_new_tokens = std::min (max_output_len, output_len);
124
+ greedy_search.ignore_eos = true ;
124
125
greedy_search.repetition_penalty = 1.0 ;
125
126
greedy_search.frequency_penalty = 0.0 ;
126
127
greedy_search.presence_penalty = 0.0 ;
@@ -228,14 +229,16 @@ class GenerationInfo {
228
229
229
230
GenerationMetrics get_metrics () {
230
231
GenerationMetrics generation_metrics;
231
- for (auto & sequenceInfoPair : sequences_info) {
232
- generation_metrics.mean_ttft += sequenceInfoPair.second .ttft ;
233
- generation_metrics.mean_tpot += sequenceInfoPair.second .mean_tpot ;
234
- generation_metrics.num_output_tokens += sequenceInfoPair.second .num_output_tokens ;
232
+ if (!sequences_info.empty ()) {
233
+ for (auto & sequenceInfoPair : sequences_info) {
234
+ generation_metrics.mean_ttft += sequenceInfoPair.second .ttft ;
235
+ generation_metrics.mean_tpot += sequenceInfoPair.second .mean_tpot ;
236
+ generation_metrics.num_output_tokens += sequenceInfoPair.second .num_output_tokens ;
237
+ }
238
+ generation_metrics.mean_ttft /= sequences_info.size ();
239
+ generation_metrics.mean_tpot /= sequences_info.size ();
240
+ generation_metrics.num_input_tokens = input_len;
235
241
}
236
- generation_metrics.mean_ttft /= sequences_info.size ();
237
- generation_metrics.mean_tpot /= sequences_info.size ();
238
- generation_metrics.num_input_tokens = input_len;
239
242
return generation_metrics;
240
243
}
241
244
};
0 commit comments