Skip to content

Commit 8846fb8

Browse files
committed Mar 18, 2025
[CHECK] OVMS try CPU crash
1 parent 69720e5 commit 8846fb8

File tree

1 file changed

+1
-6
lines changed

1 file changed

+1
-6
lines changed
 

‎src/cpp/src/continuous_batching_impl.cpp

+1 -6
Original file line number | Diff line number | Diff line change
@@ -115,12 +115,7 @@ void ContinuousBatchingPipeline::ContinuousBatchingImpl::initialize_pipeline(
115 115
normalized_config.num_kv_blocks = size_in_bytes / cache_manager->get_block_size_in_bytes();
116 116
}
117 117

118-
bool can_use_partial_preemption = true;
119-
if (device.find("GPU") != std::string::npos && !normalized_config.dynamic_split_fuse) {
120-
// in case of executing a `vLLM-like` pipeline, it's better not to use partial eviction on the GPU,
121-
// as it may lead to performance slowdown
122-
can_use_partial_preemption = false;
123-
}
118+
bool can_use_partial_preemption = false;
124 119

125 120
m_scheduler = std::make_shared<Scheduler>(m_block_size, cache_manager, normalized_config, m_num_decoder_layers, can_use_partial_preemption);
126 121

0 commit comments

Comments
 (0)