Skip to content

Commit 46fb2f5

Browse files
committed
[GPU] Fix synchronization in the PagedAttention kernel when KV-cache rotation is enabled but skipped for the current iteration
1 parent 6eda8ce commit 46fb2f5

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

src/plugins/intel_gpu/src/graph/impls/ocl/paged_attention.cpp

+1 -1
Original file line number | Diff line number | Diff line change
@@ -346,7 +346,7 @@ struct paged_attention_impl : multi_stage_primitive<paged_attention> {
346346

347347
std::vector<event::ptr> res_events;
348348
std::vector<event::ptr> dep_events = events;
349-
if (has_rotated_blocks) {
349+
if (has_rotated_blocks && !_kernels_data[Stage::KV_CACHE_ROTATE].kernels[0].skip_execution) {
350350
execute_stage(dep_events, instance, res_events, Stage::KV_CACHE_ROTATE, is_mixed_mode);
351351
dep_events = res_events;
352352
}

0 commit comments

Comments
 (0)