Skip to content

Commit 1fbd98f

Browse files
authored
Update dynamic_quantize_gpu_kv_cache.cl
1 parent 317638e commit 1fbd98f

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

src/plugins/intel_gpu/src/kernel_selector/cl_kernels/dynamic_quantize_gpu_kv_cache.cl

+1 -1
Original file line number | Diff line number | Diff line change
@@ -89,7 +89,7 @@ KERNEL(dynamic_quantize_gpu_kv_cache)(
8989
max_value = work_group_reduce_max(max_value);
9090

9191
// If the range of input data is zero, it is adjusted to the minimum value(0.001).
92-
half diff_value = max_value == min_value ? (grp_max) : (max_value - min_value);
92+
ACCUMULATOR_TYPE diff_value = max_value == min_value ? (grp_max) : (max_value - min_value);
9393
ACCUMULATOR_TYPE scale_tmp = (ACCUMULATOR_TYPE)((CHAR_MAX - CHAR_MIN) / diff_value);
9494
ACCUMULATOR_TYPE zp_tmp = (ACCUMULATOR_TYPE)(-min_value * scale_tmp) + CHAR_MIN;
9595
OUTPUT1_TYPE scale = (OUTPUT1_TYPE)(scale_tmp);

0 commit comments

Comments
 (0)