Skip to content

Commit d149dd4

Browse files
author
Vladimir Paramuzov
committed
fixes
1 parent 478c588 commit d149dd4

File tree

2 files changed

+3
-3
lines changed

2 files changed

+3
-3
lines changed

src/plugins/intel_gpu/src/kernel_selector/cl_kernels/sdpa_micro.cl

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -265,7 +265,7 @@ KERNEL(micro_sdpa)(OPTIONAL_SHAPE_INFO_ARG
265265

266266
#if WITH_ATTN_MASK
267267
mask_tile_type mask_tile;
268-
tile_load_t(&mask_tile, msk, k, q, q, sg_j0_kq + wg_j0, k0 + sg_i0_kq);
268+
tile_load_t(&mask_tile, msk, q, k, q, sg_j0_kq + wg_j0, k0 + sg_i0_kq);
269269
#endif
270270

271271
#if REMAINDER_K

src/plugins/intel_gpu/src/kernel_selector/kernels/sdpa/sdpa_kernel_micro.cpp

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -187,7 +187,7 @@ void SDPAKernelMicro::init_microkernels(const sdpa_params& params, micro::Packag
187187
auto& out = params.outputs[0];
188188
const auto head_size = params.conf.head_size;
189189
const auto d_max = get_d_max(head_size);
190-
const Tensor::Dim n_keys = K.X().v; //get_seq_length(K, params.input1_order);
190+
const Tensor::Dim n_keys = get_seq_length(K, params.input1_order);
191191
const Tensor::Dim n_queries = get_seq_length(Q, params.input0_order);
192192
const Tensor::Dim n_values = V.X();
193193
const auto batch = out.Batch().v * out.Feature().v;
@@ -585,7 +585,7 @@ void SDPAKernelMicro::GetUpdateDispatchDataFunc(KernelData& kd) const {
585585
s_q.t = ScalarDescriptor::Types::INT32;
586586
s_q.v.s32 = static_cast<uint32_t>(n_queries.v);
587587

588-
const bool is_prefill = true;//n_queries.v > 1;
588+
const bool is_prefill = n_queries.v > 1;
589589

590590
OPENVINO_ASSERT(kernel_data.kernels.size() == 2, "[GPU] Invalid kernels size for update dispatch data func");
591591

0 commit comments

Comments
 (0)