@@ -3028,7 +3028,7 @@ static bool should_reorder_tensor(ggml_backend_sycl_context& ctx, const ggml_ten
3028
3028
return !g_ggml_sycl_disable_optimize && // allow optimize, controlled by $GGML_SYCL_DISABLE_OPT
3029
3029
ctx.opt_feature .reorder && // allow this device due to good perf, skip the devices with bad perf.
3030
3030
dst->op == GGML_OP_MUL_MAT && // limit to some supported cases of Q4_0, to do for more cases.
3031
- dst->src [1 ]->ne [2 ]==1 && dst->src [1 ]->ne [3 ]==1 ;
3031
+ dst->src [1 ]->ne [1 ]== 1 && dst-> src [ 1 ]-> ne [ 2 ]==1 && dst->src [1 ]->ne [3 ]==1 ;
3032
3032
}
3033
3033
3034
3034
static void opt_for_reorder (ggml_backend_sycl_context * ctx, const ggml_tensor * src0, const ggml_tensor * /* src1 */ ,
@@ -3151,8 +3151,6 @@ static void ggml_sycl_mul_mat(ggml_backend_sycl_context & ctx, const ggml_tensor
3151
3151
ggml_sycl_op_mul_mat (ctx, src0, src1, dst, ggml_sycl_op_mul_mat_q, convert_src1_to_q8_1);
3152
3152
} else {
3153
3153
constexpr bool convert_src1_to_q8_1 = false ;
3154
- // MUL_MAT_SYCL supports reorder
3155
- opt_for_reorder (&ctx, src0, src1, dst, mul_mat_algo::MUL_MAT_SYCL);
3156
3154
ggml_sycl_op_mul_mat (ctx, src0, src1, dst, ggml_sycl_op_mul_mat_sycl, convert_src1_to_q8_1);
3157
3155
}
3158
3156
GGML_SYCL_DEBUG (" call %s done\n " , __func__);
0 commit comments