Skip to content

Commit ea784c1

Browse files
[SYCL] re-enabled mul_mat_batched_sycl path for batched Q*K & KQ*V (#8057)
1 parent 0e4699e commit ea784c1

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

ggml-sycl.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -15228,7 +15228,7 @@ static void ggml_sycl_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1
15228 15228
} else if (!split && src0->type == GGML_TYPE_F16 && !ggml_is_contiguous(src0) && !ggml_is_transposed(src1) && src1->ne[1] == 1) {
15229 15229
// KQV single-batch
15230 15230
ggml_sycl_mul_mat_vec_nc(src0, src1, dst);
15231 -
} else if (!split && src0->type == GGML_TYPE_F16 && (src1->type == GGML_TYPE_F16) && !ggml_is_transposed(src0) && !ggml_is_transposed(src1) && src1->ne[2]*src1->ne[3] > 1) {
15231 +
} else if (!split && src0->type == GGML_TYPE_F16 && !ggml_is_transposed(src0) && !ggml_is_transposed(src1) && src1->ne[2] * src1->ne[3] > 1) {
15232 15232
// KQ + KQV multi-batch
15233 15233
ggml_sycl_mul_mat_batched_sycl(src0, src1, dst);
15234 15234
} else if (use_dequantize_mul_mat_vec) {

0 commit comments

Comments
 (0)