Skip to content

Commit 4b17701

Browse files
author
Aidan
committed
Fix q_xxs using mul_mat_q
1 parent 62bfef5 commit 4b17701

File tree

1 file changed

+1
-0
lines changed

1 file changed

+1
-0
lines changed

ggml-sycl.cpp

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -15243,6 +15243,7 @@ static void ggml_sycl_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1
15243 15243   }
15244 15244   } else {
15245 15245   bool use_mul_mat_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type);
      15246 + use_mul_mat_q = use_mul_mat_q && (src0->type != GGML_TYPE_IQ2_XXS);
15246 15247
15247 15248   if (use_xmx && min_compute_capability >= VER_GEN9 && src1->ne[1] > XMX_MAX_BATCH_SIZE) {
15248 15249   use_mul_mat_q = false;

0 commit comments

Comments
 (0)