Skip to content

Commit 155902b

Browse files
author
Aidan
committed
Fix q_xxs using mul_mat_q
1 parent 9a17ab9 commit 155902b

File tree

1 file changed

+1
-0
lines changed

1 file changed

+1
-0
lines changed

ggml-sycl.cpp

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -15703,6 +15703,7 @@ static void ggml_sycl_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1
15703 15703
}
15704 15704
} else {
15705 15705
bool use_mul_mat_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type);
15706 +
use_mul_mat_q = use_mul_mat_q && (src0->type != GGML_TYPE_IQ2_XXS);
15706 15707

15707 15708
if (use_xmx && min_compute_capability >= VER_GEN9 && src1->ne[1] > XMX_MAX_BATCH_SIZE) {
15708 15709
use_mul_mat_q = false;
use_mul_mat_q = false;

0 commit comments

Comments
 (0)