Skip to content

Commit 95f84d5

Browse files
authored
Fix q_xxs using mul_mat_q (#7459)
1 parent 5487593 commit 95f84d5

File tree

1 file changed

+1
-0
lines changed

1 file changed

+1
-0
lines changed

ggml-sycl.cpp

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -15263,6 +15263,7 @@ static void ggml_sycl_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1
15263 15263
}
15264 15264
} else {
15265 15265
bool use_mul_mat_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type);
15266+
use_mul_mat_q = use_mul_mat_q && (src0->type != GGML_TYPE_IQ2_XXS);
15266 15267

15267 15268
if (use_xmx && min_compute_capability >= VER_GEN9 && src1->ne[1] > XMX_MAX_BATCH_SIZE) {
15268 15269
use_mul_mat_q = false;

0 commit comments

Comments
 (0)