Skip to content

Commit 42f70cb

Browse files
ikawrakow and Kawrakow authored
Fix scalar version of Q5_K when QK_K = 64 (#2362)
Co-authored-by: Iwan Kawrakow <[email protected]>
1 parent 84e09a7 commit 42f70cb

File tree

1 file changed

+2
-3
lines changed

1 file changed

+2
-3
lines changed

k_quants.c

Lines changed: 2 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -3297,8 +3297,7 @@ void ggml_vec_dot_q5_K_q8_K(const int n, float * restrict s, const void * restri
3297 3297
3298 3298   #else
3299 3299
3300      -
3301      - uint8_t aux8[QK_K];
     3300 + int8_t aux8[QK_K];
3302 3301   int16_t aux16[16];
3303 3302   float sums [8];
3304 3303   memset(sums, 0, 8*sizeof(float));
@@ -3308,7 +3307,7 @@ void ggml_vec_dot_q5_K_q8_K(const int n, float * restrict s, const void * restri
3308 3307   const uint8_t * restrict q4 = x[i].qs;
3309 3308   const uint8_t * restrict hm = x[i].qh;
3310 3309   const int8_t * restrict q8 = y[i].qs;
3311      - uint8_t * restrict a = aux8;
     3310 + int8_t * restrict a = aux8;
3312 3311   for (int l = 0; l < 32; ++l) {
3313 3312   a[l+ 0] = q4[l] & 0xF;
3314 3313   a[l+32] = q4[l] >> 4;

0 commit comments

Comments
 (0)