Skip to content

Commit 50b43c5

Browse files
ggerganov authored and jordankanter committed
ggml : fix vld1q_s8_x4 32-bit compat (ggml-org#4828)
* ggml : fix vld1q_s8_x4 32-bit compat
  ggml-ci
* ggml : fix 32-bit ARM compat (cont)
  ggml-ci
1 parent bdfb181 commit 50b43c5

File tree

1 file changed

+4
-4
lines changed

1 file changed

+4
-4
lines changed

ggml-quants.c

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -7250,9 +7250,9 @@ void ggml_vec_dot_iq2_xxs_q8_K(const int n, float * restrict s, const void * res
72507250
uint32_t aux32[4];
72517251
const uint8_t * aux8 = (const uint8_t *)aux32;
72527252

7253-
int8x16x4_t q2u;
7254-
int8x16x4_t q2s;
7255-
int8x16x4_t q8b;
7253+
ggml_int8x16x4_t q2u;
7254+
ggml_int8x16x4_t q2s;
7255+
ggml_int8x16x4_t q8b;
72567256

72577257
float sumf = 0;
72587258
for (int i = 0; i < nb; ++i) {
@@ -7261,7 +7261,7 @@ void ggml_vec_dot_iq2_xxs_q8_K(const int n, float * restrict s, const void * res
72617261
const int8_t * restrict q8 = y[i].qs;
72627262
float sumf1 = 0, sumf2 = 0;
72637263
for (int ib32 = 0; ib32 < QK_K/32; ib32 += 2) {
7264-
q8b = vld1q_s8_x4(q8); q8 += 64;
7264+
q8b = ggml_vld1q_s8_x4(q8); q8 += 64;
72657265
memcpy(aux32, q2, 4*sizeof(uint32_t)); q2 += 8;
72667266
q2u.val[0] = vcombine_s8(vld1_s8((const void *)(iq2xxs_grid + aux8[ 0])), vld1_s8((const void *)(iq2xxs_grid + aux8[ 1])));
72677267
q2u.val[1] = vcombine_s8(vld1_s8((const void *)(iq2xxs_grid + aux8[ 2])), vld1_s8((const void *)(iq2xxs_grid + aux8[ 3])));

0 commit comments

Comments
 (0)