Skip to content

Commit b389842

Browse files
small change
1 parent 393eae0 commit b389842

File tree

1 file changed

+6
-6
lines changed

1 file changed

+6
-6
lines changed

ggml-cuda.cu

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -1416,14 +1416,14 @@ static __device__ __forceinline__ float vec_dot_q2_K_q8_1(
14161416
for (int i = 0; i < 4; ++i) {
14171417
const int sc = bq2_K->scales[iqs - iqs%8 + (iqs%8) / 4 + 2*i];
14181418

1419-
const int vii = (vi >> (2*i)) & 0x03030303;
1420-
14211419
const block_q8_1 * bq8i = bq8_1 + bq8_offset + i;
1422-
const float d8 = bq8i->d;
1423-
const int qs8 = *((int*) &bq8i->qs[4*(iqs%8)]);
1420+
const float d8i = bq8i->d;
1421+
1422+
const int vii = (vi >> (2*i)) & 0x03030303;
1423+
const int uii = *((int*) &bq8i->qs[4 * (iqs%8)]);
14241424

1425-
sumf_d += d8 * __dp4a(vii, qs8, 0) * (sc & 0xF);
1426-
sumf_m += d8 * __dp4a(0x01010101, qs8, 0) * (sc >> 4);
1425+
sumf_d += d8i * __dp4a(vii, uii, 0) * (sc & 0xF);
1426+
sumf_m += d8i * __dp4a(0x01010101, uii, 0) * (sc >> 4);
14271427
}
14281428

14291429

0 commit comments

Comments
 (0)