Skip to content

Commit c01ccf8

Browse files
committed
little stuff
1 parent d70a731 commit c01ccf8

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

ggml/src/ggml-vulkan/vulkan-shaders/mul_mat_vec_q3_k.comp

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -5,7 +5,7 @@
 5  5
 6  6   layout(local_size_x_id = 0, local_size_y = 1, local_size_z = 1) in;
 7  7
 8    - shared FLOAT_TYPE sccache[BLOCK_SIZE/16][2][12];
    8 + shared FLOAT_TYPE sccache[BLOCK_SIZE/16][2][8];
 9  9
10 10   void compute_outputs(const uint32_t first_row, const uint32_t num_rows) {
11 11   uint a_offset, b_offset, d_offset;
@@ -44,7 +44,7 @@ void compute_outputs(const uint32_t first_row, const uint32_t num_rows) {
44 44   const uint ib0 = a_offset / QUANT_K + (first_row+n)*num_blocks_per_row;
45 45   const FLOAT_TYPE d = FLOAT_TYPE(data_a[ib0 + i].d);
46 46
47    - sccache[ix][v_im][itid8] = FLOAT_TYPE(int8_t(((int8_t(data_a[ib0+i].scales[itid8]) >> 4*v_im) & 0xF) | ((int8_t(data_a[ib0+i].scales[itid%4+8]) >> (4*v_im + 2*(itid8/4)) & 0x3) << 4)) - 32);
   47 + sccache[ix][v_im][itid8] = FLOAT_TYPE(int8_t(((int8_t(data_a[ib0+i].scales[itid8]) >> 4*v_im) & 0xF) | ((int8_t(data_a[ib0+i].scales[itid8%4+8]) >> (4*v_im + 2*(itid8/4)) & 0x3) << 4)) - 32);
48 48   barrier();
49 49
50 50   [[unroll]] for (uint j = 0; j < NUM_COLS; ++j) {

0 commit comments

Comments (0)