File tree Expand file tree Collapse file tree 2 files changed +4
-6
lines changed
ggml/src/ggml-vulkan/vulkan-shaders Expand file tree Collapse file tree 2 files changed +4
-6
lines changed Original file line number Diff line number Diff line change @@ -234,9 +234,9 @@ void main() {
234
234
#endif
235
235
236
236
#if QUANT_AUXF == 1
237
- FLOAT_TYPE cache_a_dm[TM];
237
+ FLOAT_TYPE cache_a_dm[WMITER * TM];
238
238
#else
239
- FLOAT_TYPE_VEC2 cache_a_dm[TM];
239
+ FLOAT_TYPE_VEC2 cache_a_dm[WMITER * TM];
240
240
#endif
241
241
242
242
FLOAT_TYPE_VEC2 cache_b_ds[TN];
@@ -247,7 +247,6 @@ void main() {
247
247
const uint iqs = loadr_a;
248
248
const uint buf_ib = loadc_a + l;
249
249
250
- // Should ds be gated to a single thread?
251
250
if (iqs == 0) {
252
251
#if QUANT_AUXF == 1
253
252
buf_a_dm[buf_ib] = get_d(ib);
@@ -276,7 +275,6 @@ void main() {
276
275
277
276
const uint buf_ib = loadc_b + l;
278
277
279
- // Should ds be gated to a single thread?
280
278
if (iqs == 0) {
281
279
buf_b_ds[buf_ib] = FLOAT_TYPE_VEC2(data_b[ib].ds);
282
280
}
Original file line number Diff line number Diff line change @@ -17,7 +17,7 @@ i32vec2 repack(uint ib, uint iqs) {
17
17
}
18
18
19
19
ACC_TYPE mul_q8_1(int32_t q_sum, float da, vec2 dsb) {
20
- return ACC_TYPE(da * (float(q_sum) * dsb.x - 8.0 * dsb.y));
20
+ return ACC_TYPE(da * (float(q_sum) * dsb.x - 8.0f * dsb.y));
21
21
}
22
22
#endif
23
23
@@ -51,7 +51,7 @@ i32vec2 repack(uint ib, uint iqs) {
51
51
}
52
52
53
53
ACC_TYPE mul_q8_1(int32_t q_sum, float da, vec2 dsb) {
54
- return ACC_TYPE(da * (float(q_sum) * dsb.x - 16.0 * dsb.y));
54
+ return ACC_TYPE(da * (float(q_sum) * dsb.x - 16.0f * dsb.y));
55
55
}
56
56
#endif
57
57
You can’t perform that action at this time.
0 commit comments