@@ -788,7 +788,7 @@ static void quantize_row_q4_0(const float * restrict x, void * restrict vy, int
788
788
MAX (wasm_f32x4_extract_lane (amaxv [0 ], 2 ), wasm_f32x4_extract_lane (amaxv [0 ], 3 )));
789
789
790
790
const float d = amax / ((1 << 3 ) - 1 );
791
- const float id = d ? 1.0 /d : 0.0 ;
791
+ const float id = d ? 1.0f /d : 0.0f ;
792
792
793
793
y [i ].d = d ;
794
794
@@ -2087,18 +2087,18 @@ static void ggml_vec_dot_q4_0(const int n, float * restrict s, const void * rest
2087
2087
float sum1 = 0.0f ;
2088
2088
2089
2089
for (int i = 0 ; i < nb ; i += 2 ) {
2090
- const block_q4_0 * restrict x0 = & px [i + 0 ];
2091
- const block_q4_0 * restrict y0 = & py [i + 0 ];
2092
- const block_q4_0 * restrict x1 = & px [i + 1 ];
2093
- const block_q4_0 * restrict y1 = & py [i + 1 ];
2090
+ const block_q4_0 * restrict x0 = & x [i + 0 ];
2091
+ const block_q4_0 * restrict y0 = & y [i + 0 ];
2092
+ const block_q4_0 * restrict x1 = & x [i + 1 ];
2093
+ const block_q4_0 * restrict y1 = & y [i + 1 ];
2094
2094
2095
2095
const v128_t m4b = wasm_u8x16_splat (0xf );
2096
2096
const v128_t s8b = wasm_i8x16_splat (0x8 );
2097
2097
2098
- const v128_t v0_0 = wasm_v128_load (x0 . qs );
2099
- const v128_t v0_1 = wasm_v128_load (y0 . qs );
2100
- const v128_t v1_0 = wasm_v128_load (x1 . qs );
2101
- const v128_t v1_1 = wasm_v128_load (y1 . qs );
2098
+ const v128_t v0_0 = wasm_v128_load (x0 -> qs );
2099
+ const v128_t v0_1 = wasm_v128_load (y0 -> qs );
2100
+ const v128_t v1_0 = wasm_v128_load (x1 -> qs );
2101
+ const v128_t v1_1 = wasm_v128_load (y1 -> qs );
2102
2102
2103
2103
// 4-bit -> 8-bit
2104
2104
const v128_t v0_0l = wasm_v128_and (v0_0 , m4b );
0 commit comments