@@ -167,58 +167,58 @@ static_assert(sizeof(block_q8_K) == sizeof(float) + QK_K + QK_K/16*sizeof(int16_
167
167
168
168
169
169
// Quantization
170
- void quantize_row_q4_0_reference (const float * restrict x , block_q4_0 * restrict y , int k );
171
- void quantize_row_q4_1_reference (const float * restrict x , block_q4_1 * restrict y , int k );
172
- void quantize_row_q5_0_reference (const float * restrict x , block_q5_0 * restrict y , int k );
173
- void quantize_row_q5_1_reference (const float * restrict x , block_q5_1 * restrict y , int k );
174
- void quantize_row_q8_0_reference (const float * restrict x , block_q8_0 * restrict y , int k );
175
- void quantize_row_q8_1_reference (const float * restrict x , block_q8_1 * restrict y , int k );
176
-
177
- void quantize_row_q2_K_reference (const float * restrict x , block_q2_K * restrict y , int k );
178
- void quantize_row_q3_K_reference (const float * restrict x , block_q3_K * restrict y , int k );
179
- void quantize_row_q4_K_reference (const float * restrict x , block_q4_K * restrict y , int k );
180
- void quantize_row_q5_K_reference (const float * restrict x , block_q5_K * restrict y , int k );
181
- void quantize_row_q6_K_reference (const float * restrict x , block_q6_K * restrict y , int k );
182
- void quantize_row_q8_K_reference (const float * restrict x , block_q8_K * restrict y , int k );
183
-
184
- void quantize_row_q4_0 (const float * restrict x , void * restrict y , int k );
185
- void quantize_row_q4_1 (const float * restrict x , void * restrict y , int k );
186
- void quantize_row_q5_0 (const float * restrict x , void * restrict y , int k );
187
- void quantize_row_q5_1 (const float * restrict x , void * restrict y , int k );
188
- void quantize_row_q8_0 (const float * restrict x , void * restrict y , int k );
189
- void quantize_row_q8_1 (const float * restrict x , void * restrict y , int k );
190
-
191
- void quantize_row_q2_K (const float * restrict x , void * restrict y , int k );
192
- void quantize_row_q3_K (const float * restrict x , void * restrict y , int k );
193
- void quantize_row_q4_K (const float * restrict x , void * restrict y , int k );
194
- void quantize_row_q5_K (const float * restrict x , void * restrict y , int k );
195
- void quantize_row_q6_K (const float * restrict x , void * restrict y , int k );
196
- void quantize_row_q8_K (const float * restrict x , void * restrict y , int k );
170
+ void quantize_row_q4_0_reference (const float * __restrict__ x , block_q4_0 * __restrict__ y , int k );
171
+ void quantize_row_q4_1_reference (const float * __restrict__ x , block_q4_1 * __restrict__ y , int k );
172
+ void quantize_row_q5_0_reference (const float * __restrict__ x , block_q5_0 * __restrict__ y , int k );
173
+ void quantize_row_q5_1_reference (const float * __restrict__ x , block_q5_1 * __restrict__ y , int k );
174
+ void quantize_row_q8_0_reference (const float * __restrict__ x , block_q8_0 * __restrict__ y , int k );
175
+ void quantize_row_q8_1_reference (const float * __restrict__ x , block_q8_1 * __restrict__ y , int k );
176
+
177
+ void quantize_row_q2_K_reference (const float * __restrict__ x , block_q2_K * __restrict__ y , int k );
178
+ void quantize_row_q3_K_reference (const float * __restrict__ x , block_q3_K * __restrict__ y , int k );
179
+ void quantize_row_q4_K_reference (const float * __restrict__ x , block_q4_K * __restrict__ y , int k );
180
+ void quantize_row_q5_K_reference (const float * __restrict__ x , block_q5_K * __restrict__ y , int k );
181
+ void quantize_row_q6_K_reference (const float * __restrict__ x , block_q6_K * __restrict__ y , int k );
182
+ void quantize_row_q8_K_reference (const float * __restrict__ x , block_q8_K * __restrict__ y , int k );
183
+
184
+ void quantize_row_q4_0 (const float * __restrict__ x , void * __restrict__ y , int k );
185
+ void quantize_row_q4_1 (const float * __restrict__ x , void * __restrict__ y , int k );
186
+ void quantize_row_q5_0 (const float * __restrict__ x , void * __restrict__ y , int k );
187
+ void quantize_row_q5_1 (const float * __restrict__ x , void * __restrict__ y , int k );
188
+ void quantize_row_q8_0 (const float * __restrict__ x , void * __restrict__ y , int k );
189
+ void quantize_row_q8_1 (const float * __restrict__ x , void * __restrict__ y , int k );
190
+
191
+ void quantize_row_q2_K (const float * __restrict__ x , void * __restrict__ y , int k );
192
+ void quantize_row_q3_K (const float * __restrict__ x , void * __restrict__ y , int k );
193
+ void quantize_row_q4_K (const float * __restrict__ x , void * __restrict__ y , int k );
194
+ void quantize_row_q5_K (const float * __restrict__ x , void * __restrict__ y , int k );
195
+ void quantize_row_q6_K (const float * __restrict__ x , void * __restrict__ y , int k );
196
+ void quantize_row_q8_K (const float * __restrict__ x , void * __restrict__ y , int k );
197
197
198
198
// Dequantization
199
- void dequantize_row_q4_0 (const block_q4_0 * restrict x , float * restrict y , int k );
200
- void dequantize_row_q4_1 (const block_q4_1 * restrict x , float * restrict y , int k );
201
- void dequantize_row_q5_0 (const block_q5_0 * restrict x , float * restrict y , int k );
202
- void dequantize_row_q5_1 (const block_q5_1 * restrict x , float * restrict y , int k );
203
- void dequantize_row_q8_0 (const block_q8_0 * restrict x , float * restrict y , int k );
204
- //void dequantize_row_q8_1(const block_q8_1 * restrict x, float * restrict y, int k);
205
-
206
- void dequantize_row_q2_K (const block_q2_K * restrict x , float * restrict y , int k );
207
- void dequantize_row_q3_K (const block_q3_K * restrict x , float * restrict y , int k );
208
- void dequantize_row_q4_K (const block_q4_K * restrict x , float * restrict y , int k );
209
- void dequantize_row_q5_K (const block_q5_K * restrict x , float * restrict y , int k );
210
- void dequantize_row_q6_K (const block_q6_K * restrict x , float * restrict y , int k );
211
- void dequantize_row_q8_K (const block_q8_K * restrict x , float * restrict y , int k );
199
+ void dequantize_row_q4_0 (const block_q4_0 * __restrict__ x , float * __restrict__ y , int k );
200
+ void dequantize_row_q4_1 (const block_q4_1 * __restrict__ x , float * __restrict__ y , int k );
201
+ void dequantize_row_q5_0 (const block_q5_0 * __restrict__ x , float * __restrict__ y , int k );
202
+ void dequantize_row_q5_1 (const block_q5_1 * __restrict__ x , float * __restrict__ y , int k );
203
+ void dequantize_row_q8_0 (const block_q8_0 * __restrict__ x , float * __restrict__ y , int k );
204
+ //void dequantize_row_q8_1(const block_q8_1 * __restrict__ x, float * __restrict__ y, int k);
205
+
206
+ void dequantize_row_q2_K (const block_q2_K * __restrict__ x , float * __restrict__ y , int k );
207
+ void dequantize_row_q3_K (const block_q3_K * __restrict__ x , float * __restrict__ y , int k );
208
+ void dequantize_row_q4_K (const block_q4_K * __restrict__ x , float * __restrict__ y , int k );
209
+ void dequantize_row_q5_K (const block_q5_K * __restrict__ x , float * __restrict__ y , int k );
210
+ void dequantize_row_q6_K (const block_q6_K * __restrict__ x , float * __restrict__ y , int k );
211
+ void dequantize_row_q8_K (const block_q8_K * __restrict__ x , float * __restrict__ y , int k );
212
212
213
213
// Dot product
214
- void ggml_vec_dot_q4_0_q8_0 (int n , float * restrict s , const void * restrict vx , const void * restrict vy );
215
- void ggml_vec_dot_q4_1_q8_1 (int n , float * restrict s , const void * restrict vx , const void * restrict vy );
216
- void ggml_vec_dot_q5_0_q8_0 (int n , float * restrict s , const void * restrict vx , const void * restrict vy );
217
- void ggml_vec_dot_q5_1_q8_1 (int n , float * restrict s , const void * restrict vx , const void * restrict vy );
218
- void ggml_vec_dot_q8_0_q8_0 (int n , float * restrict s , const void * restrict vx , const void * restrict vy );
219
-
220
- void ggml_vec_dot_q2_K_q8_K (int n , float * restrict s , const void * restrict vx , const void * restrict vy );
221
- void ggml_vec_dot_q3_K_q8_K (int n , float * restrict s , const void * restrict vx , const void * restrict vy );
222
- void ggml_vec_dot_q4_K_q8_K (int n , float * restrict s , const void * restrict vx , const void * restrict vy );
223
- void ggml_vec_dot_q5_K_q8_K (int n , float * restrict s , const void * restrict vx , const void * restrict vy );
224
- void ggml_vec_dot_q6_K_q8_K (int n , float * restrict s , const void * restrict vx , const void * restrict vy );
214
+ void ggml_vec_dot_q4_0_q8_0 (int n , float * __restrict__ s , const void * __restrict__ vx , const void * __restrict__ vy );
215
+ void ggml_vec_dot_q4_1_q8_1 (int n , float * __restrict__ s , const void * __restrict__ vx , const void * __restrict__ vy );
216
+ void ggml_vec_dot_q5_0_q8_0 (int n , float * __restrict__ s , const void * __restrict__ vx , const void * __restrict__ vy );
217
+ void ggml_vec_dot_q5_1_q8_1 (int n , float * __restrict__ s , const void * __restrict__ vx , const void * __restrict__ vy );
218
+ void ggml_vec_dot_q8_0_q8_0 (int n , float * __restrict__ s , const void * __restrict__ vx , const void * __restrict__ vy );
219
+
220
+ void ggml_vec_dot_q2_K_q8_K (int n , float * __restrict__ s , const void * __restrict__ vx , const void * __restrict__ vy );
221
+ void ggml_vec_dot_q3_K_q8_K (int n , float * __restrict__ s , const void * __restrict__ vx , const void * __restrict__ vy );
222
+ void ggml_vec_dot_q4_K_q8_K (int n , float * __restrict__ s , const void * __restrict__ vx , const void * __restrict__ vy );
223
+ void ggml_vec_dot_q5_K_q8_K (int n , float * __restrict__ s , const void * __restrict__ vx , const void * __restrict__ vy );
224
+ void ggml_vec_dot_q6_K_q8_K (int n , float * __restrict__ s , const void * __restrict__ vx , const void * __restrict__ vy );
0 commit comments