File tree Expand file tree Collapse file tree 1 file changed +4
-5
lines changed Expand file tree Collapse file tree 1 file changed +4
-5
lines changed Original file line number Diff line number Diff line change @@ -1400,7 +1400,7 @@ static __device__ __forceinline__ float vec_dot_q8_0_q8_1(const void * __restric
1400
1400
static __device__ __forceinline__ float vec_dot_q2_K_q8_1 (
1401
1401
const void * __restrict__ vbq, const block_q8_1 * __restrict__ bq8_1, const int iqs) {
1402
1402
1403
- // #if __CUDA_ARCH__ >= 600 // lowest compute capability for integer intrinsics
1403
+ #if __CUDA_ARCH__ >= 600 // lowest compute capability for integer intrinsics
1404
1404
const block_q2_K * bq2_K = (const block_q2_K *) vbq;
1405
1405
1406
1406
const int bq8_offset = 4 * (iqs/8 );
@@ -1426,11 +1426,10 @@ static __device__ __forceinline__ float vec_dot_q2_K_q8_1(
1426
1426
sumf_m += d8i * (__dp4a (0x01010101 , uii, 0 ) * (sc >> 4 ));
1427
1427
}
1428
1428
1429
-
1430
1429
return d*sumf_d - dmin*sumf_m;
1431
- // #else
1432
- // return 0.0f; // only to satisfy the compiler
1433
- // #endif // __CUDA_ARCH__ >= 600
1430
+ #else
1431
+ return 0.0f; // only to satisfy the compiler
1432
+ #endif // __CUDA_ARCH__ >= 600
1434
1433
}
1435
1434
1436
1435
template <int qk, int qi, typename block_q_t , vec_dot_q_cuda_t vec_dot_q_cuda>
You can’t perform that action at this time.
0 commit comments