Skip to content

Commit 1861a36

Browse files
Fixed q2_k compute arch
1 parent 6f2ea98 commit 1861a36

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

ggml-cuda.cu

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1400,7 +1400,7 @@ static __device__ __forceinline__ float vec_dot_q8_0_q8_1(const void * __restric
1400 1400
static __device__ __forceinline__ float vec_dot_q2_K_q8_1(
1401 1401
const void * __restrict__ vbq, const block_q8_1 * __restrict__ bq8_1, const int iqs) {
1402 1402

1403-
#if __CUDA_ARCH__ >= 600 // lowest compute capability for integer intrinsics
1403+
#if __CUDA_ARCH__ >= 610 // lowest compute capability for integer intrinsics
1404 1404
const block_q2_K * bq2_K = (const block_q2_K *) vbq;
1405 1405

1406 1406
const int bq8_offset = 4 * (iqs/8);
@@ -1429,7 +1429,7 @@ static __device__ __forceinline__ float vec_dot_q2_K_q8_1(
1429 1429
return d*sumf_d - dmin*sumf_m;
1430 1430
#else
1431 1431
return 0.0f; // only to satisfy the compiler
1432-
#endif // __CUDA_ARCH__ >= 600
1432+
#endif // __CUDA_ARCH__ >= 610
1433 1433
}
1434 1434

1435 1435
template <int qk, int qi, typename block_q_t, vec_dot_q_cuda_t vec_dot_q_cuda>

0 commit comments

Comments
 (0)