Skip to content

Commit 153bb26

Browse files
committed
Use warp_size instead of WARP_SIZE
1 parent 071b282 commit 153bb26

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

ggml/src/ggml-cuda/fattn.cu

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -293,7 +293,7 @@ void ggml_cuda_flash_attn_ext(ggml_backend_cuda_context & ctx, ggml_tensor * dst
293 293   return;
294 294   }
295 295
296     - if (Q->ne[1] == 1 && Q->ne[0] % (2*WARP_SIZE) == 0) {
    296 + if (Q->ne[1] == 1 && Q->ne[0] % (2*warp_size) == 0) {
297 297   if (prec == GGML_PREC_DEFAULT) {
298 298   ggml_cuda_flash_attn_ext_vec_f16(ctx, dst);
299 299   return;

0 commit comments

Comments
 (0)