Skip to content

Commit 09b203c

Browse files
slaren authored and tybalex committed
cuda : fix LLAMA_CUDA_F16 build (ggml-org#6197)
1 parent 904d82e commit 09b203c

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

ggml-cuda.cu

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -9453,7 +9453,7 @@ static void ggml_cuda_op_dequantize_mul_mat_vec(
9453 9453
9454 9454   // on some GPUs it is faster to convert src1 to half and to use half precision intrinsics
9455 9455   #ifdef GGML_CUDA_F16
9456      - cuda_pool_alloc<half> src1_dfloat_a;
     9456 + ggml_cuda_pool_alloc<half> src1_dfloat_a(ctx.pool());
9457 9457   half * src1_dfloat = nullptr; // dfloat == half
9458 9458
9459 9459   bool src1_convert_f16 =

0 commit comments

Comments
 (0)