Skip to content

Commit 4c72ab1

Browse files
committed
metal : use mm kernels for batch size > 2
1 parent e946379 commit 4c72ab1

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

ggml-metal.m

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -958,7 +958,7 @@ void ggml_metal_graph_compute(
958 958   src1t == GGML_TYPE_F32 &&
959 959   [ctx->device supportsFamily:MTLGPUFamilyApple7] &&
960 960   ne00%32 == 0 &&
961     - ne11 > 1) {
    961 + ne11 > 2) {
962 962   switch (src0->type) {
963 963   case GGML_TYPE_F32: [encoder setComputePipelineState:ctx->pipeline_mul_mm_f32_f32]; break;
964 964   case GGML_TYPE_F16: [encoder setComputePipelineState:ctx->pipeline_mul_mm_f16_f32]; break;

0 commit comments

Comments
 (0)