Skip to content

Commit d4ba722

Browse files
committed
Optimize soft_max
1 parent 14ea4fa commit d4ba722

File tree

1 file changed

+3
-2
lines changed

1 file changed

+3
-2
lines changed

ggml/src/ggml-vulkan/ggml-vulkan.cpp

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1428,8 +1428,9 @@ static bool ggml_vk_matmul_shmem_support(const vk_device& device, const std::vec
1428 1428
// Inner map: key is pipeline name; value is the subgroup size.
1429 1429
static std::unordered_map<std::string, std::unordered_map<std::string, uint32_t>> gpu_pipeline_config = {
1430 1430
{"RX 5700", {
1431-
{"im2col_f32", 64},
1432-
{"im2col_f32_f16", 64}
1431+
{"soft_max_f32", 64}, {"soft_max_f32_wg512", 64},
1432+
{"soft_max_f32_f16", 64}, {"soft_max_f32_f16_wg512", 64},
1433+
{"im2col_f32", 64}, {"im2col_f32_f16", 64},
1433 1434
}}
1434 1435
};
1435 1436

0 commit comments

Comments (0)