Skip to content

Commit cefda3a

Browse files
jerrymannil authored and dnikolaev-amd committed
Add new kernel config for AMD GPUs
1 parent 31b3681 commit cefda3a

File tree

1 file changed

+2
-0
lines changed

1 file changed

+2
-0
lines changed

torch/_inductor/kernel/mm_common.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -136,6 +136,7 @@ def filtered_configs(
136 136
{"config": (128, 64, 32, 4, 8), "cond": True},
137 137
{"config": (128, 128, 32, 2, 8), "cond": True},
138 138
{"config": (128, 128, 32, 3, 4), "cond": True},
    139 +
{"config": (128, 128, 64, 2, 8), "cond": torch.version.hip is not None},
139 140
{"config": (128, 128, 64, 3, 4), "cond": True},
140 141
{"config": (128, 128, 64, 5, 8), "cond": True},
141 142
]
@@ -165,6 +166,7 @@ def filtered_configs(
165 166
# {"config": (32, 32, 16, 1, 2), "cond": True},
166 167
{"config": (128, 256, 128, 3, 8), "cond": torch.version.hip is None},
167 168
{"config": (256, 128, 128, 3, 8), "cond": torch.version.hip is None},
    169 +
{"config": (128, 128, 64, 2, 8), "cond": torch.version.hip is not None},
168 170
]
169 171

170 172
# Mixed precision kernel configs for small sizes of m for mm's like (16, 8192) x (8192, 8192).

0 commit comments

Comments
 (0)