Skip to content

Commit 7efca48

Browse files
jerrymannil authored and pruthvistony committed
Add new kernel config for AMD GPUs
1 parent e005ace commit 7efca48

File tree

1 file changed

+2
-0
lines changed

1 file changed

+2
-0
lines changed

torch/_inductor/kernel/mm_common.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -137,6 +137,7 @@ def filtered_configs(
137137
{"config": (128, 64, 32, 4, 8), "cond": True},
138138
{"config": (128, 128, 32, 2, 8), "cond": True},
139139
{"config": (128, 128, 32, 3, 4), "cond": True},
140+
{"config": (128, 128, 64, 2, 8), "cond": torch.version.hip is not None},
140141
{"config": (128, 128, 64, 3, 4), "cond": True},
141142
{"config": (128, 128, 64, 5, 8), "cond": True},
142143
]
@@ -184,6 +185,7 @@ def filtered_configs(
184185
# {"config": (32, 32, 16, 1, 2), "cond": True},
185186
{"config": (128, 256, 128, 3, 8), "cond": torch.version.hip is None},
186187
{"config": (256, 128, 128, 3, 8), "cond": torch.version.hip is None},
188+
{"config": (128, 128, 64, 2, 8), "cond": torch.version.hip is not None},
187189
]
188190

189191
# Mixed precision kernel configs for small sizes of m for mm's like (16, 8192) x (8192, 8192).

0 commit comments

Comments
 (0)