Skip to content

Commit d43da7e

Browse files
committed
rename AppendExtraBoolArg
1 parent d678b26 commit d43da7e

File tree

1 file changed

+7
-5
lines changed

1 file changed

+7
-5
lines changed

clang/lib/CodeGen/CGBuiltin.cpp

Lines changed: 7 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -18330,8 +18330,10 @@ Value *CodeGenFunction::EmitAMDGPUBuiltinExpr(unsigned BuiltinID,
1833018330
// D = A * B + C
1833118331
// We need to specify one type for matrices AB and one for matrices CD.
1833218332
SmallVector<unsigned, 2> ArgsForMatchingMatrixTypes;
18333-
// Some intrinsics expect "false" as an extra bool argument.
18334-
bool AppendExtraBoolArg = false;
18333+
// On GFX12, the intrinsics with 16-bit accumulator use a packed layout.
18334+
// There is no need for the variable opsel argument, so always set it to
18335+
// "false".
18336+
bool AppendFalseForOpselArg = false;
1833518337
unsigned BuiltinWMMAOp;
1833618338

1833718339
switch (BuiltinID) {
@@ -18351,7 +18353,7 @@ Value *CodeGenFunction::EmitAMDGPUBuiltinExpr(unsigned BuiltinID,
1835118353
break;
1835218354
case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_w32_gfx12:
1835318355
case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_w64_gfx12:
18354-
AppendExtraBoolArg = true;
18356+
AppendFalseForOpselArg = true;
1835518357
LLVM_FALLTHROUGH;
1835618358
case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_w32:
1835718359
case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_w64:
@@ -18360,7 +18362,7 @@ Value *CodeGenFunction::EmitAMDGPUBuiltinExpr(unsigned BuiltinID,
1836018362
break;
1836118363
case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_w32_gfx12:
1836218364
case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_w64_gfx12:
18363-
AppendExtraBoolArg = true;
18365+
AppendFalseForOpselArg = true;
1836418366
LLVM_FALLTHROUGH;
1836518367
case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_w32:
1836618368
case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_w64:
@@ -18476,7 +18478,7 @@ Value *CodeGenFunction::EmitAMDGPUBuiltinExpr(unsigned BuiltinID,
1847618478
SmallVector<Value *, 6> Args;
1847718479
for (int i = 0, e = E->getNumArgs(); i != e; ++i)
1847818480
Args.push_back(EmitScalarExpr(E->getArg(i)));
18479-
if (AppendExtraBoolArg)
18481+
if (AppendFalseForOpselArg)
1848018482
Args.push_back(Builder.getFalse());
1848118483

1848218484
SmallVector<llvm::Type *, 6> ArgTypes;

0 commit comments

Comments
 (0)