[mlir][rocdl] Add AMDGPU-specific `cf.assert` lowering #121067

makslevental · 2024-12-24T20:31:33Z

This commit adds an AMD-specific lowering of cf.assert to llvm.intr.trap. It depends on (and is therefore merging into) #120431.

Note, the reason for lowering to llvm.intr.trap instead of __assertfail / __assert_fail is because these are header only functions in HIP.

Note also, this currently doesn't work with runtime=OpenCL because the gpu.printf isn't legalized on that path (ever? adjacent printf.mlir doesn't lower for OpenCL either...).

cc @danzimm @SamGinzburg

llvmbot · 2024-12-24T20:32:08Z

@llvm/pr-subscribers-mlir-gpu

@llvm/pr-subscribers-mlir

Author: Maksim Levental (makslevental)

Changes

This commit adds an AMD-specific lowering of cf.assert to llvm.intr.trap. It depends on (and is therefore merging into) #120431.

Note, the reason for lowering to llvm.intr.trap instead of __assertfail / __assert_fail is because these are header only functions in HIP.

Full diff: https://github.com/llvm/llvm-project/pull/121067.diff

2 Files Affected:

(modified) mlir/lib/Conversion/GPUToROCDL/LowerGpuOpsToROCDLOps.cpp (+71-1)
(added) mlir/test/Integration/GPU/ROCM/assert.mlir (+37)

diff --git a/mlir/lib/Conversion/GPUToROCDL/LowerGpuOpsToROCDLOps.cpp b/mlir/lib/Conversion/GPUToROCDL/LowerGpuOpsToROCDLOps.cpp
index aaf00e51f49416..2b0d16a5defb1f 100644
--- a/mlir/lib/Conversion/GPUToROCDL/LowerGpuOpsToROCDLOps.cpp
+++ b/mlir/lib/Conversion/GPUToROCDL/LowerGpuOpsToROCDLOps.cpp
@@ -31,6 +31,7 @@
 #include "mlir/Conversion/MemRefToLLVM/MemRefToLLVM.h"
 #include "mlir/Conversion/VectorToLLVM/ConvertVectorToLLVM.h"
 #include "mlir/Dialect/ControlFlow/IR/ControlFlow.h"
+#include "mlir/Dialect/ControlFlow/IR/ControlFlowOps.h"
 #include "mlir/Dialect/Func/IR/FuncOps.h"
 #include "mlir/Dialect/GPU/IR/GPUDialect.h"
 #include "mlir/Dialect/GPU/Transforms/Passes.h"
@@ -195,6 +196,75 @@ struct GPUShuffleOpLowering : public ConvertOpToLLVMPattern<gpu::ShuffleOp> {
   }
 };
 
+/// Based on
+/// mlir/lib/Conversion/GPUToNVVM/LowerGpuOpsToNVVMOps.cpp#AssertOpToAssertfailLowering
+/// Lowering of cf.assert into a conditional llvm.intr.trap plus gpu.printf with
+/// the metadata (filename, fileline, assert msg).
+struct AssertOpToBuiltinTrapLowering
+    : public ConvertOpToLLVMPattern<cf::AssertOp> {
+  using ConvertOpToLLVMPattern<cf::AssertOp>::ConvertOpToLLVMPattern;
+
+  LogicalResult
+  matchAndRewrite(cf::AssertOp assertOp, cf::AssertOpAdaptor adaptor,
+                  ConversionPatternRewriter &rewriter) const override {
+    Location loc = assertOp.getLoc();
+
+    // Split blocks and insert conditional branch.
+    // ^before:
+    //   ...
+    //   cf.cond_br %condition, ^after, ^assert
+    // ^assert:
+    //   cf.assert
+    //   cf.br ^after
+    // ^after:
+    //   ...
+    Block *beforeBlock = assertOp->getBlock();
+    Block *assertBlock =
+        rewriter.splitBlock(beforeBlock, assertOp->getIterator());
+    Block *afterBlock =
+        rewriter.splitBlock(assertBlock, ++assertOp->getIterator());
+    rewriter.setInsertionPointToEnd(beforeBlock);
+    rewriter.create<cf::CondBranchOp>(loc, adaptor.getArg(), afterBlock,
+                                      assertBlock);
+    rewriter.setInsertionPointToEnd(assertBlock);
+    rewriter.create<cf::BranchOp>(loc, afterBlock);
+
+    // Continue cf.assert lowering.
+    rewriter.setInsertionPoint(assertOp);
+
+    // Populate file name, file number and function name from the location of
+    // the AssertOp.
+    StringRef fileName = "(unknown)";
+    StringRef funcName = "(unknown)";
+    int32_t fileLine = 0;
+    if (auto fileLineColLoc = dyn_cast<FileLineColRange>(loc)) {
+      fileName = fileLineColLoc.getFilename().strref();
+      fileLine = fileLineColLoc.getStartLine();
+    } else if (auto nameLoc = dyn_cast<NameLoc>(loc)) {
+      funcName = nameLoc.getName().strref();
+      if (auto fileLineColLoc =
+              dyn_cast<FileLineColRange>(nameLoc.getChildLoc())) {
+        fileName = fileLineColLoc.getFilename().strref();
+        fileLine = fileLineColLoc.getStartLine();
+      }
+    }
+
+    Value assertLine =
+        rewriter.create<LLVM::ConstantOp>(loc, rewriter.getI32Type(), fileLine);
+    // interpolate the fmt str AOT because current gpu.printf lowering doesn't
+    // handle %s
+    llvm::Twine fmtStr = fileName + ":%u: " + funcName +
+                         " Device-side assertion `" + assertOp.getMsg() +
+                         "' failed.\n";
+    rewriter.create<gpu::PrintfOp>(assertOp.getLoc(),
+                                   rewriter.getStringAttr(fmtStr),
+                                   ValueRange{assertLine});
+    rewriter.replaceOpWithNewOp<LLVM::Trap>(assertOp);
+
+    return success();
+  }
+};
+
 /// Import the GPU Ops to ROCDL Patterns.
 #include "GPUToROCDL.cpp.inc"
 
@@ -297,7 +367,7 @@ struct LowerGpuOpsToROCDLOpsPass
     populateVectorToLLVMConversionPatterns(converter, llvmPatterns);
     populateMathToLLVMConversionPatterns(converter, llvmPatterns);
     cf::populateControlFlowToLLVMConversionPatterns(converter, llvmPatterns);
-    cf::populateAssertToLLVMConversionPattern(converter, llvmPatterns);
+    llvmPatterns.add<AssertOpToBuiltinTrapLowering>(converter);
     populateFuncToLLVMConversionPatterns(converter, llvmPatterns);
     populateFinalizeMemRefToLLVMConversionPatterns(converter, llvmPatterns);
     populateGpuToROCDLConversionPatterns(converter, llvmPatterns, runtime);
diff --git a/mlir/test/Integration/GPU/ROCM/assert.mlir b/mlir/test/Integration/GPU/ROCM/assert.mlir
new file mode 100644
index 00000000000000..0c292d1b02473e
--- /dev/null
+++ b/mlir/test/Integration/GPU/ROCM/assert.mlir
@@ -0,0 +1,37 @@
+// RUN: mlir-opt %s -gpu-lower-to-nvvm-pipeline="cubin-format=%gpu_compilation_format" \
+// RUN: | mlir-cpu-runner \
+// RUN:   --shared-libs=%mlir_cuda_runtime \
+// RUN:   --shared-libs=%mlir_runner_utils \
+// RUN:   --entry-point-result=void 2>&1 \
+// RUN: | FileCheck %s
+
+// CHECK-DAG: thread 0: print after passing assertion
+// CHECK-DAG: thread 1: print after passing assertion
+// CHECK-DAG: mlir/test/Integration/GPU/ROCM/assert.mlir:{{.*}}: (unknown) Device-side assertion `failing assertion' failed.
+// CHECK-DAG: mlir/test/Integration/GPU/ROCM/assert.mlir:{{.*}}: (unknown) Device-side assertion `failing assertion' failed.
+// CHECK-NOT: print after failing assertion
+
+module attributes {gpu.container_module} {
+gpu.module @kernels {
+gpu.func @test_assert(%c0: i1, %c1: i1) kernel {
+  %0 = gpu.thread_id x
+  cf.assert %c1, "passing assertion"
+  gpu.printf "thread %lld: print after passing assertion\n" %0 : index
+  cf.assert %c0, "failing assertion"
+  gpu.printf "thread %lld: print after failing assertion\n" %0 : index
+  gpu.return
+}
+}
+
+func.func @main() {
+  %c2 = arith.constant 2 : index
+  %c1 = arith.constant 1 : index
+  %c0_i1 = arith.constant 0 : i1
+  %c1_i1 = arith.constant 1 : i1
+  gpu.launch_func @kernels::@test_assert
+      blocks in (%c1, %c1, %c1)
+      threads in (%c2, %c1, %c1)
+      args(%c0_i1 : i1, %c1_i1 : i1)
+  return
+}
+}

krzysz00

Approved
Wrt OpenCL ... I hope legalization didn't get broken, but in the OpenCL flow, pryntf should lower to ... printf(), which the compiler will handle. Or at least that's my recollection of how that goes from staring at the AMDGPU backend ~a year ago

jhuber6 · 2025-01-03T14:54:12Z

Approved

Wrt OpenCL ... I hope legalization didn't get broken, but in the OpenCL flow, pryntf should lower to ... printf(), which the compiler will handle. Or at least that's my recollection of how that goes from staring at the AMDGPU backend ~a year ago

It's complicated, there's like two different flows that either lower printf to AMD's hostcall version or to a ring buffer type affair, then if you suppress the transform you just get printf symbols which is what my implementation uses.

krzysz00 · 2025-01-03T17:58:10Z

Re OpenCL and the linked test: we don't have an integration test for OpenCL's lowering because we don't have a way to execute it

matthias-springer · 2025-01-06T12:40:19Z

llvm:users/matthias-springer/gpu_assert was deleted when I merged my PR. Looks like this cannot be reopened, I think you have to create a new PR. Or maybe you can change the target branch and then reopen.

[mlir][GPU] Add gpu.assert op

8865986

llvmbot added mlir:gpu mlir labels Dec 24, 2024

makslevental requested a review from jhuber6 December 24, 2024 20:31

makslevental requested a review from krzysz00 December 24, 2024 20:32

makslevental force-pushed the users/makslevental/amdgpu-gpu_assert branch from a3ba62c to b8afb04 Compare December 24, 2024 20:33

makslevental requested a review from antiagainst December 24, 2024 20:41

[mlir][rocdl] Add AMDGPU-specific cf.assert lowering

79c96cb

makslevental force-pushed the users/makslevental/amdgpu-gpu_assert branch from b8afb04 to 79c96cb Compare December 24, 2024 20:50

krzysz00 approved these changes Jan 3, 2025

View reviewed changes

matthias-springer force-pushed the users/matthias-springer/gpu_assert branch from 8865986 to 86f4eff Compare January 6, 2025 08:51

matthias-springer requested a review from grypp as a code owner January 6, 2025 08:51

matthias-springer force-pushed the users/matthias-springer/gpu_assert branch from 86f4eff to dbd81f3 Compare January 6, 2025 09:28

matthias-springer deleted the branch llvm:users/matthias-springer/gpu_assert January 6, 2025 11:00

matthias-springer closed this Jan 6, 2025

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

[mlir][rocdl] Add AMDGPU-specific `cf.assert` lowering #121067

[mlir][rocdl] Add AMDGPU-specific `cf.assert` lowering #121067

Uh oh!

makslevental commented Dec 24, 2024 •

edited

Loading

Uh oh!

llvmbot commented Dec 24, 2024 •

edited

Loading

Uh oh!

krzysz00 left a comment

Uh oh!

jhuber6 commented Jan 3, 2025

Uh oh!

krzysz00 commented Jan 3, 2025

Uh oh!

matthias-springer commented Jan 6, 2025

Uh oh!

Uh oh!

[mlir][rocdl] Add AMDGPU-specific cf.assert lowering #121067

[mlir][rocdl] Add AMDGPU-specific cf.assert lowering #121067

Uh oh!

Conversation

makslevental commented Dec 24, 2024 • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

Uh oh!

llvmbot commented Dec 24, 2024 • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

Uh oh!

krzysz00 left a comment

Choose a reason for hiding this comment

Uh oh!

jhuber6 commented Jan 3, 2025

Uh oh!

krzysz00 commented Jan 3, 2025

Uh oh!

matthias-springer commented Jan 6, 2025

Uh oh!

Uh oh!

[mlir][rocdl] Add AMDGPU-specific `cf.assert` lowering #121067

[mlir][rocdl] Add AMDGPU-specific `cf.assert` lowering #121067

makslevental commented Dec 24, 2024 •

edited

Loading

llvmbot commented Dec 24, 2024 •

edited

Loading