Skip to content

Commit f4fb039

Browse files
authored
[MLIR] Cleanup Pass Pipeline in sm_90 Integration Tests (#67416)
MLIR has begun supporting many features of Nvidia's sm_90 architecture, and new tests have been added for it. Although the tests worked well, there were redundancies in the pipeline. This PR cleans up unnecessary passes.
1 parent 39f36d5 commit f4fb039

File tree

3 files changed

+27
-47
lines changed

3 files changed

+27
-47
lines changed

mlir/test/Integration/GPU/CUDA/sm90/tma_load_128x64_swizzle128b.mlir

Lines changed: 13 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -1,20 +1,16 @@
1-
// RUN: mlir-opt %s --convert-nvgpu-to-nvvm \
2-
// RUN: -convert-linalg-to-loops \
3-
// RUN: -gpu-kernel-outlining \
4-
// RUN: -convert-vector-to-scf \
5-
// RUN: -lower-affine \
6-
// RUN: -convert-scf-to-cf \
7-
// RUN: -convert-nvvm-to-llvm \
8-
// RUN: -convert-nvgpu-to-nvvm \
9-
// RUN: -convert-scf-to-cf \
10-
// RUN: -convert-vector-to-llvm \
11-
// RUN: -convert-math-to-llvm \
12-
// RUN: -convert-index-to-llvm=index-bitwidth=32 \
13-
// RUN: -convert-arith-to-llvm \
14-
// RUN: -finalize-memref-to-llvm='use-opaque-pointers=1' \
15-
// RUN: -convert-func-to-llvm \
16-
// RUN: -canonicalize -cse \
17-
// RUN: -expand-strided-metadata --nvvm-attach-target="module=main_kernel features=+ptx80 chip=sm_90 O=3" \
1+
// RUN: mlir-opt %s \
2+
// RUN: -convert-nvgpu-to-nvvm \
3+
// RUN: -gpu-kernel-outlining \
4+
// RUN: -convert-vector-to-scf \
5+
// RUN: -convert-scf-to-cf \
6+
// RUN: -convert-nvvm-to-llvm \
7+
// RUN: -convert-vector-to-llvm \
8+
// RUN: -convert-index-to-llvm=index-bitwidth=32 \
9+
// RUN: -convert-arith-to-llvm \
10+
// RUN: -finalize-memref-to-llvm='use-opaque-pointers=1' \
11+
// RUN: -convert-func-to-llvm \
12+
// RUN: -canonicalize -cse \
13+
// RUN: -expand-strided-metadata --nvvm-attach-target="module=main_kernel features=+ptx80 chip=sm_90 O=3" \
1814
// RUN: | mlir-opt -pass-pipeline='builtin.module(gpu.module(strip-debuginfo,convert-gpu-to-nvvm,convert-index-to-llvm{index-bitwidth=32},canonicalize,cse))' \
1915
// RUN: | mlir-opt --gpu-to-llvm --gpu-module-to-binary=format=%gpu_compilation_format -canonicalize -cse -reconcile-unrealized-casts \
2016
// RUN: | mlir-cpu-runner \

mlir/test/Integration/GPU/CUDA/sm90/tma_load_64x64_swizzle128b.mlir

Lines changed: 14 additions & 27 deletions
Original file line numberDiff line numberDiff line change
@@ -1,30 +1,17 @@
1-
// RUN: mlir-opt %s --convert-nvgpu-to-nvvm \
2-
// RUN: -convert-linalg-to-loops \
3-
// RUN: -canonicalize -cse \
4-
// RUN: -gpu-kernel-outlining \
5-
// RUN: -canonicalize -cse \
6-
// RUN: -convert-vector-to-scf \
7-
// RUN: -canonicalize -cse \
8-
// RUN: -lower-affine \
9-
// RUN: -canonicalize -cse \
10-
// RUN: -convert-scf-to-cf \
11-
// RUN: -canonicalize -cse \
12-
// RUN: -convert-nvvm-to-llvm \
13-
// RUN: -canonicalize -cse \
14-
// RUN: -convert-nvgpu-to-nvvm \
15-
// RUN: -canonicalize -cse \
16-
// RUN: -convert-scf-to-cf \
17-
// RUN: -convert-vector-to-llvm \
18-
// RUN: -canonicalize -cse \
19-
// RUN: -convert-math-to-llvm \
20-
// RUN: -canonicalize -cse \
21-
// RUN: -lower-affine \
22-
// RUN: -convert-index-to-llvm=index-bitwidth=32 \
23-
// RUN: -convert-arith-to-llvm \
24-
// RUN: -finalize-memref-to-llvm='use-opaque-pointers=1' \
25-
// RUN: -convert-func-to-llvm \
26-
// RUN: -canonicalize -cse \
27-
// RUN: -expand-strided-metadata --nvvm-attach-target="module=main_kernel features=+ptx80 chip=sm_90 O=3" \
1+
// RUN: mlir-opt %s \
2+
// RUN: -convert-nvgpu-to-nvvm \
3+
// RUN: -canonicalize -cse \
4+
// RUN: -gpu-kernel-outlining \
5+
// RUN: -convert-vector-to-scf \
6+
// RUN: -convert-scf-to-cf \
7+
// RUN: -convert-nvvm-to-llvm \
8+
// RUN: -convert-vector-to-llvm \
9+
// RUN: -convert-index-to-llvm=index-bitwidth=32 \
10+
// RUN: -convert-arith-to-llvm \
11+
// RUN: -finalize-memref-to-llvm='use-opaque-pointers=1' \
12+
// RUN: -convert-func-to-llvm \
13+
// RUN: -canonicalize -cse \
14+
// RUN: -expand-strided-metadata --nvvm-attach-target="module=main_kernel features=+ptx80 chip=sm_90 O=3" \
2815
// RUN: | mlir-opt -pass-pipeline='builtin.module(gpu.module(strip-debuginfo,convert-gpu-to-nvvm,convert-index-to-llvm{index-bitwidth=32},canonicalize,cse))' \
2916
// RUN: | mlir-opt --gpu-to-llvm --gpu-module-to-binary -canonicalize -cse -reconcile-unrealized-casts \
3017
// RUN: | mlir-cpu-runner \

mlir/test/Integration/GPU/CUDA/sm90/tma_load_64x8_8x128_noswizzle.mlir

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,6 @@
11
// RUN: mlir-opt %s --convert-nvgpu-to-nvvm \
22
// RUN: -gpu-kernel-outlining \
33
// RUN: -convert-nvvm-to-llvm \
4-
// RUN: -convert-nvgpu-to-nvvm \
54
// RUN: -convert-scf-to-cf \
65
// RUN: -convert-vector-to-llvm \
76
// RUN: -convert-index-to-llvm=index-bitwidth=32 \
@@ -25,7 +24,6 @@
2524
// RUN: mlir-opt %s --convert-nvgpu-to-nvvm \
2625
// RUN: -gpu-kernel-outlining \
2726
// RUN: -convert-nvvm-to-llvm \
28-
// RUN: -convert-nvgpu-to-nvvm \
2927
// RUN: -convert-scf-to-cf \
3028
// RUN: -convert-vector-to-llvm \
3129
// RUN: -convert-index-to-llvm=index-bitwidth=32 \
@@ -41,7 +39,6 @@
4139
// RUN: --entry-point-result=void \
4240
// RUN: | FileCheck %s
4341

44-
4542
// CHECK: [GPU] TMA BEFORE lhs[45][7] 0.000000
4643
// CHECK: [GPU] TMA BEFORE rhs[7][0] 0.000000
4744
// CHECK: [GPU] TMA LOADED lhs[45][7] 7.000000

0 commit comments

Comments
 (0)