Skip to content

Commit 3bc1254

Browse files
authored
[AMDGPU][Verifier] Check address space of alloca instruction (llvm#135820)
This PR updates the `Verifier` to enforce that `alloca` instructions on AMDGPU must be in AS5. This prevents hitting a misleading backend error like "unable to select FrameIndex," which makes it look like a backend bug when it's actually an IR-level issue.
1 parent fa65a22 commit 3bc1254

File tree

10 files changed

+4085
-3215
lines changed

10 files changed

+4085
-3215
lines changed

llvm/lib/IR/Verifier.cpp

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -4395,6 +4395,11 @@ void Verifier::visitAllocaInst(AllocaInst &AI) {
43954395
verifySwiftErrorValue(&AI);
43964396
}
43974397

4398+
if (TT.isAMDGPU()) {
4399+
Check(AI.getAddressSpace() == AMDGPUAS::PRIVATE_ADDRESS,
4400+
"alloca on amdgpu must be in addrspace(5)", &AI);
4401+
}
4402+
43984403
visitInstruction(AI);
43994404
}
44004405

llvm/test/CodeGen/AMDGPU/assert-wrong-alloca-addrspace.ll

Lines changed: 0 additions & 16 deletions
This file was deleted.

llvm/test/CodeGen/AMDGPU/lower-indirect-lds-references.ll

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -16,8 +16,9 @@ define amdgpu_kernel void @offloading_kernel() {
1616
}
1717

1818
define void @call_unknown() {
19-
%1 = alloca ptr, align 8
20-
%2 = call i32 %1()
19+
%alloca = alloca ptr, align 8, addrspace(5)
20+
%alloca.cast = addrspacecast ptr addrspace(5) %alloca to ptr
21+
%ret = call i32 %alloca.cast()
2122
ret void
2223
}
2324

llvm/test/Transforms/InstCombine/alloca-in-non-alloca-as.ll

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -3,9 +3,6 @@
33

44
; Gracefully handle the alloca that is not in the alloca AS (=5)
55

6-
target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-p7:160:256:256:32-p8:128:128-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5-G1-ni:7:8:9"
7-
target triple = "amdgcn-amd-amdhsa"
8-
96
declare void @use(ptr)
107
declare void @use2(ptr, ptr)
118

llvm/test/Transforms/OpenMP/custom_state_machines.ll

Lines changed: 1202 additions & 947 deletions
Large diffs are not rendered by default.

llvm/test/Transforms/OpenMP/custom_state_machines_pre_lto.ll

Lines changed: 1582 additions & 1284 deletions
Large diffs are not rendered by default.

llvm/test/Transforms/OpenMP/spmdization.ll

Lines changed: 776 additions & 555 deletions
Large diffs are not rendered by default.

llvm/test/Transforms/OpenMP/spmdization_constant_prop.ll

Lines changed: 124 additions & 129 deletions
Large diffs are not rendered by default.

llvm/test/Transforms/OpenMP/spmdization_indirect.ll

Lines changed: 291 additions & 279 deletions
Large diffs are not rendered by default.

llvm/test/Verifier/AMDGPU/alloca.ll

Lines changed: 102 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,102 @@
1+
; RUN: not llvm-as %s --disable-output 2>&1 | FileCheck %s
2+
3+
target triple = "amdgcn-amd-amdhsa"
4+
5+
; CHECK: alloca on amdgpu must be in addrspace(5)
6+
; CHECK-NEXT: %alloca.0 = alloca i32, align 4
7+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
8+
; CHECK-NEXT: %alloca.1 = alloca i32, align 4, addrspace(1)
9+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
10+
; CHECK-NEXT: %alloca.2 = alloca i32, align 4, addrspace(2)
11+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
12+
; CHECK-NEXT: %alloca.3 = alloca i32, align 4, addrspace(3)
13+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
14+
; CHECK-NEXT: %alloca.4 = alloca i32, align 4, addrspace(4)
15+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
16+
; CHECK-NEXT: %alloca.6 = alloca i32, align 4, addrspace(6)
17+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
18+
; CHECK-NEXT: %alloca.7 = alloca i32, align 4, addrspace(7)
19+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
20+
; CHECK-NEXT: %alloca.8 = alloca i32, align 4, addrspace(8)
21+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
22+
; CHECK-NEXT: %alloca.9 = alloca i32, align 4, addrspace(9)
23+
define void @static_alloca() {
24+
entry:
25+
%alloca.0 = alloca i32, align 4
26+
%alloca.1 = alloca i32, align 4, addrspace(1)
27+
%alloca.2 = alloca i32, align 4, addrspace(2)
28+
%alloca.3 = alloca i32, align 4, addrspace(3)
29+
%alloca.4 = alloca i32, align 4, addrspace(4)
30+
%alloca.5 = alloca i32, align 4, addrspace(5)
31+
%alloca.6 = alloca i32, align 4, addrspace(6)
32+
%alloca.7 = alloca i32, align 4, addrspace(7)
33+
%alloca.8 = alloca i32, align 4, addrspace(8)
34+
%alloca.9 = alloca i32, align 4, addrspace(9)
35+
ret void
36+
}
37+
38+
; CHECK: alloca on amdgpu must be in addrspace(5)
39+
; CHECK-NEXT: %alloca.0 = alloca i32, i32 %n, align 4
40+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
41+
; CHECK-NEXT: %alloca.1 = alloca i32, i32 %n, align 4, addrspace(1)
42+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
43+
; CHECK-NEXT: %alloca.2 = alloca i32, i32 %n, align 4, addrspace(2)
44+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
45+
; CHECK-NEXT: %alloca.3 = alloca i32, i32 %n, align 4, addrspace(3)
46+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
47+
; CHECK-NEXT: %alloca.4 = alloca i32, i32 %n, align 4, addrspace(4)
48+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
49+
; CHECK-NEXT: %alloca.6 = alloca i32, i32 %n, align 4, addrspace(6)
50+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
51+
; CHECK-NEXT: %alloca.7 = alloca i32, i32 %n, align 4, addrspace(7)
52+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
53+
; CHECK-NEXT: %alloca.8 = alloca i32, i32 %n, align 4, addrspace(8)
54+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
55+
; CHECK-NEXT: %alloca.9 = alloca i32, i32 %n, align 4, addrspace(9)
56+
define void @dynamic_alloca_i32(i32 %n) {
57+
entry:
58+
%alloca.0 = alloca i32, i32 %n, align 4
59+
%alloca.1 = alloca i32, i32 %n, align 4, addrspace(1)
60+
%alloca.2 = alloca i32, i32 %n, align 4, addrspace(2)
61+
%alloca.3 = alloca i32, i32 %n, align 4, addrspace(3)
62+
%alloca.4 = alloca i32, i32 %n, align 4, addrspace(4)
63+
%alloca.5 = alloca i32, i32 %n, align 4, addrspace(5)
64+
%alloca.6 = alloca i32, i32 %n, align 4, addrspace(6)
65+
%alloca.7 = alloca i32, i32 %n, align 4, addrspace(7)
66+
%alloca.8 = alloca i32, i32 %n, align 4, addrspace(8)
67+
%alloca.9 = alloca i32, i32 %n, align 4, addrspace(9)
68+
ret void
69+
}
70+
71+
; CHECK: alloca on amdgpu must be in addrspace(5)
72+
; CHECK-NEXT: %alloca.0 = alloca i32, i64 %n, align 4
73+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
74+
; CHECK-NEXT: %alloca.1 = alloca i32, i64 %n, align 4, addrspace(1)
75+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
76+
; CHECK-NEXT: %alloca.2 = alloca i32, i64 %n, align 4, addrspace(2)
77+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
78+
; CHECK-NEXT: %alloca.3 = alloca i32, i64 %n, align 4, addrspace(3)
79+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
80+
; CHECK-NEXT: %alloca.4 = alloca i32, i64 %n, align 4, addrspace(4)
81+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
82+
; CHECK-NEXT: %alloca.6 = alloca i32, i64 %n, align 4, addrspace(6)
83+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
84+
; CHECK-NEXT: %alloca.7 = alloca i32, i64 %n, align 4, addrspace(7)
85+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
86+
; CHECK-NEXT: %alloca.8 = alloca i32, i64 %n, align 4, addrspace(8)
87+
; CHECK-NEXT: alloca on amdgpu must be in addrspace(5)
88+
; CHECK-NEXT: %alloca.9 = alloca i32, i64 %n, align 4, addrspace(9)
89+
define void @dynamic_alloca_i64(i64 %n) {
90+
entry:
91+
%alloca.0 = alloca i32, i64 %n, align 4
92+
%alloca.1 = alloca i32, i64 %n, align 4, addrspace(1)
93+
%alloca.2 = alloca i32, i64 %n, align 4, addrspace(2)
94+
%alloca.3 = alloca i32, i64 %n, align 4, addrspace(3)
95+
%alloca.4 = alloca i32, i64 %n, align 4, addrspace(4)
96+
%alloca.5 = alloca i32, i64 %n, align 4, addrspace(5)
97+
%alloca.6 = alloca i32, i64 %n, align 4, addrspace(6)
98+
%alloca.7 = alloca i32, i64 %n, align 4, addrspace(7)
99+
%alloca.8 = alloca i32, i64 %n, align 4, addrspace(8)
100+
%alloca.9 = alloca i32, i64 %n, align 4, addrspace(9)
101+
ret void
102+
}

0 commit comments

Comments
 (0)