1
1
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --function-signature --check-globals
2
2
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-attributor %s | FileCheck --check-prefixes=CHECK,OW %s
3
3
; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes='amdgpu-attributor<closed-world>' %s | FileCheck --check-prefixes=CHECK,CW %s
4
+ ; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes='amdgpu-attributor<closed-world>' -amdgpu-indirect-call-specialization-threshold=0 %s | FileCheck --check-prefixes=CHECK,NO %s
4
5
5
6
target datalayout = "A5"
6
7
@@ -9,8 +10,8 @@ target datalayout = "A5"
9
10
;.
10
11
; CHECK: @G = global i32 0, align 4
11
12
;.
12
- define void @bar () {
13
- ; CHECK-LABEL: define {{[^@]+}}@bar
13
+ define void @bar1 () {
14
+ ; CHECK-LABEL: define {{[^@]+}}@bar1
14
15
; CHECK-SAME: () #[[ATTR0:[0-9]+]] {
15
16
; CHECK-NEXT: entry:
16
17
; CHECK-NEXT: store i32 1, ptr @G, align 4
@@ -21,14 +22,36 @@ entry:
21
22
ret void
22
23
}
23
24
24
- define ptr @helper () {
25
- ; CHECK-LABEL: define {{[^@]+}}@helper
25
+ define void @bar2 () {
26
+ ; CHECK-LABEL: define {{[^@]+}}@bar2
26
27
; CHECK-SAME: () #[[ATTR0]] {
27
28
; CHECK-NEXT: entry:
28
- ; CHECK-NEXT: ret ptr @bar
29
+ ; CHECK-NEXT: store i32 2, ptr @G, align 4
30
+ ; CHECK-NEXT: ret void
29
31
;
30
32
entry:
31
- ret ptr @bar
33
+ store i32 2 , ptr @G , align 4
34
+ ret void
35
+ }
36
+
37
+ define ptr @helper1 () {
38
+ ; CHECK-LABEL: define {{[^@]+}}@helper1
39
+ ; CHECK-SAME: () #[[ATTR0]] {
40
+ ; CHECK-NEXT: entry:
41
+ ; CHECK-NEXT: ret ptr @bar1
42
+ ;
43
+ entry:
44
+ ret ptr @bar1
45
+ }
46
+
47
+ define ptr @helper2 () {
48
+ ; CHECK-LABEL: define {{[^@]+}}@helper2
49
+ ; CHECK-SAME: () #[[ATTR0]] {
50
+ ; CHECK-NEXT: entry:
51
+ ; CHECK-NEXT: ret ptr @bar2
52
+ ;
53
+ entry:
54
+ ret ptr @bar2
32
55
}
33
56
34
57
define amdgpu_kernel void @foo (ptr noundef %fp ) {
@@ -45,10 +68,29 @@ define amdgpu_kernel void @foo(ptr noundef %fp) {
45
68
; CW-NEXT: entry:
46
69
; CW-NEXT: [[FP_ADDR:%.*]] = alloca ptr, align 8, addrspace(5)
47
70
; CW-NEXT: store ptr [[FP]], ptr addrspace(5) [[FP_ADDR]], align 8
48
- ; CW-NEXT: [[LOAD:%.*]] = load ptr, ptr addrspace(5) [[FP_ADDR]], align 8
49
- ; CW-NEXT: call void @bar()
71
+ ; CW-NEXT: [[TMP0:%.*]] = icmp eq ptr [[FP]], @bar1
72
+ ; CW-NEXT: br i1 [[TMP0]], label [[TMP1:%.*]], label [[TMP2:%.*]]
73
+ ; CW: 1:
74
+ ; CW-NEXT: call void @bar1()
75
+ ; CW-NEXT: br label [[TMP5:%.*]]
76
+ ; CW: 2:
77
+ ; CW-NEXT: br i1 true, label [[TMP3:%.*]], label [[TMP4:%.*]]
78
+ ; CW: 3:
79
+ ; CW-NEXT: call void @bar2()
80
+ ; CW-NEXT: br label [[TMP5]]
81
+ ; CW: 4:
82
+ ; CW-NEXT: unreachable
83
+ ; CW: 5:
50
84
; CW-NEXT: ret void
51
85
;
86
+ ; NO-LABEL: define {{[^@]+}}@foo
87
+ ; NO-SAME: (ptr noundef [[FP:%.*]]) #[[ATTR1:[0-9]+]] {
88
+ ; NO-NEXT: entry:
89
+ ; NO-NEXT: [[FP_ADDR:%.*]] = alloca ptr, align 8, addrspace(5)
90
+ ; NO-NEXT: store ptr [[FP]], ptr addrspace(5) [[FP_ADDR]], align 8
91
+ ; NO-NEXT: call void [[FP]](), !callees [[META0:![0-9]+]]
92
+ ; NO-NEXT: ret void
93
+ ;
52
94
entry:
53
95
%fp.addr = alloca ptr , addrspace (5 )
54
96
store ptr %fp , ptr addrspace (5 ) %fp.addr
@@ -57,10 +99,15 @@ entry:
57
99
ret void
58
100
}
59
101
102
+ ;.
103
+ ; NO: attributes #[[ATTR0]] = { "amdgpu-no-agpr" "amdgpu-no-completion-action" "amdgpu-no-default-queue" "amdgpu-no-dispatch-id" "amdgpu-no-dispatch-ptr" "amdgpu-no-heap-ptr" "amdgpu-no-hostcall-ptr" "amdgpu-no-implicitarg-ptr" "amdgpu-no-lds-kernel-id" "amdgpu-no-multigrid-sync-arg" "amdgpu-no-queue-ptr" "amdgpu-no-workgroup-id-x" "amdgpu-no-workgroup-id-y" "amdgpu-no-workgroup-id-z" "amdgpu-no-workitem-id-x" "amdgpu-no-workitem-id-y" "amdgpu-no-workitem-id-z" "amdgpu-waves-per-eu"="4,10" "uniform-work-group-size"="false" }
104
+ ; NO: attributes #[[ATTR1]] = { "amdgpu-no-completion-action" "amdgpu-no-default-queue" "amdgpu-no-dispatch-id" "amdgpu-no-dispatch-ptr" "amdgpu-no-heap-ptr" "amdgpu-no-hostcall-ptr" "amdgpu-no-implicitarg-ptr" "amdgpu-no-lds-kernel-id" "amdgpu-no-multigrid-sync-arg" "amdgpu-no-queue-ptr" "amdgpu-no-workgroup-id-x" "amdgpu-no-workgroup-id-y" "amdgpu-no-workgroup-id-z" "amdgpu-no-workitem-id-x" "amdgpu-no-workitem-id-y" "amdgpu-no-workitem-id-z" "uniform-work-group-size"="false" }
60
105
;.
61
106
; OW: attributes #[[ATTR0]] = { "amdgpu-no-agpr" "amdgpu-no-completion-action" "amdgpu-no-default-queue" "amdgpu-no-dispatch-id" "amdgpu-no-dispatch-ptr" "amdgpu-no-heap-ptr" "amdgpu-no-hostcall-ptr" "amdgpu-no-implicitarg-ptr" "amdgpu-no-lds-kernel-id" "amdgpu-no-multigrid-sync-arg" "amdgpu-no-queue-ptr" "amdgpu-no-workgroup-id-x" "amdgpu-no-workgroup-id-y" "amdgpu-no-workgroup-id-z" "amdgpu-no-workitem-id-x" "amdgpu-no-workitem-id-y" "amdgpu-no-workitem-id-z" "amdgpu-waves-per-eu"="4,10" "uniform-work-group-size"="false" }
62
107
; OW: attributes #[[ATTR1]] = { "uniform-work-group-size"="false" }
63
108
;.
64
109
; CW: attributes #[[ATTR0]] = { "amdgpu-no-agpr" "amdgpu-no-completion-action" "amdgpu-no-default-queue" "amdgpu-no-dispatch-id" "amdgpu-no-dispatch-ptr" "amdgpu-no-heap-ptr" "amdgpu-no-hostcall-ptr" "amdgpu-no-implicitarg-ptr" "amdgpu-no-lds-kernel-id" "amdgpu-no-multigrid-sync-arg" "amdgpu-no-queue-ptr" "amdgpu-no-workgroup-id-x" "amdgpu-no-workgroup-id-y" "amdgpu-no-workgroup-id-z" "amdgpu-no-workitem-id-x" "amdgpu-no-workitem-id-y" "amdgpu-no-workitem-id-z" "amdgpu-waves-per-eu"="4,10" "uniform-work-group-size"="false" }
65
110
; CW: attributes #[[ATTR1]] = { "amdgpu-no-completion-action" "amdgpu-no-default-queue" "amdgpu-no-dispatch-id" "amdgpu-no-dispatch-ptr" "amdgpu-no-heap-ptr" "amdgpu-no-hostcall-ptr" "amdgpu-no-implicitarg-ptr" "amdgpu-no-lds-kernel-id" "amdgpu-no-multigrid-sync-arg" "amdgpu-no-queue-ptr" "amdgpu-no-workgroup-id-x" "amdgpu-no-workgroup-id-y" "amdgpu-no-workgroup-id-z" "amdgpu-no-workitem-id-x" "amdgpu-no-workitem-id-y" "amdgpu-no-workitem-id-z" "uniform-work-group-size"="false" }
66
111
;.
112
+ ; NO: [[META0]] = !{ptr @bar1, ptr @bar2}
113
+ ;.
0 commit comments