1
+ ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
1
2
; RUN: llc < %s -mtriple=powerpc-unknown-linux-gnu -verify-machineinstrs -ppc-asm-full-reg-names | FileCheck %s --check-prefix=CHECK --check-prefix=PPC32
2
3
; FIXME: -verify-machineinstrs currently fail on ppc64 (mismatched register/instruction).
3
4
; This is already checked for in Atomics-64.ll
8
9
9
10
; Indexed version of loads
10
11
define i8 @load_x_i8_seq_cst ([100000 x i8 ]* %mem ) {
11
- ; CHECK-LABEL: load_x_i8_seq_cst
12
- ; CHECK: sync
13
- ; CHECK: lbzx [[VAL:r[0-9]+]]
12
+ ; PPC32-LABEL: load_x_i8_seq_cst:
13
+ ; PPC32: # %bb.0:
14
+ ; PPC32-NEXT: lis r4, 1
15
+ ; PPC32-NEXT: sync
16
+ ; PPC32-NEXT: ori r4, r4, 24464
17
+ ; PPC32-NEXT: lbzx r3, r3, r4
18
+ ; PPC32-NEXT: lwsync
19
+ ; PPC32-NEXT: blr
20
+ ;
21
+ ; PPC64-LABEL: load_x_i8_seq_cst:
22
+ ; PPC64: # %bb.0:
23
+ ; PPC64-NEXT: lis r4, 1
24
+ ; PPC64-NEXT: sync
25
+ ; PPC64-NEXT: ori r4, r4, 24464
26
+ ; PPC64-NEXT: lbzx r3, r3, r4
27
+ ; PPC64-NEXT: cmpd cr7, r3, r3
28
+ ; PPC64-NEXT: bne- cr7, .+4
29
+ ; PPC64-NEXT: isync
30
+ ; PPC64-NEXT: blr
14
31
; CHECK-PPC32: lwsync
15
32
; CHECK-PPC64: cmpw [[CR:cr[0-9]+]], [[VAL]], [[VAL]]
16
33
; CHECK-PPC64: bne- [[CR]], .+4
@@ -20,8 +37,23 @@ define i8 @load_x_i8_seq_cst([100000 x i8]* %mem) {
20
37
ret i8 %val
21
38
}
22
39
define i16 @load_x_i16_acquire ([100000 x i16 ]* %mem ) {
23
- ; CHECK-LABEL: load_x_i16_acquire
24
- ; CHECK: lhzx [[VAL:r[0-9]+]]
40
+ ; PPC32-LABEL: load_x_i16_acquire:
41
+ ; PPC32: # %bb.0:
42
+ ; PPC32-NEXT: lis r4, 2
43
+ ; PPC32-NEXT: ori r4, r4, 48928
44
+ ; PPC32-NEXT: lhzx r3, r3, r4
45
+ ; PPC32-NEXT: lwsync
46
+ ; PPC32-NEXT: blr
47
+ ;
48
+ ; PPC64-LABEL: load_x_i16_acquire:
49
+ ; PPC64: # %bb.0:
50
+ ; PPC64-NEXT: lis r4, 2
51
+ ; PPC64-NEXT: ori r4, r4, 48928
52
+ ; PPC64-NEXT: lhzx r3, r3, r4
53
+ ; PPC64-NEXT: cmpd cr7, r3, r3
54
+ ; PPC64-NEXT: bne- cr7, .+4
55
+ ; PPC64-NEXT: isync
56
+ ; PPC64-NEXT: blr
25
57
; CHECK-PPC32: lwsync
26
58
; CHECK-PPC64: cmpw [[CR:cr[0-9]+]], [[VAL]], [[VAL]]
27
59
; CHECK-PPC64: bne- [[CR]], .+4
@@ -31,55 +63,109 @@ define i16 @load_x_i16_acquire([100000 x i16]* %mem) {
31
63
ret i16 %val
32
64
}
33
65
define i32 @load_x_i32_monotonic ([100000 x i32 ]* %mem ) {
34
- ; CHECK-LABEL: load_x_i32_monotonic
35
- ; CHECK: lwzx
36
- ; CHECK-NOT: sync
66
+ ; CHECK-LABEL: load_x_i32_monotonic:
67
+ ; CHECK: # %bb.0:
68
+ ; CHECK-NEXT: lis r4, 5
69
+ ; CHECK-NEXT: ori r4, r4, 32320
70
+ ; CHECK-NEXT: lwzx r3, r3, r4
71
+ ; CHECK-NEXT: blr
37
72
%ptr = getelementptr inbounds [100000 x i32 ], [100000 x i32 ]* %mem , i64 0 , i64 90000
38
73
%val = load atomic i32 , i32* %ptr monotonic , align 4
39
74
ret i32 %val
40
75
}
41
76
define i64 @load_x_i64_unordered ([100000 x i64 ]* %mem ) {
42
- ; CHECK-LABEL: load_x_i64_unordered
43
- ; PPC32: __sync_
44
- ; PPC64-NOT: __sync_
45
- ; PPC64: ldx
46
- ; CHECK-NOT: sync
77
+ ; PPC32-LABEL: load_x_i64_unordered:
78
+ ; PPC32: # %bb.0:
79
+ ; PPC32-NEXT: mflr r0
80
+ ; PPC32-NEXT: stw r0, 4(r1)
81
+ ; PPC32-NEXT: stwu r1, -16(r1)
82
+ ; PPC32-NEXT: .cfi_def_cfa_offset 16
83
+ ; PPC32-NEXT: .cfi_offset lr, 4
84
+ ; PPC32-NEXT: addi r3, r3, -896
85
+ ; PPC32-NEXT: addis r3, r3, 11
86
+ ; PPC32-NEXT: li r4, 0
87
+ ; PPC32-NEXT: bl __atomic_load_8
88
+ ; PPC32-NEXT: lwz r0, 20(r1)
89
+ ; PPC32-NEXT: addi r1, r1, 16
90
+ ; PPC32-NEXT: mtlr r0
91
+ ; PPC32-NEXT: blr
92
+ ;
93
+ ; PPC64-LABEL: load_x_i64_unordered:
94
+ ; PPC64: # %bb.0:
95
+ ; PPC64-NEXT: lis r4, 10
96
+ ; PPC64-NEXT: ori r4, r4, 64640
97
+ ; PPC64-NEXT: ldx r3, r3, r4
98
+ ; PPC64-NEXT: blr
47
99
%ptr = getelementptr inbounds [100000 x i64 ], [100000 x i64 ]* %mem , i64 0 , i64 90000
48
100
%val = load atomic i64 , i64* %ptr unordered , align 8
49
101
ret i64 %val
50
102
}
51
103
52
104
; Indexed version of stores
53
105
define void @store_x_i8_seq_cst ([100000 x i8 ]* %mem ) {
54
- ; CHECK-LABEL: store_x_i8_seq_cst
55
- ; CHECK: sync
56
- ; CHECK: stbx
106
+ ; CHECK-LABEL: store_x_i8_seq_cst:
107
+ ; CHECK: # %bb.0:
108
+ ; CHECK-NEXT: lis r4, 1
109
+ ; CHECK-NEXT: ori r4, r4, 24464
110
+ ; CHECK-NEXT: li r5, 42
111
+ ; CHECK-NEXT: sync
112
+ ; CHECK-NEXT: stbx r5, r3, r4
113
+ ; CHECK-NEXT: blr
57
114
%ptr = getelementptr inbounds [100000 x i8 ], [100000 x i8 ]* %mem , i64 0 , i64 90000
58
115
store atomic i8 42 , i8* %ptr seq_cst , align 1
59
116
ret void
60
117
}
61
118
define void @store_x_i16_release ([100000 x i16 ]* %mem ) {
62
- ; CHECK-LABEL: store_x_i16_release
63
- ; CHECK: lwsync
64
- ; CHECK: sthx
119
+ ; CHECK-LABEL: store_x_i16_release:
120
+ ; CHECK: # %bb.0:
121
+ ; CHECK-NEXT: lis r4, 2
122
+ ; CHECK-NEXT: ori r4, r4, 48928
123
+ ; CHECK-NEXT: li r5, 42
124
+ ; CHECK-NEXT: lwsync
125
+ ; CHECK-NEXT: sthx r5, r3, r4
126
+ ; CHECK-NEXT: blr
65
127
%ptr = getelementptr inbounds [100000 x i16 ], [100000 x i16 ]* %mem , i64 0 , i64 90000
66
128
store atomic i16 42 , i16* %ptr release , align 2
67
129
ret void
68
130
}
69
131
define void @store_x_i32_monotonic ([100000 x i32 ]* %mem ) {
70
- ; CHECK-LABEL: store_x_i32_monotonic
71
- ; CHECK-NOT: sync
72
- ; CHECK: stwx
132
+ ; CHECK-LABEL: store_x_i32_monotonic:
133
+ ; CHECK: # %bb.0:
134
+ ; CHECK-NEXT: lis r4, 5
135
+ ; CHECK-NEXT: ori r4, r4, 32320
136
+ ; CHECK-NEXT: li r5, 42
137
+ ; CHECK-NEXT: stwx r5, r3, r4
138
+ ; CHECK-NEXT: blr
73
139
%ptr = getelementptr inbounds [100000 x i32 ], [100000 x i32 ]* %mem , i64 0 , i64 90000
74
140
store atomic i32 42 , i32* %ptr monotonic , align 4
75
141
ret void
76
142
}
77
143
define void @store_x_i64_unordered ([100000 x i64 ]* %mem ) {
78
- ; CHECK-LABEL: store_x_i64_unordered
79
- ; CHECK-NOT: sync
80
- ; PPC32: __sync_
81
- ; PPC64-NOT: __sync_
82
- ; PPC64: stdx
144
+ ; PPC32-LABEL: store_x_i64_unordered:
145
+ ; PPC32: # %bb.0:
146
+ ; PPC32-NEXT: mflr r0
147
+ ; PPC32-NEXT: stw r0, 4(r1)
148
+ ; PPC32-NEXT: stwu r1, -16(r1)
149
+ ; PPC32-NEXT: .cfi_def_cfa_offset 16
150
+ ; PPC32-NEXT: .cfi_offset lr, 4
151
+ ; PPC32-NEXT: addi r3, r3, -896
152
+ ; PPC32-NEXT: addis r3, r3, 11
153
+ ; PPC32-NEXT: li r5, 0
154
+ ; PPC32-NEXT: li r6, 42
155
+ ; PPC32-NEXT: li r7, 0
156
+ ; PPC32-NEXT: bl __atomic_store_8
157
+ ; PPC32-NEXT: lwz r0, 20(r1)
158
+ ; PPC32-NEXT: addi r1, r1, 16
159
+ ; PPC32-NEXT: mtlr r0
160
+ ; PPC32-NEXT: blr
161
+ ;
162
+ ; PPC64-LABEL: store_x_i64_unordered:
163
+ ; PPC64: # %bb.0:
164
+ ; PPC64-NEXT: lis r4, 10
165
+ ; PPC64-NEXT: ori r4, r4, 64640
166
+ ; PPC64-NEXT: li r5, 42
167
+ ; PPC64-NEXT: stdx r5, r3, r4
168
+ ; PPC64-NEXT: blr
83
169
%ptr = getelementptr inbounds [100000 x i64 ], [100000 x i64 ]* %mem , i64 0 , i64 90000
84
170
store atomic i64 42 , i64* %ptr unordered , align 8
85
171
ret void
0 commit comments