|
1 | 1 | ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
2 | 2 | ; RUN: llc -mtriple=riscv32 -relocation-model=pic -verify-machineinstrs < %s \
|
3 |
| -; RUN: | FileCheck -check-prefixes=RV32I %s |
| 3 | +; RUN: | FileCheck -check-prefixes=RV32I,RV32NOFUSION %s |
4 | 4 | ; RUN: llc -mtriple=riscv64 -relocation-model=pic -verify-machineinstrs < %s \
|
5 |
| -; RUN: | FileCheck -check-prefixes=RV64I %s |
| 5 | +; RUN: | FileCheck -check-prefixes=RV64I,RV64NOFUSION %s |
| 6 | +; RUN: llc -mtriple=riscv32 -relocation-model=pic -verify-machineinstrs < %s \ |
| 7 | +; RUN: -mattr=+auipc-addi-fusion | FileCheck -check-prefixes=RV32I,RV32FUSION %s |
| 8 | +; RUN: llc -mtriple=riscv64 -relocation-model=pic -verify-machineinstrs < %s \ |
| 9 | +; RUN: -mattr=+auipc-addi-fusion | FileCheck -check-prefixes=RV64I,RV64FUSION %s |
6 | 10 |
|
7 | 11 | ; Verifies that MachineLICM can hoist address generation pseudos out of loops.
|
8 | 12 |
|
@@ -141,59 +145,113 @@ ret:
|
141 | 145 | @gd = external thread_local global i32
|
142 | 146 |
|
143 | 147 | define void @test_la_tls_gd(i32 signext %n) nounwind {
|
144 |
| -; RV32I-LABEL: test_la_tls_gd: |
145 |
| -; RV32I: # %bb.0: # %entry |
146 |
| -; RV32I-NEXT: addi sp, sp, -16 |
147 |
| -; RV32I-NEXT: sw ra, 12(sp) # 4-byte Folded Spill |
148 |
| -; RV32I-NEXT: sw s0, 8(sp) # 4-byte Folded Spill |
149 |
| -; RV32I-NEXT: sw s1, 4(sp) # 4-byte Folded Spill |
150 |
| -; RV32I-NEXT: sw s2, 0(sp) # 4-byte Folded Spill |
151 |
| -; RV32I-NEXT: mv s0, a0 |
152 |
| -; RV32I-NEXT: li s2, 0 |
153 |
| -; RV32I-NEXT: .Lpcrel_hi3: |
154 |
| -; RV32I-NEXT: auipc a0, %tls_gd_pcrel_hi(gd) |
155 |
| -; RV32I-NEXT: addi s1, a0, %pcrel_lo(.Lpcrel_hi3) |
156 |
| -; RV32I-NEXT: .LBB3_1: # %loop |
157 |
| -; RV32I-NEXT: # =>This Inner Loop Header: Depth=1 |
158 |
| -; RV32I-NEXT: mv a0, s1 |
159 |
| -; RV32I-NEXT: call __tls_get_addr |
160 |
| -; RV32I-NEXT: lw zero, 0(a0) |
161 |
| -; RV32I-NEXT: addi s2, s2, 1 |
162 |
| -; RV32I-NEXT: blt s2, s0, .LBB3_1 |
163 |
| -; RV32I-NEXT: # %bb.2: # %ret |
164 |
| -; RV32I-NEXT: lw ra, 12(sp) # 4-byte Folded Reload |
165 |
| -; RV32I-NEXT: lw s0, 8(sp) # 4-byte Folded Reload |
166 |
| -; RV32I-NEXT: lw s1, 4(sp) # 4-byte Folded Reload |
167 |
| -; RV32I-NEXT: lw s2, 0(sp) # 4-byte Folded Reload |
168 |
| -; RV32I-NEXT: addi sp, sp, 16 |
169 |
| -; RV32I-NEXT: ret |
| 148 | +; RV32NOFUSION-LABEL: test_la_tls_gd: |
| 149 | +; RV32NOFUSION: # %bb.0: # %entry |
| 150 | +; RV32NOFUSION-NEXT: addi sp, sp, -16 |
| 151 | +; RV32NOFUSION-NEXT: sw ra, 12(sp) # 4-byte Folded Spill |
| 152 | +; RV32NOFUSION-NEXT: sw s0, 8(sp) # 4-byte Folded Spill |
| 153 | +; RV32NOFUSION-NEXT: sw s1, 4(sp) # 4-byte Folded Spill |
| 154 | +; RV32NOFUSION-NEXT: sw s2, 0(sp) # 4-byte Folded Spill |
| 155 | +; RV32NOFUSION-NEXT: mv s0, a0 |
| 156 | +; RV32NOFUSION-NEXT: li s2, 0 |
| 157 | +; RV32NOFUSION-NEXT: .Lpcrel_hi3: |
| 158 | +; RV32NOFUSION-NEXT: auipc a0, %tls_gd_pcrel_hi(gd) |
| 159 | +; RV32NOFUSION-NEXT: addi s1, a0, %pcrel_lo(.Lpcrel_hi3) |
| 160 | +; RV32NOFUSION-NEXT: .LBB3_1: # %loop |
| 161 | +; RV32NOFUSION-NEXT: # =>This Inner Loop Header: Depth=1 |
| 162 | +; RV32NOFUSION-NEXT: mv a0, s1 |
| 163 | +; RV32NOFUSION-NEXT: call __tls_get_addr |
| 164 | +; RV32NOFUSION-NEXT: lw zero, 0(a0) |
| 165 | +; RV32NOFUSION-NEXT: addi s2, s2, 1 |
| 166 | +; RV32NOFUSION-NEXT: blt s2, s0, .LBB3_1 |
| 167 | +; RV32NOFUSION-NEXT: # %bb.2: # %ret |
| 168 | +; RV32NOFUSION-NEXT: lw ra, 12(sp) # 4-byte Folded Reload |
| 169 | +; RV32NOFUSION-NEXT: lw s0, 8(sp) # 4-byte Folded Reload |
| 170 | +; RV32NOFUSION-NEXT: lw s1, 4(sp) # 4-byte Folded Reload |
| 171 | +; RV32NOFUSION-NEXT: lw s2, 0(sp) # 4-byte Folded Reload |
| 172 | +; RV32NOFUSION-NEXT: addi sp, sp, 16 |
| 173 | +; RV32NOFUSION-NEXT: ret |
170 | 174 | ;
|
171 |
| -; RV64I-LABEL: test_la_tls_gd: |
172 |
| -; RV64I: # %bb.0: # %entry |
173 |
| -; RV64I-NEXT: addi sp, sp, -32 |
174 |
| -; RV64I-NEXT: sd ra, 24(sp) # 8-byte Folded Spill |
175 |
| -; RV64I-NEXT: sd s0, 16(sp) # 8-byte Folded Spill |
176 |
| -; RV64I-NEXT: sd s1, 8(sp) # 8-byte Folded Spill |
177 |
| -; RV64I-NEXT: sd s2, 0(sp) # 8-byte Folded Spill |
178 |
| -; RV64I-NEXT: mv s0, a0 |
179 |
| -; RV64I-NEXT: li s2, 0 |
180 |
| -; RV64I-NEXT: .Lpcrel_hi3: |
181 |
| -; RV64I-NEXT: auipc a0, %tls_gd_pcrel_hi(gd) |
182 |
| -; RV64I-NEXT: addi s1, a0, %pcrel_lo(.Lpcrel_hi3) |
183 |
| -; RV64I-NEXT: .LBB3_1: # %loop |
184 |
| -; RV64I-NEXT: # =>This Inner Loop Header: Depth=1 |
185 |
| -; RV64I-NEXT: mv a0, s1 |
186 |
| -; RV64I-NEXT: call __tls_get_addr |
187 |
| -; RV64I-NEXT: lw zero, 0(a0) |
188 |
| -; RV64I-NEXT: addiw s2, s2, 1 |
189 |
| -; RV64I-NEXT: blt s2, s0, .LBB3_1 |
190 |
| -; RV64I-NEXT: # %bb.2: # %ret |
191 |
| -; RV64I-NEXT: ld ra, 24(sp) # 8-byte Folded Reload |
192 |
| -; RV64I-NEXT: ld s0, 16(sp) # 8-byte Folded Reload |
193 |
| -; RV64I-NEXT: ld s1, 8(sp) # 8-byte Folded Reload |
194 |
| -; RV64I-NEXT: ld s2, 0(sp) # 8-byte Folded Reload |
195 |
| -; RV64I-NEXT: addi sp, sp, 32 |
196 |
| -; RV64I-NEXT: ret |
| 175 | +; RV64NOFUSION-LABEL: test_la_tls_gd: |
| 176 | +; RV64NOFUSION: # %bb.0: # %entry |
| 177 | +; RV64NOFUSION-NEXT: addi sp, sp, -32 |
| 178 | +; RV64NOFUSION-NEXT: sd ra, 24(sp) # 8-byte Folded Spill |
| 179 | +; RV64NOFUSION-NEXT: sd s0, 16(sp) # 8-byte Folded Spill |
| 180 | +; RV64NOFUSION-NEXT: sd s1, 8(sp) # 8-byte Folded Spill |
| 181 | +; RV64NOFUSION-NEXT: sd s2, 0(sp) # 8-byte Folded Spill |
| 182 | +; RV64NOFUSION-NEXT: mv s0, a0 |
| 183 | +; RV64NOFUSION-NEXT: li s2, 0 |
| 184 | +; RV64NOFUSION-NEXT: .Lpcrel_hi3: |
| 185 | +; RV64NOFUSION-NEXT: auipc a0, %tls_gd_pcrel_hi(gd) |
| 186 | +; RV64NOFUSION-NEXT: addi s1, a0, %pcrel_lo(.Lpcrel_hi3) |
| 187 | +; RV64NOFUSION-NEXT: .LBB3_1: # %loop |
| 188 | +; RV64NOFUSION-NEXT: # =>This Inner Loop Header: Depth=1 |
| 189 | +; RV64NOFUSION-NEXT: mv a0, s1 |
| 190 | +; RV64NOFUSION-NEXT: call __tls_get_addr |
| 191 | +; RV64NOFUSION-NEXT: lw zero, 0(a0) |
| 192 | +; RV64NOFUSION-NEXT: addiw s2, s2, 1 |
| 193 | +; RV64NOFUSION-NEXT: blt s2, s0, .LBB3_1 |
| 194 | +; RV64NOFUSION-NEXT: # %bb.2: # %ret |
| 195 | +; RV64NOFUSION-NEXT: ld ra, 24(sp) # 8-byte Folded Reload |
| 196 | +; RV64NOFUSION-NEXT: ld s0, 16(sp) # 8-byte Folded Reload |
| 197 | +; RV64NOFUSION-NEXT: ld s1, 8(sp) # 8-byte Folded Reload |
| 198 | +; RV64NOFUSION-NEXT: ld s2, 0(sp) # 8-byte Folded Reload |
| 199 | +; RV64NOFUSION-NEXT: addi sp, sp, 32 |
| 200 | +; RV64NOFUSION-NEXT: ret |
| 201 | +; |
| 202 | +; RV32FUSION-LABEL: test_la_tls_gd: |
| 203 | +; RV32FUSION: # %bb.0: # %entry |
| 204 | +; RV32FUSION-NEXT: addi sp, sp, -16 |
| 205 | +; RV32FUSION-NEXT: sw ra, 12(sp) # 4-byte Folded Spill |
| 206 | +; RV32FUSION-NEXT: sw s0, 8(sp) # 4-byte Folded Spill |
| 207 | +; RV32FUSION-NEXT: sw s1, 4(sp) # 4-byte Folded Spill |
| 208 | +; RV32FUSION-NEXT: sw s2, 0(sp) # 4-byte Folded Spill |
| 209 | +; RV32FUSION-NEXT: mv s0, a0 |
| 210 | +; RV32FUSION-NEXT: li s2, 0 |
| 211 | +; RV32FUSION-NEXT: .Lpcrel_hi3: |
| 212 | +; RV32FUSION-NEXT: auipc s1, %tls_gd_pcrel_hi(gd) |
| 213 | +; RV32FUSION-NEXT: addi s1, s1, %pcrel_lo(.Lpcrel_hi3) |
| 214 | +; RV32FUSION-NEXT: .LBB3_1: # %loop |
| 215 | +; RV32FUSION-NEXT: # =>This Inner Loop Header: Depth=1 |
| 216 | +; RV32FUSION-NEXT: mv a0, s1 |
| 217 | +; RV32FUSION-NEXT: call __tls_get_addr |
| 218 | +; RV32FUSION-NEXT: lw zero, 0(a0) |
| 219 | +; RV32FUSION-NEXT: addi s2, s2, 1 |
| 220 | +; RV32FUSION-NEXT: blt s2, s0, .LBB3_1 |
| 221 | +; RV32FUSION-NEXT: # %bb.2: # %ret |
| 222 | +; RV32FUSION-NEXT: lw ra, 12(sp) # 4-byte Folded Reload |
| 223 | +; RV32FUSION-NEXT: lw s0, 8(sp) # 4-byte Folded Reload |
| 224 | +; RV32FUSION-NEXT: lw s1, 4(sp) # 4-byte Folded Reload |
| 225 | +; RV32FUSION-NEXT: lw s2, 0(sp) # 4-byte Folded Reload |
| 226 | +; RV32FUSION-NEXT: addi sp, sp, 16 |
| 227 | +; RV32FUSION-NEXT: ret |
| 228 | +; |
| 229 | +; RV64FUSION-LABEL: test_la_tls_gd: |
| 230 | +; RV64FUSION: # %bb.0: # %entry |
| 231 | +; RV64FUSION-NEXT: addi sp, sp, -32 |
| 232 | +; RV64FUSION-NEXT: sd ra, 24(sp) # 8-byte Folded Spill |
| 233 | +; RV64FUSION-NEXT: sd s0, 16(sp) # 8-byte Folded Spill |
| 234 | +; RV64FUSION-NEXT: sd s1, 8(sp) # 8-byte Folded Spill |
| 235 | +; RV64FUSION-NEXT: sd s2, 0(sp) # 8-byte Folded Spill |
| 236 | +; RV64FUSION-NEXT: mv s0, a0 |
| 237 | +; RV64FUSION-NEXT: li s2, 0 |
| 238 | +; RV64FUSION-NEXT: .Lpcrel_hi3: |
| 239 | +; RV64FUSION-NEXT: auipc s1, %tls_gd_pcrel_hi(gd) |
| 240 | +; RV64FUSION-NEXT: addi s1, s1, %pcrel_lo(.Lpcrel_hi3) |
| 241 | +; RV64FUSION-NEXT: .LBB3_1: # %loop |
| 242 | +; RV64FUSION-NEXT: # =>This Inner Loop Header: Depth=1 |
| 243 | +; RV64FUSION-NEXT: mv a0, s1 |
| 244 | +; RV64FUSION-NEXT: call __tls_get_addr |
| 245 | +; RV64FUSION-NEXT: lw zero, 0(a0) |
| 246 | +; RV64FUSION-NEXT: addiw s2, s2, 1 |
| 247 | +; RV64FUSION-NEXT: blt s2, s0, .LBB3_1 |
| 248 | +; RV64FUSION-NEXT: # %bb.2: # %ret |
| 249 | +; RV64FUSION-NEXT: ld ra, 24(sp) # 8-byte Folded Reload |
| 250 | +; RV64FUSION-NEXT: ld s0, 16(sp) # 8-byte Folded Reload |
| 251 | +; RV64FUSION-NEXT: ld s1, 8(sp) # 8-byte Folded Reload |
| 252 | +; RV64FUSION-NEXT: ld s2, 0(sp) # 8-byte Folded Reload |
| 253 | +; RV64FUSION-NEXT: addi sp, sp, 32 |
| 254 | +; RV64FUSION-NEXT: ret |
197 | 255 | entry:
|
198 | 256 | br label %loop
|
199 | 257 |
|
|
0 commit comments