|
1 |
| -; RUN: llc -O0 < %s -mtriple=nvptx -mcpu=sm_20 | FileCheck %s -check-prefixes=ALL,CLS32,G32 |
2 |
| -; RUN: llc -O0 < %s -mtriple=nvptx64 -mcpu=sm_20 | FileCheck %s -check-prefixes=ALL,NOPTRCONV,CLS64,G64 |
3 |
| -; RUN: llc -O0 < %s -mtriple=nvptx64 -mcpu=sm_20 --nvptx-short-ptr| FileCheck %s -check-prefixes=ALL,PTRCONV,CLS64,G64 |
| 1 | +; RUN: llc -O0 < %s -mtriple=nvptx -mcpu=sm_20 | FileCheck %s -check-prefixes=ALL,CLS32 |
| 2 | +; RUN: llc -O0 < %s -mtriple=nvptx64 -mcpu=sm_20 | FileCheck %s -check-prefixes=ALL,NOPTRCONV,CLS64 |
| 3 | +; RUN: llc -O0 < %s -mtriple=nvptx64 -mcpu=sm_20 --nvptx-short-ptr | FileCheck %s -check-prefixes=ALL,PTRCONV,CLS64 |
4 | 4 | ; RUN: %if ptxas && !ptxas-12.0 %{ llc -O0 < %s -mtriple=nvptx -mcpu=sm_20 | %ptxas-verify %}
|
5 | 5 | ; RUN: %if ptxas %{ llc -O0 < %s -mtriple=nvptx64 -mcpu=sm_20 | %ptxas-verify %}
|
6 | 6 | ; RUN: %if ptxas %{ llc -O0 < %s -mtriple=nvptx64 -mcpu=sm_20 --nvptx-short-ptr | %ptxas-verify %}
|
7 | 7 |
|
8 | 8 | ; ALL-LABEL: conv1
|
9 | 9 | define i32 @conv1(ptr addrspace(1) %ptr) {
|
10 |
| -; G32: cvta.global.u32 |
| 10 | +; CLS32: cvta.global.u32 |
11 | 11 | ; ALL-NOT: cvt.u64.u32
|
12 |
| -; G64: cvta.global.u64 |
| 12 | +; CLS64: cvta.global.u64 |
13 | 13 | ; ALL: ld.u32
|
14 | 14 | %genptr = addrspacecast ptr addrspace(1) %ptr to ptr
|
15 | 15 | %val = load i32, ptr %genptr
|
@@ -101,13 +101,10 @@ define i32 @conv8(ptr %ptr) {
|
101 | 101 |
|
102 | 102 | ; ALL-LABEL: conv9
|
103 | 103 | define i32 @conv9(ptr addrspace(1) %ptr) {
|
104 |
| -; CLS32: cvta.global.u32 |
105 |
| -; CLS32: cvta.to.shared.u32 |
106 |
| -; CLS64: cvta.global.u64 |
107 |
| -; CLS64: cvta.to.shared.u64 |
108 |
| -; PTRCONV: cvt.u32.u64 |
109 |
| -; NOPTRCONV-NOT: cvt.u32.u64 |
110 |
| -; ALL: ld.shared.u32 |
| 104 | +; CLS32: // implicit-def: %[[ADDR:r[0-9]+]] |
| 105 | +; PTRCONV: // implicit-def: %[[ADDR:r[0-9]+]] |
| 106 | +; NOPTRCONV: // implicit-def: %[[ADDR:rd[0-9]+]] |
| 107 | +; ALL: ld.shared.u32 %r{{[0-9]+}}, [%[[ADDR]]] |
111 | 108 | %specptr = addrspacecast ptr addrspace(1) %ptr to ptr addrspace(3)
|
112 | 109 | %val = load i32, ptr addrspace(3) %specptr
|
113 | 110 | ret i32 %val
|
|
0 commit comments