|
4 | 4 |
|
5 | 5 | define noundef i32 @test_firstbithigh_ushort(i16 noundef %a) {
|
6 | 6 | entry:
|
7 |
| -; CHECK: call i32 @dx.op.unaryBits.i16(i32 33, i16 %{{.*}}) #[[#ATTR:]] |
| 7 | +; CHECK: call i32 @dx.op.unaryBits.i16(i32 33, i16 %{{.*}}) |
8 | 8 | %elt.firstbithigh = call i32 @llvm.dx.firstbituhigh.i16(i16 %a)
|
9 | 9 | ret i32 %elt.firstbithigh
|
10 | 10 | }
|
11 | 11 |
|
12 | 12 | define noundef i32 @test_firstbithigh_short(i16 noundef %a) {
|
13 | 13 | entry:
|
14 |
| -; CHECK: call i32 @dx.op.unaryBits.i16(i32 34, i16 %{{.*}}) #[[#ATTR]] |
| 14 | +; CHECK: call i32 @dx.op.unaryBits.i16(i32 34, i16 %{{.*}}) |
15 | 15 | %elt.firstbithigh = call i32 @llvm.dx.firstbitshigh.i16(i16 %a)
|
16 | 16 | ret i32 %elt.firstbithigh
|
17 | 17 | }
|
18 | 18 |
|
19 | 19 | define noundef i32 @test_firstbithigh_uint(i32 noundef %a) {
|
20 | 20 | entry:
|
21 |
| -; CHECK: call i32 @dx.op.unaryBits.i32(i32 33, i32 %{{.*}}) #[[#ATTR]] |
| 21 | +; CHECK: call i32 @dx.op.unaryBits.i32(i32 33, i32 %{{.*}}) |
22 | 22 | %elt.firstbithigh = call i32 @llvm.dx.firstbituhigh.i32(i32 %a)
|
23 | 23 | ret i32 %elt.firstbithigh
|
24 | 24 | }
|
25 | 25 |
|
26 | 26 | define noundef i32 @test_firstbithigh_int(i32 noundef %a) {
|
27 | 27 | entry:
|
28 |
| -; CHECK: call i32 @dx.op.unaryBits.i32(i32 34, i32 %{{.*}}) #[[#ATTR]] |
| 28 | +; CHECK: call i32 @dx.op.unaryBits.i32(i32 34, i32 %{{.*}}) |
29 | 29 | %elt.firstbithigh = call i32 @llvm.dx.firstbitshigh.i32(i32 %a)
|
30 | 30 | ret i32 %elt.firstbithigh
|
31 | 31 | }
|
32 | 32 |
|
33 | 33 | define noundef i32 @test_firstbithigh_ulong(i64 noundef %a) {
|
34 | 34 | entry:
|
35 |
| -; CHECK: call i32 @dx.op.unaryBits.i64(i32 33, i64 %{{.*}}) #[[#ATTR]] |
| 35 | +; CHECK: call i32 @dx.op.unaryBits.i64(i32 33, i64 %{{.*}}) |
36 | 36 | %elt.firstbithigh = call i32 @llvm.dx.firstbituhigh.i64(i64 %a)
|
37 | 37 | ret i32 %elt.firstbithigh
|
38 | 38 | }
|
39 | 39 |
|
40 | 40 | define noundef i32 @test_firstbithigh_long(i64 noundef %a) {
|
41 | 41 | entry:
|
42 |
| -; CHECK: call i32 @dx.op.unaryBits.i64(i32 34, i64 %{{.*}}) #[[#ATTR]] |
| 42 | +; CHECK: call i32 @dx.op.unaryBits.i64(i32 34, i64 %{{.*}}) |
43 | 43 | %elt.firstbithigh = call i32 @llvm.dx.firstbitshigh.i64(i64 %a)
|
44 | 44 | ret i32 %elt.firstbithigh
|
45 | 45 | }
|
46 | 46 |
|
47 | 47 | define noundef <4 x i32> @test_firstbituhigh_vec4_i32(<4 x i32> noundef %a) {
|
48 | 48 | entry:
|
49 | 49 | ; CHECK: [[ee0:%.*]] = extractelement <4 x i32> %a, i64 0
|
50 |
| - ; CHECK: [[ie0:%.*]] = call i32 @dx.op.unaryBits.i32(i32 33, i32 [[ee0]]) #[[#ATTR]] |
| 50 | + ; CHECK: [[ie0:%.*]] = call i32 @dx.op.unaryBits.i32(i32 33, i32 [[ee0]]) |
51 | 51 | ; CHECK: [[ee1:%.*]] = extractelement <4 x i32> %a, i64 1
|
52 |
| - ; CHECK: [[ie1:%.*]] = call i32 @dx.op.unaryBits.i32(i32 33, i32 [[ee1]]) #[[#ATTR]] |
| 52 | + ; CHECK: [[ie1:%.*]] = call i32 @dx.op.unaryBits.i32(i32 33, i32 [[ee1]]) |
53 | 53 | ; CHECK: [[ee2:%.*]] = extractelement <4 x i32> %a, i64 2
|
54 |
| - ; CHECK: [[ie2:%.*]] = call i32 @dx.op.unaryBits.i32(i32 33, i32 [[ee2]]) #[[#ATTR]] |
| 54 | + ; CHECK: [[ie2:%.*]] = call i32 @dx.op.unaryBits.i32(i32 33, i32 [[ee2]]) |
55 | 55 | ; CHECK: [[ee3:%.*]] = extractelement <4 x i32> %a, i64 3
|
56 |
| - ; CHECK: [[ie3:%.*]] = call i32 @dx.op.unaryBits.i32(i32 33, i32 [[ee3]]) #[[#ATTR]] |
57 |
| - ; CHECK: insertelement <4 x i32> poison, i32 [[ie0]], i64 0 |
58 |
| - ; CHECK: insertelement <4 x i32> %{{.*}}, i32 [[ie1]], i64 1 |
59 |
| - ; CHECK: insertelement <4 x i32> %{{.*}}, i32 [[ie2]], i64 2 |
60 |
| - ; CHECK: insertelement <4 x i32> %{{.*}}, i32 [[ie3]], i64 3 |
| 56 | + ; CHECK: [[ie3:%.*]] = call i32 @dx.op.unaryBits.i32(i32 33, i32 [[ee3]]) |
| 57 | + ; CHECK: [[rt0:%.*]] = insertelement <4 x i32> poison, i32 [[ie0]], i64 0 |
| 58 | + ; CHECK: [[rt1:%.*]] = insertelement <4 x i32> [[rt0]], i32 [[ie1]], i64 1 |
| 59 | + ; CHECK: [[rt2:%.*]] = insertelement <4 x i32> [[rt1]], i32 [[ie2]], i64 2 |
| 60 | + ; CHECK: [[rt3:%.*]] = insertelement <4 x i32> [[rt2]], i32 [[ie3]], i64 3 |
| 61 | + ; CHECK: ret <4 x i32> [[rt3]] |
61 | 62 | %2 = call <4 x i32> @llvm.dx.firstbituhigh.v4i32(<4 x i32> %a)
|
62 | 63 | ret <4 x i32> %2
|
63 | 64 | }
|
64 | 65 |
|
65 | 66 | define noundef <4 x i32> @test_firstbitshigh_vec4_i32(<4 x i32> noundef %a) {
|
66 | 67 | entry:
|
67 | 68 | ; CHECK: [[ee0:%.*]] = extractelement <4 x i32> %a, i64 0
|
68 |
| - ; CHECK: [[ie0:%.*]] = call i32 @dx.op.unaryBits.i32(i32 34, i32 [[ee0]]) #[[#ATTR]] |
| 69 | + ; CHECK: [[ie0:%.*]] = call i32 @dx.op.unaryBits.i32(i32 34, i32 [[ee0]]) |
69 | 70 | ; CHECK: [[ee1:%.*]] = extractelement <4 x i32> %a, i64 1
|
70 |
| - ; CHECK: [[ie1:%.*]] = call i32 @dx.op.unaryBits.i32(i32 34, i32 [[ee1]]) #[[#ATTR]] |
| 71 | + ; CHECK: [[ie1:%.*]] = call i32 @dx.op.unaryBits.i32(i32 34, i32 [[ee1]]) |
71 | 72 | ; CHECK: [[ee2:%.*]] = extractelement <4 x i32> %a, i64 2
|
72 |
| - ; CHECK: [[ie2:%.*]] = call i32 @dx.op.unaryBits.i32(i32 34, i32 [[ee2]]) #[[#ATTR]] |
| 73 | + ; CHECK: [[ie2:%.*]] = call i32 @dx.op.unaryBits.i32(i32 34, i32 [[ee2]]) |
73 | 74 | ; CHECK: [[ee3:%.*]] = extractelement <4 x i32> %a, i64 3
|
74 |
| - ; CHECK: [[ie3:%.*]] = call i32 @dx.op.unaryBits.i32(i32 34, i32 [[ee3]]) #[[#ATTR]] |
75 |
| - ; CHECK: insertelement <4 x i32> poison, i32 [[ie0]], i64 0 |
76 |
| - ; CHECK: insertelement <4 x i32> %{{.*}}, i32 [[ie1]], i64 1 |
77 |
| - ; CHECK: insertelement <4 x i32> %{{.*}}, i32 [[ie2]], i64 2 |
78 |
| - ; CHECK: insertelement <4 x i32> %{{.*}}, i32 [[ie3]], i64 3 |
| 75 | + ; CHECK: [[ie3:%.*]] = call i32 @dx.op.unaryBits.i32(i32 34, i32 [[ee3]]) |
| 76 | + ; CHECK: [[rt0:%.*]] = insertelement <4 x i32> poison, i32 [[ie0]], i64 0 |
| 77 | + ; CHECK: [[rt1:%.*]] = insertelement <4 x i32> [[rt0]], i32 [[ie1]], i64 1 |
| 78 | + ; CHECK: [[rt2:%.*]] = insertelement <4 x i32> [[rt1]], i32 [[ie2]], i64 2 |
| 79 | + ; CHECK: [[rt3:%.*]] = insertelement <4 x i32> [[rt2]], i32 [[ie3]], i64 3 |
| 80 | + ; CHECK: ret <4 x i32> [[rt3]] |
79 | 81 | %2 = call <4 x i32> @llvm.dx.firstbitshigh.v4i32(<4 x i32> %a)
|
80 | 82 | ret <4 x i32> %2
|
81 | 83 | }
|
82 | 84 |
|
83 |
| -; CHECK: attributes #[[#ATTR]] = {{{.*}} memory(none) {{.*}}} |
84 |
| - |
85 |
| -declare i32 @llvm.dx.firstbituhigh.i16(i16) |
86 |
| -declare i32 @llvm.dx.firstbituhigh.i32(i32) |
87 |
| -declare i32 @llvm.dx.firstbituhigh.i64(i64) |
88 |
| -declare <4 x i32> @llvm.dx.firstbituhigh.v4i32(<4 x i32>) |
| 85 | +define noundef <4 x i32> @test_firstbituhigh_vec4_i16(<4 x i16> noundef %a) { |
| 86 | +entry: |
| 87 | + ; CHECK: [[ee0:%.*]] = extractelement <4 x i16> %a, i64 0 |
| 88 | + ; CHECK: [[ie0:%.*]] = call i32 @dx.op.unaryBits.i16(i32 33, i16 [[ee0]]) |
| 89 | + ; CHECK: [[ee1:%.*]] = extractelement <4 x i16> %a, i64 1 |
| 90 | + ; CHECK: [[ie1:%.*]] = call i32 @dx.op.unaryBits.i16(i32 33, i16 [[ee1]]) |
| 91 | + ; CHECK: [[ee2:%.*]] = extractelement <4 x i16> %a, i64 2 |
| 92 | + ; CHECK: [[ie2:%.*]] = call i32 @dx.op.unaryBits.i16(i32 33, i16 [[ee2]]) |
| 93 | + ; CHECK: [[ee3:%.*]] = extractelement <4 x i16> %a, i64 3 |
| 94 | + ; CHECK: [[ie3:%.*]] = call i32 @dx.op.unaryBits.i16(i32 33, i16 [[ee3]]) |
| 95 | + ; CHECK: [[rt0:%.*]] = insertelement <4 x i32> poison, i32 [[ie0]], i64 0 |
| 96 | + ; CHECK: [[rt1:%.*]] = insertelement <4 x i32> [[rt0]], i32 [[ie1]], i64 1 |
| 97 | + ; CHECK: [[rt2:%.*]] = insertelement <4 x i32> [[rt1]], i32 [[ie2]], i64 2 |
| 98 | + ; CHECK: [[rt3:%.*]] = insertelement <4 x i32> [[rt2]], i32 [[ie3]], i64 3 |
| 99 | + ; CHECK: ret <4 x i32> [[rt3]] |
| 100 | + %2 = call <4 x i32> @llvm.dx.firstbituhigh.v4i16(<4 x i16> %a) |
| 101 | + ret <4 x i32> %2 |
| 102 | +} |
89 | 103 |
|
90 |
| -declare i32 @llvm.dx.firstbitshigh.i16(i16) |
91 |
| -declare i32 @llvm.dx.firstbitshigh.i32(i32) |
92 |
| -declare i32 @llvm.dx.firstbitshigh.i64(i64) |
93 |
| -declare <4 x i32> @llvm.dx.firstbitshigh.v4i32(<4 x i32>) |
| 104 | +define noundef <4 x i32> @test_firstbitshigh_vec4_i16(<4 x i16> noundef %a) { |
| 105 | +entry: |
| 106 | + ; CHECK: [[ee0:%.*]] = extractelement <4 x i16> %a, i64 0 |
| 107 | + ; CHECK: [[ie0:%.*]] = call i32 @dx.op.unaryBits.i16(i32 34, i16 [[ee0]]) |
| 108 | + ; CHECK: [[ee1:%.*]] = extractelement <4 x i16> %a, i64 1 |
| 109 | + ; CHECK: [[ie1:%.*]] = call i32 @dx.op.unaryBits.i16(i32 34, i16 [[ee1]]) |
| 110 | + ; CHECK: [[ee2:%.*]] = extractelement <4 x i16> %a, i64 2 |
| 111 | + ; CHECK: [[ie2:%.*]] = call i32 @dx.op.unaryBits.i16(i32 34, i16 [[ee2]]) |
| 112 | + ; CHECK: [[ee3:%.*]] = extractelement <4 x i16> %a, i64 3 |
| 113 | + ; CHECK: [[ie3:%.*]] = call i32 @dx.op.unaryBits.i16(i32 34, i16 [[ee3]]) |
| 114 | + ; CHECK: [[rt0:%.*]] = insertelement <4 x i32> poison, i32 [[ie0]], i64 0 |
| 115 | + ; CHECK: [[rt1:%.*]] = insertelement <4 x i32> [[rt0]], i32 [[ie1]], i64 1 |
| 116 | + ; CHECK: [[rt2:%.*]] = insertelement <4 x i32> [[rt1]], i32 [[ie2]], i64 2 |
| 117 | + ; CHECK: [[rt3:%.*]] = insertelement <4 x i32> [[rt2]], i32 [[ie3]], i64 3 |
| 118 | + ; CHECK: ret <4 x i32> [[rt3]] |
| 119 | + %2 = call <4 x i32> @llvm.dx.firstbitshigh.v4i16(<4 x i16> %a) |
| 120 | + ret <4 x i32> %2 |
| 121 | +} |
0 commit comments