Skip to content

Commit 5ff310e

Browse files
committed
GlobalISel: Add basic legalization for G_BITREVERSE
llvm-svn: 370979
1 parent 56e9b60 commit 5ff310e

File tree

3 files changed

+177
-1
lines changed

3 files changed

+177
-1
lines changed

llvm/lib/CodeGen/GlobalISel/LegalizerHelper.cpp

Lines changed: 19 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1470,6 +1470,24 @@ LegalizerHelper::widenScalar(MachineInstr &MI, unsigned TypeIdx, LLT WideTy) {
14701470
Observer.changedInstr(MI);
14711471
return Legalized;
14721472
}
1473+
case TargetOpcode::G_BITREVERSE: {
1474+
Observer.changingInstr(MI);
1475+
1476+
Register DstReg = MI.getOperand(0).getReg();
1477+
LLT Ty = MRI.getType(DstReg);
1478+
unsigned DiffBits = WideTy.getScalarSizeInBits() - Ty.getScalarSizeInBits();
1479+
1480+
Register DstExt = MRI.createGenericVirtualRegister(WideTy);
1481+
widenScalarSrc(MI, WideTy, 1, TargetOpcode::G_ANYEXT);
1482+
MI.getOperand(0).setReg(DstExt);
1483+
MIRBuilder.setInsertPt(MIRBuilder.getMBB(), ++MIRBuilder.getInsertPt());
1484+
1485+
auto ShiftAmt = MIRBuilder.buildConstant(WideTy, DiffBits);
1486+
auto Shift = MIRBuilder.buildLShr(WideTy, DstExt, ShiftAmt);
1487+
MIRBuilder.buildTrunc(DstReg, Shift);
1488+
Observer.changedInstr(MI);
1489+
return Legalized;
1490+
}
14731491
case TargetOpcode::G_ADD:
14741492
case TargetOpcode::G_AND:
14751493
case TargetOpcode::G_MUL:
@@ -2826,6 +2844,7 @@ LegalizerHelper::fewerElementsVector(MachineInstr &MI, unsigned TypeIdx,
28262844
case G_FSIN:
28272845
case G_FSQRT:
28282846
case G_BSWAP:
2847+
case G_BITREVERSE:
28292848
case G_SDIV:
28302849
case G_SMIN:
28312850
case G_SMAX:

llvm/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -433,7 +433,7 @@ AMDGPULegalizerInfo::AMDGPULegalizerInfo(const GCNSubtarget &ST_,
433433
.widenScalarToNextPow2(1, 32);
434434

435435
// TODO: Expand for > s32
436-
getActionDefinitionsBuilder(G_BSWAP)
436+
getActionDefinitionsBuilder({G_BSWAP, G_BITREVERSE})
437437
.legalFor({S32})
438438
.clampScalar(0, S32, S32)
439439
.scalarize(0);
Lines changed: 157 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,157 @@
1+
# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
2+
# RUN: llc -mtriple=amdgcn-mesa-mesa3d -mcpu=fiji -O0 -run-pass=legalizer -global-isel-abort=0 %s -o - | FileCheck %s
3+
4+
---
5+
name: bitreverse_s8
6+
7+
body: |
8+
bb.0:
9+
liveins: $vgpr0
10+
; CHECK-LABEL: name: bitreverse_s8
11+
; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
12+
; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[COPY]](s32)
13+
; CHECK: [[BITREVERSE:%[0-9]+]]:_(s32) = G_BITREVERSE [[COPY1]]
14+
; CHECK: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 24
15+
; CHECK: [[LSHR:%[0-9]+]]:_(s32) = G_LSHR [[BITREVERSE]], [[C]](s32)
16+
; CHECK: [[COPY2:%[0-9]+]]:_(s32) = COPY [[LSHR]](s32)
17+
; CHECK: $vgpr0 = COPY [[COPY2]](s32)
18+
%0:_(s32) = COPY $vgpr0
19+
%1:_(s8) = G_TRUNC %0
20+
%2:_(s8) = G_BITREVERSE %1
21+
%3:_(s32) = G_ANYEXT %2
22+
$vgpr0 = COPY %3
23+
...
24+
25+
---
26+
name: bitreverse_s16
27+
28+
body: |
29+
bb.0:
30+
liveins: $vgpr0
31+
; CHECK-LABEL: name: bitreverse_s16
32+
; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
33+
; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[COPY]](s32)
34+
; CHECK: [[BITREVERSE:%[0-9]+]]:_(s32) = G_BITREVERSE [[COPY1]]
35+
; CHECK: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 16
36+
; CHECK: [[LSHR:%[0-9]+]]:_(s32) = G_LSHR [[BITREVERSE]], [[C]](s32)
37+
; CHECK: [[COPY2:%[0-9]+]]:_(s32) = COPY [[LSHR]](s32)
38+
; CHECK: $vgpr0 = COPY [[COPY2]](s32)
39+
%0:_(s32) = COPY $vgpr0
40+
%1:_(s16) = G_TRUNC %0
41+
%2:_(s16) = G_BITREVERSE %1
42+
%3:_(s32) = G_ANYEXT %2
43+
$vgpr0 = COPY %3
44+
...
45+
46+
---
47+
name: bitreverse_s24
48+
49+
body: |
50+
bb.0:
51+
liveins: $vgpr0
52+
; CHECK-LABEL: name: bitreverse_s24
53+
; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
54+
; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[COPY]](s32)
55+
; CHECK: [[BITREVERSE:%[0-9]+]]:_(s32) = G_BITREVERSE [[COPY1]]
56+
; CHECK: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 8
57+
; CHECK: [[LSHR:%[0-9]+]]:_(s32) = G_LSHR [[BITREVERSE]], [[C]](s32)
58+
; CHECK: [[COPY2:%[0-9]+]]:_(s32) = COPY [[LSHR]](s32)
59+
; CHECK: $vgpr0 = COPY [[COPY2]](s32)
60+
%0:_(s32) = COPY $vgpr0
61+
%1:_(s24) = G_TRUNC %0
62+
%2:_(s24) = G_BITREVERSE %1
63+
%3:_(s32) = G_ANYEXT %2
64+
$vgpr0 = COPY %3
65+
...
66+
67+
---
68+
name: bitreverse_s32
69+
70+
body: |
71+
bb.0:
72+
liveins: $vgpr0
73+
; CHECK-LABEL: name: bitreverse_s32
74+
; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
75+
; CHECK: [[BITREVERSE:%[0-9]+]]:_(s32) = G_BITREVERSE [[COPY]]
76+
; CHECK: $vgpr0 = COPY [[BITREVERSE]](s32)
77+
%0:_(s32) = COPY $vgpr0
78+
%1:_(s32) = G_BITREVERSE %0
79+
$vgpr0 = COPY %1
80+
...
81+
82+
---
83+
name: bitreverse_v2s16
84+
85+
body: |
86+
bb.0:
87+
liveins: $vgpr0
88+
; CHECK-LABEL: name: bitreverse_v2s16
89+
; CHECK: [[COPY:%[0-9]+]]:_(<2 x s16>) = COPY $vgpr0
90+
; CHECK: [[BITCAST:%[0-9]+]]:_(s32) = G_BITCAST [[COPY]](<2 x s16>)
91+
; CHECK: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 16
92+
; CHECK: [[LSHR:%[0-9]+]]:_(s32) = G_LSHR [[BITCAST]], [[C]](s32)
93+
; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[BITCAST]](s32)
94+
; CHECK: [[BITREVERSE:%[0-9]+]]:_(s32) = G_BITREVERSE [[COPY1]]
95+
; CHECK: [[LSHR1:%[0-9]+]]:_(s32) = G_LSHR [[BITREVERSE]], [[C]](s32)
96+
; CHECK: [[TRUNC:%[0-9]+]]:_(s16) = G_TRUNC [[LSHR1]](s32)
97+
; CHECK: [[COPY2:%[0-9]+]]:_(s32) = COPY [[LSHR]](s32)
98+
; CHECK: [[BITREVERSE1:%[0-9]+]]:_(s32) = G_BITREVERSE [[COPY2]]
99+
; CHECK: [[LSHR2:%[0-9]+]]:_(s32) = G_LSHR [[BITREVERSE1]], [[C]](s32)
100+
; CHECK: [[TRUNC1:%[0-9]+]]:_(s16) = G_TRUNC [[LSHR2]](s32)
101+
; CHECK: [[BUILD_VECTOR:%[0-9]+]]:_(<2 x s16>) = G_BUILD_VECTOR [[TRUNC]](s16), [[TRUNC1]](s16)
102+
; CHECK: $vgpr0 = COPY [[BUILD_VECTOR]](<2 x s16>)
103+
%0:_(<2 x s16>) = COPY $vgpr0
104+
%1:_(<2 x s16>) = G_BITREVERSE %0
105+
$vgpr0 = COPY %1
106+
...
107+
108+
---
109+
name: bitreverse_v2s32
110+
111+
body: |
112+
bb.0:
113+
liveins: $vgpr0_vgpr1
114+
; CHECK-LABEL: name: bitreverse_v2s32
115+
; CHECK: [[COPY:%[0-9]+]]:_(<2 x s32>) = COPY $vgpr0_vgpr1
116+
; CHECK: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[COPY]](<2 x s32>)
117+
; CHECK: [[BITREVERSE:%[0-9]+]]:_(s32) = G_BITREVERSE [[UV]]
118+
; CHECK: [[BITREVERSE1:%[0-9]+]]:_(s32) = G_BITREVERSE [[UV1]]
119+
; CHECK: [[BUILD_VECTOR:%[0-9]+]]:_(<2 x s32>) = G_BUILD_VECTOR [[BITREVERSE]](s32), [[BITREVERSE1]](s32)
120+
; CHECK: $vgpr0_vgpr1 = COPY [[BUILD_VECTOR]](<2 x s32>)
121+
%0:_(<2 x s32>) = COPY $vgpr0_vgpr1
122+
%1:_(<2 x s32>) = G_BITREVERSE %0
123+
$vgpr0_vgpr1 = COPY %1
124+
...
125+
126+
---
127+
name: bitreverse_s64
128+
129+
body: |
130+
bb.0:
131+
liveins: $vgpr0_vgpr1
132+
; CHECK-LABEL: name: bitreverse_s64
133+
; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $vgpr0_vgpr1
134+
; CHECK: [[BITREVERSE:%[0-9]+]]:_(s64) = G_BITREVERSE [[COPY]]
135+
; CHECK: $vgpr0_vgpr1 = COPY [[BITREVERSE]](s64)
136+
%0:_(s64) = COPY $vgpr0_vgpr1
137+
%1:_(s64) = G_BITREVERSE %0
138+
$vgpr0_vgpr1 = COPY %1
139+
...
140+
141+
---
142+
name: bitreverse_v2s64
143+
144+
body: |
145+
bb.0:
146+
liveins: $vgpr0_vgpr1_vgpr2_vgpr3
147+
; CHECK-LABEL: name: bitreverse_v2s64
148+
; CHECK: [[COPY:%[0-9]+]]:_(<2 x s64>) = COPY $vgpr0_vgpr1_vgpr2_vgpr3
149+
; CHECK: [[UV:%[0-9]+]]:_(s64), [[UV1:%[0-9]+]]:_(s64) = G_UNMERGE_VALUES [[COPY]](<2 x s64>)
150+
; CHECK: [[BITREVERSE:%[0-9]+]]:_(s64) = G_BITREVERSE [[UV]]
151+
; CHECK: [[BITREVERSE1:%[0-9]+]]:_(s64) = G_BITREVERSE [[UV1]]
152+
; CHECK: [[BUILD_VECTOR:%[0-9]+]]:_(<2 x s64>) = G_BUILD_VECTOR [[BITREVERSE]](s64), [[BITREVERSE1]](s64)
153+
; CHECK: $vgpr0_vgpr1_vgpr2_vgpr3 = COPY [[BUILD_VECTOR]](<2 x s64>)
154+
%0:_(<2 x s64>) = COPY $vgpr0_vgpr1_vgpr2_vgpr3
155+
%1:_(<2 x s64>) = G_BITREVERSE %0
156+
$vgpr0_vgpr1_vgpr2_vgpr3 = COPY %1
157+
...

0 commit comments

Comments
 (0)