Skip to content
This repository was archived by the owner on Mar 28, 2020. It is now read-only.

Commit 0b3ff9a

Browse files
committed
[ARM] MVE trunc to i1 vectors
This adds patterns for selecting trunc instructions from full vectors to i1's vectors. Differential Revision: https://reviews.llvm.org/D66201 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@368981 91177308-0d34-0410-b5e6-96231b3b80d8
1 parent c571426 commit 0b3ff9a

File tree

2 files changed

+68
-0
lines changed

2 files changed

+68
-0
lines changed

lib/Target/ARM/ARMInstrMVE.td

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -4666,6 +4666,13 @@ let Predicates = [HasMVEInt] in {
46664666
(v8i16 (MVE_VPSEL (MVE_VMOVimmi16 1), (MVE_VMOVimmi16 0), 0, VCCR:$pred))>;
46674667
def : Pat<(v4i32 (anyext (v4i1 VCCR:$pred))),
46684668
(v4i32 (MVE_VPSEL (MVE_VMOVimmi32 1), (MVE_VMOVimmi32 0), 0, VCCR:$pred))>;
4669+
4670+
def : Pat<(v16i1 (trunc (v16i8 MQPR:$v1))),
4671+
(v16i1 (MVE_VCMPi32r (v16i8 MQPR:$v1), ZR, 1))>;
4672+
def : Pat<(v8i1 (trunc (v8i16 MQPR:$v1))),
4673+
(v8i1 (MVE_VCMPi32r (v8i16 MQPR:$v1), ZR, 1))>;
4674+
def : Pat<(v4i1 (trunc (v4i32 MQPR:$v1))),
4675+
(v4i1 (MVE_VCMPi32r (v4i32 MQPR:$v1), ZR, 1))>;
46694676
}
46704677

46714678
let Predicates = [HasMVEFloat] in {

test/CodeGen/Thumb2/mve-pred-ext.ll

Lines changed: 61 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -163,6 +163,67 @@ entry:
163163
}
164164

165165

166+
define arm_aapcs_vfpcc <4 x i32> @trunc_v4i1_v4i32(<4 x i32> %src) {
167+
; CHECK-LABEL: trunc_v4i1_v4i32:
168+
; CHECK: @ %bb.0: @ %entry
169+
; CHECK-NEXT: vmov.i32 q1, #0x0
170+
; CHECK-NEXT: vcmp.i32 ne, q0, zr
171+
; CHECK-NEXT: vpsel q0, q0, q1
172+
; CHECK-NEXT: bx lr
173+
entry:
174+
%0 = trunc <4 x i32> %src to <4 x i1>
175+
%1 = select <4 x i1> %0, <4 x i32> %src, <4 x i32> zeroinitializer
176+
ret <4 x i32> %1
177+
}
178+
179+
define arm_aapcs_vfpcc <8 x i16> @trunc_v8i1_v8i16(<8 x i16> %src) {
180+
; CHECK-LABEL: trunc_v8i1_v8i16:
181+
; CHECK: @ %bb.0: @ %entry
182+
; CHECK-NEXT: vmov.i32 q1, #0x0
183+
; CHECK-NEXT: vcmp.i32 ne, q0, zr
184+
; CHECK-NEXT: vpsel q0, q0, q1
185+
; CHECK-NEXT: bx lr
186+
entry:
187+
%0 = trunc <8 x i16> %src to <8 x i1>
188+
%1 = select <8 x i1> %0, <8 x i16> %src, <8 x i16> zeroinitializer
189+
ret <8 x i16> %1
190+
}
191+
192+
define arm_aapcs_vfpcc <16 x i8> @trunc_v16i1_v16i8(<16 x i8> %src) {
193+
; CHECK-LABEL: trunc_v16i1_v16i8:
194+
; CHECK: @ %bb.0: @ %entry
195+
; CHECK-NEXT: vmov.i32 q1, #0x0
196+
; CHECK-NEXT: vcmp.i32 ne, q0, zr
197+
; CHECK-NEXT: vpsel q0, q0, q1
198+
; CHECK-NEXT: bx lr
199+
entry:
200+
%0 = trunc <16 x i8> %src to <16 x i1>
201+
%1 = select <16 x i1> %0, <16 x i8> %src, <16 x i8> zeroinitializer
202+
ret <16 x i8> %1
203+
}
204+
205+
define arm_aapcs_vfpcc <2 x i64> @trunc_v2i1_v2i64(<2 x i64> %src) {
206+
; CHECK-LABEL: trunc_v2i1_v2i64:
207+
; CHECK: @ %bb.0: @ %entry
208+
; CHECK-NEXT: vmov r1, s0
209+
; CHECK-NEXT: vmov r0, s2
210+
; CHECK-NEXT: and r1, r1, #1
211+
; CHECK-NEXT: rsbs r1, r1, #0
212+
; CHECK-NEXT: and r0, r0, #1
213+
; CHECK-NEXT: vmov.32 q1[0], r1
214+
; CHECK-NEXT: rsbs r0, r0, #0
215+
; CHECK-NEXT: vmov.32 q1[1], r1
216+
; CHECK-NEXT: vmov.32 q1[2], r0
217+
; CHECK-NEXT: vmov.32 q1[3], r0
218+
; CHECK-NEXT: vand q0, q0, q1
219+
; CHECK-NEXT: bx lr
220+
entry:
221+
%0 = trunc <2 x i64> %src to <2 x i1>
222+
%1 = select <2 x i1> %0, <2 x i64> %src, <2 x i64> zeroinitializer
223+
ret <2 x i64> %1
224+
}
225+
226+
166227
define arm_aapcs_vfpcc <4 x float> @uitofp_v4i1_v4f32(<4 x i32> %src) {
167228
; CHECK-LABEL: uitofp_v4i1_v4f32:
168229
; CHECK: @ %bb.0: @ %entry

0 commit comments

Comments
 (0)