|
| 1 | +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5 |
| 2 | +; RUN: opt -S --passes=slp-vectorizer -mtriple=x86_64-unknown-linux-gnu < %s | FileCheck %s |
| 3 | + |
| 4 | +define i16 @test(i16 %v1, i16 %v2) { |
| 5 | +; CHECK-LABEL: define i16 @test( |
| 6 | +; CHECK-SAME: i16 [[V1:%.*]], i16 [[V2:%.*]]) { |
| 7 | +; CHECK-NEXT: [[ENTRY:.*:]] |
| 8 | +; CHECK-NEXT: [[TMP0:%.*]] = insertelement <4 x i16> <i16 0, i16 0, i16 0, i16 poison>, i16 [[V2]], i32 3 |
| 9 | +; CHECK-NEXT: [[TMP1:%.*]] = insertelement <4 x i16> <i16 0, i16 0, i16 0, i16 poison>, i16 [[V1]], i32 3 |
| 10 | +; CHECK-NEXT: [[TMP2:%.*]] = or <4 x i16> [[TMP0]], [[TMP1]] |
| 11 | +; CHECK-NEXT: [[TMP3:%.*]] = and <4 x i16> [[TMP0]], [[TMP1]] |
| 12 | +; CHECK-NEXT: [[TMP4:%.*]] = shufflevector <4 x i16> [[TMP2]], <4 x i16> [[TMP3]], <4 x i32> <i32 0, i32 1, i32 2, i32 7> |
| 13 | +; CHECK-NEXT: [[TMP5:%.*]] = shufflevector <4 x i16> [[TMP1]], <4 x i16> poison, <2 x i32> <i32 0, i32 poison> |
| 14 | +; CHECK-NEXT: [[TMP6:%.*]] = insertelement <2 x i16> [[TMP5]], i16 [[V2]], i32 1 |
| 15 | +; CHECK-NEXT: [[TMP7:%.*]] = shufflevector <2 x i16> [[TMP6]], <2 x i16> poison, <4 x i32> <i32 0, i32 0, i32 0, i32 1> |
| 16 | +; CHECK-NEXT: [[TMP8:%.*]] = or <4 x i16> [[TMP7]], zeroinitializer |
| 17 | +; CHECK-NEXT: [[TMP9:%.*]] = and <4 x i16> [[TMP4]], zeroinitializer |
| 18 | +; CHECK-NEXT: [[TMP10:%.*]] = and <4 x i16> [[TMP9]], zeroinitializer |
| 19 | +; CHECK-NEXT: [[TMP11:%.*]] = icmp ne <4 x i16> [[TMP10]], zeroinitializer |
| 20 | +; CHECK-NEXT: [[TMP12:%.*]] = or <4 x i1> [[TMP11]], zeroinitializer |
| 21 | +; CHECK-NEXT: [[TMP13:%.*]] = or <4 x i16> [[TMP8]], zeroinitializer |
| 22 | +; CHECK-NEXT: [[TMP14:%.*]] = or <4 x i16> [[TMP13]], zeroinitializer |
| 23 | +; CHECK-NEXT: [[TMP15:%.*]] = or <4 x i16> [[TMP14]], zeroinitializer |
| 24 | +; CHECK-NEXT: [[TMP16:%.*]] = icmp ne <4 x i16> [[TMP15]], zeroinitializer |
| 25 | +; CHECK-NEXT: [[TMP17:%.*]] = or <4 x i1> zeroinitializer, [[TMP16]] |
| 26 | +; CHECK-NEXT: [[TMP18:%.*]] = or <4 x i1> [[TMP12]], [[TMP17]] |
| 27 | +; CHECK-NEXT: [[TMP19:%.*]] = extractelement <4 x i1> [[TMP18]], i32 2 |
| 28 | +; CHECK-NEXT: [[TMP20:%.*]] = extractelement <4 x i1> [[TMP18]], i32 3 |
| 29 | +; CHECK-NEXT: [[TMP21:%.*]] = or i1 [[TMP20]], [[TMP19]] |
| 30 | +; CHECK-NEXT: [[TMP22:%.*]] = extractelement <4 x i1> [[TMP18]], i32 1 |
| 31 | +; CHECK-NEXT: [[TMP23:%.*]] = or i1 false, [[TMP22]] |
| 32 | +; CHECK-NEXT: [[TMP24:%.*]] = freeze <4 x i1> [[TMP18]] |
| 33 | +; CHECK-NEXT: [[TMP25:%.*]] = call i1 @llvm.vector.reduce.or.v4i1(<4 x i1> [[TMP24]]) |
| 34 | +; CHECK-NEXT: [[SPEC_SELECT31:%.*]] = select i1 [[TMP25]], i32 0, i32 0 |
| 35 | +; CHECK-NEXT: [[TMP26:%.*]] = extractelement <4 x i1> [[TMP18]], i32 0 |
| 36 | +; CHECK-NEXT: [[TMP27:%.*]] = or i1 false, [[TMP26]] |
| 37 | +; CHECK-NEXT: store i32 [[SPEC_SELECT31]], ptr null, align 4 |
| 38 | +; CHECK-NEXT: ret i16 0 |
| 39 | +; |
| 40 | +entry: |
| 41 | + %0 = and i16 %v2, %v1 |
| 42 | + %1 = and i16 %0, 0 |
| 43 | + %2 = and i16 %1, 0 |
| 44 | + %3 = icmp ne i16 %2, 0 |
| 45 | + %.not5.not = or i1 %3, false |
| 46 | + %inc.1.1.i82.i.i = or i16 %v2, 0 |
| 47 | + %inc.143.1.i98.i.i = or i16 0, 0 |
| 48 | + %4 = or i16 %inc.1.1.i82.i.i, 0 |
| 49 | + %5 = or i16 %4, 0 |
| 50 | + %6 = or i16 %5, 0 |
| 51 | + %7 = icmp ne i16 %6, 0 |
| 52 | + %.not7.not = or i1 false, %7 |
| 53 | + %8 = or i1 %.not5.not, %.not7.not |
| 54 | + %9 = and i16 0, %inc.143.1.i98.i.i |
| 55 | + %10 = and i16 %9, 0 |
| 56 | + %11 = icmp ne i16 %10, 0 |
| 57 | + %.not5.not.1 = or i1 %11, false |
| 58 | + %inc.143.i76.i.i.1 = or i16 %v1, 0 |
| 59 | + %inc.143.1.i98.i.i.1 = or i16 0, 0 |
| 60 | + %12 = or i16 0, %inc.143.i76.i.i.1 |
| 61 | + %13 = or i16 %12, 0 |
| 62 | + %14 = or i16 %13, 0 |
| 63 | + %15 = icmp ne i16 %14, 0 |
| 64 | + %.not7.not.1 = or i1 false, %15 |
| 65 | + %16 = or i1 %.not5.not.1, %.not7.not.1 |
| 66 | + %17 = or i1 %8, %16 |
| 67 | + %18 = and i16 0, %inc.143.1.i98.i.i.1 |
| 68 | + %19 = and i16 %18, 0 |
| 69 | + %20 = icmp ne i16 %19, 0 |
| 70 | + %.not5.not.2 = or i1 %20, false |
| 71 | + %inc.143.i76.i.i.2 = or i16 %v1, 0 |
| 72 | + %inc.143.1.i98.i.i.2 = or i16 0, 0 |
| 73 | + %21 = or i16 0, %inc.143.i76.i.i.2 |
| 74 | + %22 = or i16 %21, 0 |
| 75 | + %23 = or i16 %22, 0 |
| 76 | + %24 = icmp ne i16 %23, 0 |
| 77 | + %.not7.not.2 = or i1 false, %24 |
| 78 | + %25 = or i1 %.not5.not.2, %.not7.not.2 |
| 79 | + %26 = or i1 false, %25 |
| 80 | + %27 = and i16 0, %inc.143.1.i98.i.i.2 |
| 81 | + %28 = and i16 %27, 0 |
| 82 | + %29 = icmp ne i16 %28, 0 |
| 83 | + %.not5.not.3 = or i1 %29, false |
| 84 | + %inc.143.i76.i.i.3 = or i16 %v1, 0 |
| 85 | + %30 = or i16 0, %inc.143.i76.i.i.3 |
| 86 | + %31 = or i16 %30, 0 |
| 87 | + %32 = or i16 %31, 0 |
| 88 | + %33 = icmp ne i16 %32, 0 |
| 89 | + %.not7.not.3 = or i1 false, %33 |
| 90 | + %34 = or i1 %.not5.not.3, %.not7.not.3 |
| 91 | + %35 = select i1 %34, i1 true, i1 %25 |
| 92 | + %36 = select i1 %35, i1 true, i1 %16 |
| 93 | + %37 = select i1 %36, i1 true, i1 %8 |
| 94 | + %spec.select31 = select i1 %37, i32 0, i32 0 |
| 95 | + %38 = or i1 false, %34 |
| 96 | + store i32 %spec.select31, ptr null, align 4 |
| 97 | + ret i16 0 |
| 98 | +} |
0 commit comments