|
| 1 | +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5 |
| 2 | +; RUN: opt -S --passes=slp-vectorizer -mtriple=x86_64-unknown-linux-gnu < %s | FileCheck %s |
| 3 | + |
| 4 | +define i1 @test(i64 %v1, ptr %v2, i32 %v3, i1 %v4) { |
| 5 | +; CHECK-LABEL: define i1 @test( |
| 6 | +; CHECK-SAME: i64 [[V1:%.*]], ptr [[V2:%.*]], i32 [[V3:%.*]], i1 [[V4:%.*]]) { |
| 7 | +; CHECK-NEXT: [[NEWFUNCROOT:.*:]] |
| 8 | +; CHECK-NEXT: [[TMP0:%.*]] = insertelement <2 x i64> poison, i64 [[V1]], i32 0 |
| 9 | +; CHECK-NEXT: [[TMP1:%.*]] = shufflevector <2 x i64> [[TMP0]], <2 x i64> poison, <2 x i32> zeroinitializer |
| 10 | +; CHECK-NEXT: [[TMP2:%.*]] = lshr <2 x i64> [[TMP1]], <i64 32, i64 40> |
| 11 | +; CHECK-NEXT: [[TMP3:%.*]] = trunc <2 x i64> [[TMP2]] to <2 x i8> |
| 12 | +; CHECK-NEXT: [[TMP4:%.*]] = and <2 x i8> [[TMP3]], <i8 1, i8 -1> |
| 13 | +; CHECK-NEXT: [[TMP5:%.*]] = zext <2 x i8> [[TMP4]] to <2 x i32> |
| 14 | +; CHECK-NEXT: [[TMP6:%.*]] = icmp eq <2 x i32> [[TMP5]], zeroinitializer |
| 15 | +; CHECK-NEXT: [[TMP7:%.*]] = insertelement <4 x i32> poison, i32 [[V3]], i32 0 |
| 16 | +; CHECK-NEXT: [[TMP8:%.*]] = shufflevector <4 x i32> [[TMP7]], <4 x i32> poison, <4 x i32> <i32 poison, i32 poison, i32 0, i32 0> |
| 17 | +; CHECK-NEXT: [[TMP9:%.*]] = sext <2 x i8> [[TMP4]] to <2 x i32> |
| 18 | +; CHECK-NEXT: [[TMP10:%.*]] = call <4 x i32> @llvm.vector.insert.v4i32.v2i32(<4 x i32> [[TMP8]], <2 x i32> [[TMP9]], i64 0) |
| 19 | +; CHECK-NEXT: [[TMP11:%.*]] = uitofp <4 x i32> [[TMP10]] to <4 x float> |
| 20 | +; CHECK-NEXT: [[TMP12:%.*]] = fdiv <4 x float> zeroinitializer, [[TMP11]] |
| 21 | +; CHECK-NEXT: [[TMP13:%.*]] = insertelement <4 x i1> poison, i1 [[V4]], i32 0 |
| 22 | +; CHECK-NEXT: [[TMP14:%.*]] = shufflevector <4 x i1> [[TMP13]], <4 x i1> poison, <4 x i32> <i32 poison, i32 poison, i32 0, i32 0> |
| 23 | +; CHECK-NEXT: [[TMP15:%.*]] = call <4 x i1> @llvm.vector.insert.v4i1.v2i1(<4 x i1> [[TMP14]], <2 x i1> [[TMP6]], i64 0) |
| 24 | +; CHECK-NEXT: [[TMP16:%.*]] = select <4 x i1> [[TMP15]], <4 x float> zeroinitializer, <4 x float> [[TMP12]] |
| 25 | +; CHECK-NEXT: [[TMP17:%.*]] = extractelement <4 x float> [[TMP16]], i32 3 |
| 26 | +; CHECK-NEXT: [[CONV_I_I1743_3:%.*]] = fptoui float [[TMP17]] to i32 |
| 27 | +; CHECK-NEXT: [[TMP18:%.*]] = icmp ne i32 [[CONV_I_I1743_3]], 0 |
| 28 | +; CHECK-NEXT: [[TMP19:%.*]] = bitcast <4 x float> [[TMP16]] to <4 x i32> |
| 29 | +; CHECK-NEXT: [[TMP20:%.*]] = icmp ult <4 x i32> [[TMP19]], <i32 1333788672, i32 1333788672, i32 1333788672, i32 1333788672> |
| 30 | +; CHECK-NEXT: [[TMP21:%.*]] = extractelement <4 x i1> [[TMP20]], i32 3 |
| 31 | +; CHECK-NEXT: [[NARROW:%.*]] = select i1 [[TMP21]], i1 [[TMP18]], i1 false |
| 32 | +; CHECK-NEXT: [[TMP22:%.*]] = extractelement <4 x float> [[TMP16]], i32 2 |
| 33 | +; CHECK-NEXT: [[CONV_I_I1743_2:%.*]] = fptoui float [[TMP22]] to i32 |
| 34 | +; CHECK-NEXT: [[TMP23:%.*]] = extractelement <4 x i1> [[TMP20]], i32 2 |
| 35 | +; CHECK-NEXT: [[NARROW1:%.*]] = select i1 [[TMP23]], i32 [[CONV_I_I1743_2]], i32 0 |
| 36 | +; CHECK-NEXT: [[TMP24:%.*]] = zext i1 [[NARROW]] to i32 |
| 37 | +; CHECK-NEXT: [[TMP25:%.*]] = or i32 [[NARROW1]], [[TMP24]] |
| 38 | +; CHECK-NEXT: [[TMP26:%.*]] = extractelement <4 x float> [[TMP16]], i32 1 |
| 39 | +; CHECK-NEXT: [[CONV_I_I1743_1:%.*]] = fptoui float [[TMP26]] to i32 |
| 40 | +; CHECK-NEXT: [[TMP27:%.*]] = extractelement <4 x i1> [[TMP20]], i32 1 |
| 41 | +; CHECK-NEXT: [[NARROW2:%.*]] = select i1 [[TMP27]], i32 [[CONV_I_I1743_1]], i32 0 |
| 42 | +; CHECK-NEXT: [[RV3:%.*]] = or i32 [[TMP25]], [[NARROW2]] |
| 43 | +; CHECK-NEXT: [[TMP28:%.*]] = extractelement <4 x float> [[TMP16]], i32 0 |
| 44 | +; CHECK-NEXT: [[CONV_I_I1743:%.*]] = fptoui float [[TMP28]] to i32 |
| 45 | +; CHECK-NEXT: [[TMP29:%.*]] = extractelement <4 x i1> [[TMP20]], i32 0 |
| 46 | +; CHECK-NEXT: [[NARROW4:%.*]] = select i1 [[TMP29]], i32 [[CONV_I_I1743]], i32 0 |
| 47 | +; CHECK-NEXT: [[RT5:%.*]] = or i32 [[RV3]], [[NARROW4]] |
| 48 | +; CHECK-NEXT: [[RT:%.*]] = zext i32 [[RT5]] to i64 |
| 49 | +; CHECK-NEXT: store i64 [[RT]], ptr [[V2]], align 1 |
| 50 | +; CHECK-NEXT: ret i1 false |
| 51 | +; |
| 52 | +newFuncRoot: |
| 53 | + %conv.i147.i1756.3 = uitofp i32 %v3 to float |
| 54 | + %div.i.i.i1749.3 = fdiv float 0.000000e+00, %conv.i147.i1756.3 |
| 55 | + %cond.i.i.i1751.3 = select i1 %v4, float 0.000000e+00, float %div.i.i.i1749.3 |
| 56 | + %conv.i147.i1756.2 = uitofp i32 %v3 to float |
| 57 | + %div.i.i.i1749.2 = fdiv float 0.000000e+00, %conv.i147.i1756.2 |
| 58 | + %cond.i.i.i1751.2 = select i1 %v4, float 0.000000e+00, float %div.i.i.i1749.2 |
| 59 | + %0 = lshr i64 %v1, 40 |
| 60 | + %1 = trunc i64 %0 to i32 |
| 61 | + %tt2 = and i32 %1, 255 |
| 62 | + %cmp1.i.i.i1746.1 = icmp eq i32 %tt2, 0 |
| 63 | + %conv.i147.i1756.1 = uitofp i32 %tt2 to float |
| 64 | + %div.i.i.i1749.1 = fdiv float 0.000000e+00, %conv.i147.i1756.1 |
| 65 | + %cond.i.i.i1751.1 = select i1 %cmp1.i.i.i1746.1, float 0.000000e+00, float %div.i.i.i1749.1 |
| 66 | + %tt3 = lshr i64 %v1, 32 |
| 67 | + %2 = trunc i64 %tt3 to i32 |
| 68 | + %tt1 = and i32 %2, 1 |
| 69 | + %cmp1.i.i.i1746 = icmp eq i32 %tt1, 0 |
| 70 | + %conv.i147.i1756 = uitofp i32 %tt1 to float |
| 71 | + %div.i.i.i1749 = fdiv float 0.000000e+00, %conv.i147.i1756 |
| 72 | + %cond.i.i.i1751 = select i1 %cmp1.i.i.i1746, float 0.000000e+00, float %div.i.i.i1749 |
| 73 | + %3 = bitcast float %cond.i.i.i1751.3 to i32 |
| 74 | + %cmp.i99.i1736.3 = icmp ult i32 %3, 1333788672 |
| 75 | + %conv.i.i1743.3 = fptoui float %cond.i.i.i1751.3 to i32 |
| 76 | + %4 = icmp ne i32 %conv.i.i1743.3, 0 |
| 77 | + %narrow = select i1 %cmp.i99.i1736.3, i1 %4, i1 false |
| 78 | + %5 = bitcast float %cond.i.i.i1751.2 to i32 |
| 79 | + %cmp.i99.i1736.2 = icmp ult i32 %5, 1333788672 |
| 80 | + %conv.i.i1743.2 = fptoui float %cond.i.i.i1751.2 to i32 |
| 81 | + %narrow1 = select i1 %cmp.i99.i1736.2, i32 %conv.i.i1743.2, i32 0 |
| 82 | + %6 = zext i1 %narrow to i32 |
| 83 | + %7 = or i32 %narrow1, %6 |
| 84 | + %8 = bitcast float %cond.i.i.i1751.1 to i32 |
| 85 | + %cmp.i99.i1736.1 = icmp ult i32 %8, 1333788672 |
| 86 | + %conv.i.i1743.1 = fptoui float %cond.i.i.i1751.1 to i32 |
| 87 | + %narrow2 = select i1 %cmp.i99.i1736.1, i32 %conv.i.i1743.1, i32 0 |
| 88 | + %rv3 = or i32 %7, %narrow2 |
| 89 | + %9 = bitcast float %cond.i.i.i1751 to i32 |
| 90 | + %cmp.i99.i1736 = icmp ult i32 %9, 1333788672 |
| 91 | + %conv.i.i1743 = fptoui float %cond.i.i.i1751 to i32 |
| 92 | + %narrow4 = select i1 %cmp.i99.i1736, i32 %conv.i.i1743, i32 0 |
| 93 | + %rt5 = or i32 %rv3, %narrow4 |
| 94 | + %rt = zext i32 %rt5 to i64 |
| 95 | + store i64 %rt, ptr %v2, align 1 |
| 96 | + ret i1 false |
| 97 | +} |
0 commit comments