|
| 1 | +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 4 |
| 2 | +; RUN: opt -S --passes=slp-vectorizer -mtriple=riscv64-unknown-linux -mattr=+v < %s | FileCheck %s |
| 3 | + |
| 4 | +define void @test(ptr %p, i16 %load794) { |
| 5 | +; CHECK-LABEL: define void @test( |
| 6 | +; CHECK-SAME: ptr [[P:%.*]], i16 [[LOAD794:%.*]]) #[[ATTR0:[0-9]+]] { |
| 7 | +; CHECK-NEXT: [[ZEXT795:%.*]] = zext i16 [[LOAD794]] to i32 |
| 8 | +; CHECK-NEXT: [[GEP799:%.*]] = getelementptr inbounds i8, ptr [[P]], i64 16 |
| 9 | +; CHECK-NEXT: [[TMP1:%.*]] = load <2 x i16>, ptr [[P]], align 2 |
| 10 | +; CHECK-NEXT: [[TMP2:%.*]] = load <2 x i16>, ptr [[GEP799]], align 2 |
| 11 | +; CHECK-NEXT: [[TMP3:%.*]] = sub <2 x i16> [[TMP2]], [[TMP1]] |
| 12 | +; CHECK-NEXT: [[TMP4:%.*]] = add <2 x i16> [[TMP3]], <i16 3329, i16 3329> |
| 13 | +; CHECK-NEXT: [[TMP5:%.*]] = insertelement <2 x i32> poison, i32 [[ZEXT795]], i32 0 |
| 14 | +; CHECK-NEXT: [[TMP6:%.*]] = shufflevector <2 x i32> [[TMP5]], <2 x i32> poison, <2 x i32> zeroinitializer |
| 15 | +; CHECK-NEXT: [[TMP7:%.*]] = trunc <2 x i32> [[TMP6]] to <2 x i16> |
| 16 | +; CHECK-NEXT: [[TMP8:%.*]] = mul <2 x i16> [[TMP4]], [[TMP7]] |
| 17 | +; CHECK-NEXT: [[TMP9:%.*]] = zext <2 x i16> [[TMP8]] to <2 x i64> |
| 18 | +; CHECK-NEXT: [[TMP10:%.*]] = mul nuw nsw <2 x i64> [[TMP9]], <i64 5039, i64 5039> |
| 19 | +; CHECK-NEXT: [[TMP11:%.*]] = lshr <2 x i64> [[TMP10]], <i64 24, i64 24> |
| 20 | +; CHECK-NEXT: [[TMP12:%.*]] = trunc <2 x i64> [[TMP11]] to <2 x i16> |
| 21 | +; CHECK-NEXT: [[TMP13:%.*]] = mul <2 x i16> [[TMP12]], <i16 -3329, i16 -3329> |
| 22 | +; CHECK-NEXT: [[TMP14:%.*]] = add <2 x i16> [[TMP13]], [[TMP8]] |
| 23 | +; CHECK-NEXT: [[TMP15:%.*]] = add <2 x i16> [[TMP14]], <i16 -3329, i16 -3329> |
| 24 | +; CHECK-NEXT: [[TMP16:%.*]] = icmp slt <2 x i16> [[TMP15]], zeroinitializer |
| 25 | +; CHECK-NEXT: [[TMP17:%.*]] = select <2 x i1> [[TMP16]], <2 x i16> [[TMP14]], <2 x i16> zeroinitializer |
| 26 | +; CHECK-NEXT: [[TMP18:%.*]] = call <2 x i16> @llvm.smax.v2i16(<2 x i16> [[TMP15]], <2 x i16> zeroinitializer) |
| 27 | +; CHECK-NEXT: [[TMP19:%.*]] = or <2 x i16> [[TMP17]], [[TMP18]] |
| 28 | +; CHECK-NEXT: store <2 x i16> [[TMP19]], ptr [[P]], align 2 |
| 29 | +; CHECK-NEXT: ret void |
| 30 | +; |
| 31 | + %zext795 = zext i16 %load794 to i32 |
| 32 | + %load798 = load i16, ptr %p, align 2 |
| 33 | + %gep799 = getelementptr inbounds i8, ptr %p, i64 16 |
| 34 | + %load800 = load i16, ptr %gep799, align 2 |
| 35 | + %zext801 = zext i16 %load798 to i32 |
| 36 | + %zext802 = zext i16 %load800 to i32 |
| 37 | + %sub809 = sub nsw i32 %zext802, %zext801 |
| 38 | + %add810 = add nsw i32 %sub809, 3329 |
| 39 | + %mul811 = mul i32 %add810, %zext795 |
| 40 | + %zext812 = zext i32 %mul811 to i64 |
| 41 | + %mul813 = mul nuw nsw i64 %zext812, 5039 |
| 42 | + %lshr814 = lshr i64 %mul813, 24 |
| 43 | + %trunc815 = trunc nuw nsw i64 %lshr814 to i32 |
| 44 | + %mul816 = mul i32 %trunc815, 62207 |
| 45 | + %add817 = add i32 %mul816, %mul811 |
| 46 | + %trunc818 = trunc i32 %add817 to i16 |
| 47 | + %add819 = add i16 %trunc818, -3329 |
| 48 | + %icmp820 = icmp slt i16 %add819, 0 |
| 49 | + %select821 = select i1 %icmp820, i16 %trunc818, i16 0 |
| 50 | + %call822 = call i16 @llvm.smax.i16(i16 %add819, i16 0) |
| 51 | + %or823 = or i16 %select821, %call822 |
| 52 | + store i16 %or823, ptr %p, align 2 |
| 53 | + %gep826 = getelementptr inbounds i8, ptr %p, i64 2 |
| 54 | + %load827 = load i16, ptr %gep826, align 2 |
| 55 | + %gep828 = getelementptr inbounds i8, ptr %p, i64 18 |
| 56 | + %load829 = load i16, ptr %gep828, align 2 |
| 57 | + %zext830 = zext i16 %load827 to i32 |
| 58 | + %zext831 = zext i16 %load829 to i32 |
| 59 | + %sub838 = sub nsw i32 %zext831, %zext830 |
| 60 | + %add839 = add nsw i32 %sub838, 3329 |
| 61 | + %mul840 = mul i32 %add839, %zext795 |
| 62 | + %zext841 = zext i32 %mul840 to i64 |
| 63 | + %mul842 = mul nuw nsw i64 %zext841, 5039 |
| 64 | + %lshr843 = lshr i64 %mul842, 24 |
| 65 | + %trunc844 = trunc nuw nsw i64 %lshr843 to i32 |
| 66 | + %mul845 = mul i32 %trunc844, 62207 |
| 67 | + %add846 = add i32 %mul845, %mul840 |
| 68 | + %trunc847 = trunc i32 %add846 to i16 |
| 69 | + %add848 = add i16 %trunc847, -3329 |
| 70 | + %icmp849 = icmp slt i16 %add848, 0 |
| 71 | + %select850 = select i1 %icmp849, i16 %trunc847, i16 0 |
| 72 | + %call851 = call i16 @llvm.smax.i16(i16 %add848, i16 0) |
| 73 | + %or852 = or i16 %select850, %call851 |
| 74 | + store i16 %or852, ptr %gep826, align 2 |
| 75 | + ret void |
| 76 | +} |
| 77 | + |
0 commit comments