|
1 |
| -; RUN: opt -loop-vectorize -mtriple=arm64-apple-iphoneos -S %s | FileCheck %s |
| 1 | +; RUN: opt -loop-vectorize -mtriple=arm64-apple-iphoneos -vectorizer-min-trip-count=8 -S %s | FileCheck %s |
2 | 2 |
|
3 | 3 | ; Tests for loops with large numbers of runtime checks. Check that loops are
|
4 | 4 | ; vectorized, if the loop trip counts are large and the impact of the runtime
|
@@ -50,7 +50,7 @@ loop: ; preds = %bb54, %bb37
|
50 | 50 | %gep.4 = getelementptr inbounds i16, i16* %ptr.4, i64 %iv
|
51 | 51 | store i16 %trunc.2, i16* %gep.4, align 2
|
52 | 52 | %iv.next = add nuw nsw i64 %iv, 1
|
53 |
| - %cmp = icmp ult i64 %iv, 50 |
| 53 | + %cmp = icmp ult i64 %iv, 10 |
54 | 54 | br i1 %cmp, label %loop, label %exit
|
55 | 55 |
|
56 | 56 | exit:
|
@@ -109,3 +109,55 @@ loop: ; preds = %bb54, %bb37
|
109 | 109 | exit:
|
110 | 110 | ret void
|
111 | 111 | }
|
| 112 | + |
| 113 | +define void @test_tc_unknown(i16* %ptr.1, i16* %ptr.2, i16* %ptr.3, i16* %ptr.4, i64 %off.1, i64 %off.2, i64 %N) { |
| 114 | +; CHECK-LABEL: define void @test_tc_unknown |
| 115 | +; CHECK-NOT: vector.memcheck |
| 116 | +; CHECK-NOT: vector.body |
| 117 | +; |
| 118 | +entry: |
| 119 | + br label %loop |
| 120 | + |
| 121 | +loop: ; preds = %bb54, %bb37 |
| 122 | + %iv = phi i64 [ 0, %entry ], [ %iv.next, %loop ] |
| 123 | + %gep.1 = getelementptr inbounds i16, i16* %ptr.1, i64 %iv |
| 124 | + %lv.1 = load i16, i16* %gep.1, align 2 |
| 125 | + %ext.1 = sext i16 %lv.1 to i32 |
| 126 | + %gep.2 = getelementptr inbounds i16, i16* %ptr.2, i64 %iv |
| 127 | + %lv.2 = load i16, i16* %gep.2, align 2 |
| 128 | + %ext.2 = sext i16 %lv.2 to i32 |
| 129 | + %gep.off.1 = getelementptr inbounds i16, i16* %gep.2, i64 %off.1 |
| 130 | + %lv.3 = load i16, i16* %gep.off.1, align 2 |
| 131 | + %ext.3 = sext i16 %lv.3 to i32 |
| 132 | + %gep.off.2 = getelementptr inbounds i16, i16* %gep.2, i64 %off.2 |
| 133 | + %lv.4 = load i16, i16* %gep.off.2, align 2 |
| 134 | + %ext.4 = sext i16 %lv.4 to i32 |
| 135 | + %tmp62 = mul nsw i32 %ext.2, 11 |
| 136 | + %tmp66 = mul nsw i32 %ext.3, -4 |
| 137 | + %tmp70 = add nsw i32 %tmp62, 4 |
| 138 | + %tmp71 = add nsw i32 %tmp70, %tmp66 |
| 139 | + %tmp72 = add nsw i32 %tmp71, %ext.4 |
| 140 | + %tmp73 = lshr i32 %tmp72, 3 |
| 141 | + %tmp74 = add nsw i32 %tmp73, %ext.1 |
| 142 | + %tmp75 = lshr i32 %tmp74, 1 |
| 143 | + %tmp76 = mul nsw i32 %ext.2, 5 |
| 144 | + %tmp77 = shl nsw i32 %ext.3, 2 |
| 145 | + %tmp78 = add nsw i32 %tmp76, 4 |
| 146 | + %tmp79 = add nsw i32 %tmp78, %tmp77 |
| 147 | + %tmp80 = sub nsw i32 %tmp79, %ext.4 |
| 148 | + %tmp81 = lshr i32 %tmp80, 3 |
| 149 | + %tmp82 = sub nsw i32 %tmp81, %ext.1 |
| 150 | + %tmp83 = lshr i32 %tmp82, 1 |
| 151 | + %trunc.1 = trunc i32 %tmp75 to i16 |
| 152 | + %gep.3 = getelementptr inbounds i16, i16* %ptr.3, i64 %iv |
| 153 | + store i16 %trunc.1, i16* %gep.3, align 2 |
| 154 | + %trunc.2 = trunc i32 %tmp83 to i16 |
| 155 | + %gep.4 = getelementptr inbounds i16, i16* %ptr.4, i64 %iv |
| 156 | + store i16 %trunc.2, i16* %gep.4, align 2 |
| 157 | + %iv.next = add nuw nsw i64 %iv, 1 |
| 158 | + %cmp = icmp ult i64 %iv, %N |
| 159 | + br i1 %cmp, label %loop, label %exit |
| 160 | + |
| 161 | +exit: |
| 162 | + ret void |
| 163 | +} |
0 commit comments