|
| 1 | +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5 |
1 | 2 | ; RUN: opt -passes=loop-vectorize -force-vector-interleave=1 -force-vector-width=2 -S < %s | FileCheck %s --check-prefix=CHECK-VF2IC1
|
2 | 3 | ; RUN: opt -passes=loop-vectorize -force-vector-interleave=2 -force-vector-width=1 -S < %s | FileCheck %s --check-prefix=CHECK-VF1IC2
|
3 | 4 |
|
4 | 5 | define i32 @pred_select_const_i32_from_icmp(ptr noalias nocapture readonly %src1, ptr noalias nocapture readonly %src2, i64 %n) {
|
5 |
| -; CHECK-VF2IC1-LABEL: @pred_select_const_i32_from_icmp( |
6 |
| -; CHECK-VF2IC1: vector.body: |
7 |
| -; CHECK-VF2IC1: [[VEC_PHI:%.*]] = phi <2 x i1> [ zeroinitializer, %vector.ph ], [ [[PREDPHI:%.*]], %pred.load.continue2 ] |
8 |
| -; CHECK-VF2IC1: [[WIDE_LOAD:%.*]] = load <2 x i32>, ptr {{%.*}}, align 4 |
| 6 | +; CHECK-VF2IC1-LABEL: define i32 @pred_select_const_i32_from_icmp( |
| 7 | +; CHECK-VF2IC1-SAME: ptr noalias readonly captures(none) [[SRC1:%.*]], ptr noalias readonly captures(none) [[SRC2:%.*]], i64 [[N:%.*]]) { |
| 8 | +; CHECK-VF2IC1-NEXT: [[ENTRY:.*]]: |
| 9 | +; CHECK-VF2IC1-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 2 |
| 10 | +; CHECK-VF2IC1-NEXT: br i1 [[MIN_ITERS_CHECK]], label %[[SCALAR_PH:.*]], label %[[VECTOR_PH:.*]] |
| 11 | +; CHECK-VF2IC1: [[VECTOR_PH]]: |
| 12 | +; CHECK-VF2IC1-NEXT: [[N_MOD_VF:%.*]] = urem i64 [[N]], 2 |
| 13 | +; CHECK-VF2IC1-NEXT: [[N_VEC:%.*]] = sub i64 [[N]], [[N_MOD_VF]] |
| 14 | +; CHECK-VF2IC1-NEXT: br label %[[VECTOR_BODY:.*]] |
| 15 | +; CHECK-VF2IC1: [[VECTOR_BODY]]: |
| 16 | +; CHECK-VF2IC1-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[PRED_LOAD_CONTINUE2:.*]] ] |
| 17 | +; CHECK-VF2IC1-NEXT: [[VEC_PHI:%.*]] = phi <2 x i1> [ zeroinitializer, %[[VECTOR_PH]] ], [ [[PREDPHI:%.*]], %[[PRED_LOAD_CONTINUE2]] ] |
| 18 | +; CHECK-VF2IC1-NEXT: [[TMP0:%.*]] = add i64 [[INDEX]], 0 |
| 19 | +; CHECK-VF2IC1-NEXT: [[TMP1:%.*]] = getelementptr inbounds i32, ptr [[SRC1]], i64 [[TMP0]] |
| 20 | +; CHECK-VF2IC1-NEXT: [[TMP2:%.*]] = getelementptr inbounds i32, ptr [[TMP1]], i32 0 |
| 21 | +; CHECK-VF2IC1-NEXT: [[WIDE_LOAD:%.*]] = load <2 x i32>, ptr [[TMP2]], align 4 |
9 | 22 | ; CHECK-VF2IC1-NEXT: [[TMP4:%.*]] = icmp sgt <2 x i32> [[WIDE_LOAD]], splat (i32 35)
|
10 | 23 | ; CHECK-VF2IC1-NEXT: [[TMP5:%.*]] = extractelement <2 x i1> [[TMP4]], i32 0
|
11 |
| -; CHECK-VF2IC1-NEXT: br i1 [[TMP5]], label %pred.load.if, label %pred.load.continue |
12 |
| -; CHECK-VF2IC1: pred.load.if: |
13 |
| -; CHECK-VF2IC1-NEXT: [[TMP6:%.*]] = getelementptr inbounds i32, ptr [[SRC2:%.*]], i64 {{%.*}} |
| 24 | +; CHECK-VF2IC1-NEXT: br i1 [[TMP5]], label %[[PRED_LOAD_IF:.*]], label %[[PRED_LOAD_CONTINUE:.*]] |
| 25 | +; CHECK-VF2IC1: [[PRED_LOAD_IF]]: |
| 26 | +; CHECK-VF2IC1-NEXT: [[TMP6:%.*]] = getelementptr inbounds i32, ptr [[SRC2]], i64 [[TMP0]] |
14 | 27 | ; CHECK-VF2IC1-NEXT: [[TMP7:%.*]] = load i32, ptr [[TMP6]], align 4
|
15 | 28 | ; CHECK-VF2IC1-NEXT: [[TMP8:%.*]] = insertelement <2 x i32> poison, i32 [[TMP7]], i32 0
|
16 |
| -; CHECK-VF2IC1-NEXT: br label %pred.load.continue |
17 |
| -; CHECK-VF2IC1: pred.load.continue: |
18 |
| -; CHECK-VF2IC1-NEXT: [[TMP9:%.*]] = phi <2 x i32> [ poison, %vector.body ], [ [[TMP8]], %pred.load.if ] |
| 29 | +; CHECK-VF2IC1-NEXT: br label %[[PRED_LOAD_CONTINUE]] |
| 30 | +; CHECK-VF2IC1: [[PRED_LOAD_CONTINUE]]: |
| 31 | +; CHECK-VF2IC1-NEXT: [[TMP9:%.*]] = phi <2 x i32> [ poison, %[[VECTOR_BODY]] ], [ [[TMP8]], %[[PRED_LOAD_IF]] ] |
19 | 32 | ; CHECK-VF2IC1-NEXT: [[TMP10:%.*]] = extractelement <2 x i1> [[TMP4]], i32 1
|
20 |
| -; CHECK-VF2IC1-NEXT: br i1 [[TMP10]], label %pred.load.if1, label %pred.load.continue2 |
21 |
| -; CHECK-VF2IC1: pred.load.if1: |
22 |
| -; CHECK-VF2IC1: [[TMP12:%.*]] = getelementptr inbounds i32, ptr [[SRC2]], i64 {{%.*}} |
| 33 | +; CHECK-VF2IC1-NEXT: br i1 [[TMP10]], label %[[PRED_LOAD_IF1:.*]], label %[[PRED_LOAD_CONTINUE2]] |
| 34 | +; CHECK-VF2IC1: [[PRED_LOAD_IF1]]: |
| 35 | +; CHECK-VF2IC1-NEXT: [[TMP11:%.*]] = add i64 [[INDEX]], 1 |
| 36 | +; CHECK-VF2IC1-NEXT: [[TMP12:%.*]] = getelementptr inbounds i32, ptr [[SRC2]], i64 [[TMP11]] |
23 | 37 | ; CHECK-VF2IC1-NEXT: [[TMP13:%.*]] = load i32, ptr [[TMP12]], align 4
|
24 | 38 | ; CHECK-VF2IC1-NEXT: [[TMP14:%.*]] = insertelement <2 x i32> [[TMP9]], i32 [[TMP13]], i32 1
|
25 |
| -; CHECK-VF2IC1-NEXT: br label %pred.load.continue2 |
26 |
| -; CHECK-VF2IC1: pred.load.continue2: |
27 |
| -; CHECK-VF2IC1-NEXT: [[TMP15:%.*]] = phi <2 x i32> [ [[TMP9]], %pred.load.continue ], [ [[TMP14]], %pred.load.if1 ] |
| 39 | +; CHECK-VF2IC1-NEXT: br label %[[PRED_LOAD_CONTINUE2]] |
| 40 | +; CHECK-VF2IC1: [[PRED_LOAD_CONTINUE2]]: |
| 41 | +; CHECK-VF2IC1-NEXT: [[TMP15:%.*]] = phi <2 x i32> [ [[TMP9]], %[[PRED_LOAD_CONTINUE]] ], [ [[TMP14]], %[[PRED_LOAD_IF1]] ] |
28 | 42 | ; CHECK-VF2IC1-NEXT: [[TMP16:%.*]] = icmp eq <2 x i32> [[TMP15]], splat (i32 2)
|
29 | 43 | ; CHECK-VF2IC1-NEXT: [[TMP17:%.*]] = or <2 x i1> [[VEC_PHI]], [[TMP16]]
|
30 | 44 | ; CHECK-VF2IC1-NEXT: [[PREDPHI]] = select <2 x i1> [[TMP4]], <2 x i1> [[TMP17]], <2 x i1> [[VEC_PHI]]
|
31 |
| -; CHECK-VF2IC1: br i1 {{%.*}}, label %middle.block, label %vector.body |
32 |
| -; CHECK-VF2IC1: middle.block: |
| 45 | +; CHECK-VF2IC1-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 2 |
| 46 | +; CHECK-VF2IC1-NEXT: [[TMP18:%.*]] = icmp eq i64 [[INDEX_NEXT]], [[N_VEC]] |
| 47 | +; CHECK-VF2IC1-NEXT: br i1 [[TMP18]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP0:![0-9]+]] |
| 48 | +; CHECK-VF2IC1: [[MIDDLE_BLOCK]]: |
33 | 49 | ; CHECK-VF2IC1-NEXT: [[TMP20:%.*]] = call i1 @llvm.vector.reduce.or.v2i1(<2 x i1> [[PREDPHI]])
|
34 | 50 | ; CHECK-VF2IC1-NEXT: [[FR_TMP20:%.*]] = freeze i1 [[TMP20]]
|
35 | 51 | ; CHECK-VF2IC1-NEXT: [[RDX_SELECT:%.*]] = select i1 [[FR_TMP20]], i32 1, i32 0
|
36 |
| -; CHECK-VF2IC1-NEXT: %cmp.n = icmp eq i64 %n, %n.vec |
37 |
| -; CHECK-VF2IC1: scalar.ph: |
38 |
| -; CHECK-VF2IC1: [[BC_RESUME_VAL:%.*]] = phi i64 [ {{%.*}}, %middle.block ], [ 0, %entry ] |
39 |
| -; CHECK-VF2IC1-NEXT: [[BC_MERGE_RDX:%.*]] = phi i32 [ [[RDX_SELECT]], %middle.block ], [ 0, %entry ] |
40 |
| -; CHECK-VF2IC1-NEXT: br label %for.body |
41 |
| -; CHECK-VF2IC1: for.body: |
42 |
| -; CHECK-VF2IC1: [[R_012:%.*]] = phi i32 [ [[R_1:%.*]], %for.inc ], [ [[BC_MERGE_RDX]], %scalar.ph ] |
43 |
| -; CHECK-VF2IC1: [[TMP21:%.*]] = load i32, ptr {{%.*}}, align 4 |
| 52 | +; CHECK-VF2IC1-NEXT: [[CMP_N:%.*]] = icmp eq i64 [[N]], [[N_VEC]] |
| 53 | +; CHECK-VF2IC1-NEXT: br i1 [[CMP_N]], label %[[FOR_END_LOOPEXIT:.*]], label %[[SCALAR_PH]] |
| 54 | +; CHECK-VF2IC1: [[SCALAR_PH]]: |
| 55 | +; CHECK-VF2IC1-NEXT: [[BC_RESUME_VAL:%.*]] = phi i64 [ [[N_VEC]], %[[MIDDLE_BLOCK]] ], [ 0, %[[ENTRY]] ] |
| 56 | +; CHECK-VF2IC1-NEXT: [[BC_MERGE_RDX:%.*]] = phi i32 [ [[RDX_SELECT]], %[[MIDDLE_BLOCK]] ], [ 0, %[[ENTRY]] ] |
| 57 | +; CHECK-VF2IC1-NEXT: br label %[[FOR_BODY:.*]] |
| 58 | +; CHECK-VF2IC1: [[FOR_BODY]]: |
| 59 | +; CHECK-VF2IC1-NEXT: [[I_013:%.*]] = phi i64 [ [[INC:%.*]], %[[FOR_INC:.*]] ], [ [[BC_RESUME_VAL]], %[[SCALAR_PH]] ] |
| 60 | +; CHECK-VF2IC1-NEXT: [[R_012:%.*]] = phi i32 [ [[R_1:%.*]], %[[FOR_INC]] ], [ [[BC_MERGE_RDX]], %[[SCALAR_PH]] ] |
| 61 | +; CHECK-VF2IC1-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, ptr [[SRC1]], i64 [[I_013]] |
| 62 | +; CHECK-VF2IC1-NEXT: [[TMP21:%.*]] = load i32, ptr [[ARRAYIDX]], align 4 |
44 | 63 | ; CHECK-VF2IC1-NEXT: [[CMP1:%.*]] = icmp sgt i32 [[TMP21]], 35
|
45 |
| -; CHECK-VF2IC1-NEXT: br i1 [[CMP1]], label %if.then, label %for.inc |
46 |
| -; CHECK-VF2IC1: if.then: |
47 |
| -; CHECK-VF2IC1: [[TMP22:%.*]] = load i32, ptr {{%.*}}, align 4 |
| 64 | +; CHECK-VF2IC1-NEXT: br i1 [[CMP1]], label %[[IF_THEN:.*]], label %[[FOR_INC]] |
| 65 | +; CHECK-VF2IC1: [[IF_THEN]]: |
| 66 | +; CHECK-VF2IC1-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds i32, ptr [[SRC2]], i64 [[I_013]] |
| 67 | +; CHECK-VF2IC1-NEXT: [[TMP22:%.*]] = load i32, ptr [[ARRAYIDX2]], align 4 |
48 | 68 | ; CHECK-VF2IC1-NEXT: [[CMP3:%.*]] = icmp eq i32 [[TMP22]], 2
|
49 | 69 | ; CHECK-VF2IC1-NEXT: [[SPEC_SELECT:%.*]] = select i1 [[CMP3]], i32 1, i32 [[R_012]]
|
50 |
| -; CHECK-VF2IC1-NEXT: br label %for.inc |
51 |
| -; CHECK-VF2IC1: for.inc: |
52 |
| -; CHECK-VF2IC1-NEXT: [[R_1]] = phi i32 [ [[R_012]], %for.body ], [ [[SPEC_SELECT]], %if.then ] |
53 |
| -; CHECK-VF2IC1: for.end.loopexit: |
54 |
| -; CHECK-VF2IC1-NEXT: [[R_1_LCSSA:%.*]] = phi i32 [ [[R_1]], %for.inc ], [ [[RDX_SELECT]], %middle.block ] |
| 70 | +; CHECK-VF2IC1-NEXT: br label %[[FOR_INC]] |
| 71 | +; CHECK-VF2IC1: [[FOR_INC]]: |
| 72 | +; CHECK-VF2IC1-NEXT: [[R_1]] = phi i32 [ [[R_012]], %[[FOR_BODY]] ], [ [[SPEC_SELECT]], %[[IF_THEN]] ] |
| 73 | +; CHECK-VF2IC1-NEXT: [[INC]] = add nuw nsw i64 [[I_013]], 1 |
| 74 | +; CHECK-VF2IC1-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[INC]], [[N]] |
| 75 | +; CHECK-VF2IC1-NEXT: br i1 [[EXITCOND_NOT]], label %[[FOR_END_LOOPEXIT]], label %[[FOR_BODY]], !llvm.loop [[LOOP3:![0-9]+]] |
| 76 | +; CHECK-VF2IC1: [[FOR_END_LOOPEXIT]]: |
| 77 | +; CHECK-VF2IC1-NEXT: [[R_1_LCSSA:%.*]] = phi i32 [ [[R_1]], %[[FOR_INC]] ], [ [[RDX_SELECT]], %[[MIDDLE_BLOCK]] ] |
55 | 78 | ; CHECK-VF2IC1-NEXT: ret i32 [[R_1_LCSSA]]
|
56 | 79 | ;
|
57 |
| -; CHECK-VF1IC2-LABEL: @pred_select_const_i32_from_icmp( |
58 |
| -; CHECK-VF1IC2: vector.body: |
59 |
| -; CHECK-VF1IC2: [[VEC_PHI:%.*]] = phi i1 [ false, %vector.ph ], [ [[PREDPHI:%.*]], %pred.load.continue3 ] |
60 |
| -; CHECK-VF1IC2-NEXT: [[VEC_PHI2:%.*]] = phi i1 [ false, %vector.ph ], [ [[PREDPHI5:%.*]], %pred.load.continue3 ] |
61 |
| -; CHECK-VF1IC2: [[TMP0:%.*]] = getelementptr inbounds i32, ptr [[SRC1:%.*]], i64 {{%.*}} |
62 |
| -; CHECK-VF1IC2-NEXT: [[TMP1:%.*]] = getelementptr inbounds i32, ptr [[SRC1]], i64 {{%.*}} |
| 80 | +; CHECK-VF1IC2-LABEL: define i32 @pred_select_const_i32_from_icmp( |
| 81 | +; CHECK-VF1IC2-SAME: ptr noalias readonly captures(none) [[SRC1:%.*]], ptr noalias readonly captures(none) [[SRC2:%.*]], i64 [[N:%.*]]) { |
| 82 | +; CHECK-VF1IC2-NEXT: [[ENTRY:.*]]: |
| 83 | +; CHECK-VF1IC2-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[N]], 2 |
| 84 | +; CHECK-VF1IC2-NEXT: br i1 [[MIN_ITERS_CHECK]], label %[[SCALAR_PH:.*]], label %[[VECTOR_PH:.*]] |
| 85 | +; CHECK-VF1IC2: [[VECTOR_PH]]: |
| 86 | +; CHECK-VF1IC2-NEXT: [[N_MOD_VF:%.*]] = urem i64 [[N]], 2 |
| 87 | +; CHECK-VF1IC2-NEXT: [[N_VEC:%.*]] = sub i64 [[N]], [[N_MOD_VF]] |
| 88 | +; CHECK-VF1IC2-NEXT: br label %[[VECTOR_BODY:.*]] |
| 89 | +; CHECK-VF1IC2: [[VECTOR_BODY]]: |
| 90 | +; CHECK-VF1IC2-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[PRED_LOAD_CONTINUE3:.*]] ] |
| 91 | +; CHECK-VF1IC2-NEXT: [[VEC_PHI:%.*]] = phi i1 [ false, %[[VECTOR_PH]] ], [ [[PREDPHI:%.*]], %[[PRED_LOAD_CONTINUE3]] ] |
| 92 | +; CHECK-VF1IC2-NEXT: [[VEC_PHI2:%.*]] = phi i1 [ false, %[[VECTOR_PH]] ], [ [[PREDPHI5:%.*]], %[[PRED_LOAD_CONTINUE3]] ] |
| 93 | +; CHECK-VF1IC2-NEXT: [[TMP16:%.*]] = add i64 [[INDEX]], 0 |
| 94 | +; CHECK-VF1IC2-NEXT: [[TMP17:%.*]] = add i64 [[INDEX]], 1 |
| 95 | +; CHECK-VF1IC2-NEXT: [[TMP0:%.*]] = getelementptr inbounds i32, ptr [[SRC1]], i64 [[TMP16]] |
| 96 | +; CHECK-VF1IC2-NEXT: [[TMP1:%.*]] = getelementptr inbounds i32, ptr [[SRC1]], i64 [[TMP17]] |
63 | 97 | ; CHECK-VF1IC2-NEXT: [[TMP2:%.*]] = load i32, ptr [[TMP0]], align 4
|
64 | 98 | ; CHECK-VF1IC2-NEXT: [[TMP3:%.*]] = load i32, ptr [[TMP1]], align 4
|
65 | 99 | ; CHECK-VF1IC2-NEXT: [[TMP4:%.*]] = icmp sgt i32 [[TMP2]], 35
|
66 | 100 | ; CHECK-VF1IC2-NEXT: [[TMP5:%.*]] = icmp sgt i32 [[TMP3]], 35
|
67 |
| -; CHECK-VF1IC2-NEXT: br i1 [[TMP4]], label %pred.load.if, label %pred.load.continue |
68 |
| -; CHECK-VF1IC2: pred.load.if: |
69 |
| -; CHECK-VF1IC2-NEXT: [[TMP6:%.*]] = getelementptr inbounds i32, ptr [[SRC2:%.*]], i64 {{%.*}} |
| 101 | +; CHECK-VF1IC2-NEXT: br i1 [[TMP4]], label %[[PRED_LOAD_IF:.*]], label %[[PRED_LOAD_CONTINUE:.*]] |
| 102 | +; CHECK-VF1IC2: [[PRED_LOAD_IF]]: |
| 103 | +; CHECK-VF1IC2-NEXT: [[TMP6:%.*]] = getelementptr inbounds i32, ptr [[SRC2]], i64 [[TMP16]] |
70 | 104 | ; CHECK-VF1IC2-NEXT: [[TMP7:%.*]] = load i32, ptr [[TMP6]], align 4
|
71 |
| -; CHECK-VF1IC2-NEXT: br label %pred.load.continue |
72 |
| -; CHECK-VF1IC2: pred.load.continue: |
73 |
| -; CHECK-VF1IC2-NEXT: [[TMP8:%.*]] = phi i32 [ poison, %vector.body ], [ [[TMP7]], %pred.load.if ] |
74 |
| -; CHECK-VF1IC2-NEXT: br i1 [[TMP5]], label %pred.load.if2, label %pred.load.continue3 |
75 |
| -; CHECK-VF1IC2: pred.load.if2: |
76 |
| -; CHECK-VF1IC2-NEXT: [[TMP9:%.*]] = getelementptr inbounds i32, ptr [[SRC2]], i64 {{%.*}} |
| 105 | +; CHECK-VF1IC2-NEXT: br label %[[PRED_LOAD_CONTINUE]] |
| 106 | +; CHECK-VF1IC2: [[PRED_LOAD_CONTINUE]]: |
| 107 | +; CHECK-VF1IC2-NEXT: [[TMP8:%.*]] = phi i32 [ poison, %[[VECTOR_BODY]] ], [ [[TMP7]], %[[PRED_LOAD_IF]] ] |
| 108 | +; CHECK-VF1IC2-NEXT: br i1 [[TMP5]], label %[[PRED_LOAD_IF2:.*]], label %[[PRED_LOAD_CONTINUE3]] |
| 109 | +; CHECK-VF1IC2: [[PRED_LOAD_IF2]]: |
| 110 | +; CHECK-VF1IC2-NEXT: [[TMP9:%.*]] = getelementptr inbounds i32, ptr [[SRC2]], i64 [[TMP17]] |
77 | 111 | ; CHECK-VF1IC2-NEXT: [[TMP10:%.*]] = load i32, ptr [[TMP9]], align 4
|
78 |
| -; CHECK-VF1IC2-NEXT: br label %pred.load.continue3 |
79 |
| -; CHECK-VF1IC2: pred.load.continue3: |
80 |
| -; CHECK-VF1IC2-NEXT: [[TMP11:%.*]] = phi i32 [ poison, %pred.load.continue ], [ [[TMP10]], %pred.load.if2 ] |
| 112 | +; CHECK-VF1IC2-NEXT: br label %[[PRED_LOAD_CONTINUE3]] |
| 113 | +; CHECK-VF1IC2: [[PRED_LOAD_CONTINUE3]]: |
| 114 | +; CHECK-VF1IC2-NEXT: [[TMP11:%.*]] = phi i32 [ poison, %[[PRED_LOAD_CONTINUE]] ], [ [[TMP10]], %[[PRED_LOAD_IF2]] ] |
81 | 115 | ; CHECK-VF1IC2-NEXT: [[TMP12:%.*]] = icmp eq i32 [[TMP8]], 2
|
82 | 116 | ; CHECK-VF1IC2-NEXT: [[TMP13:%.*]] = icmp eq i32 [[TMP11]], 2
|
83 | 117 | ; CHECK-VF1IC2-NEXT: [[TMP14:%.*]] = or i1 [[VEC_PHI]], [[TMP12]]
|
84 | 118 | ; CHECK-VF1IC2-NEXT: [[TMP15:%.*]] = or i1 [[VEC_PHI2]], [[TMP13]]
|
85 | 119 | ; CHECK-VF1IC2-NEXT: [[PREDPHI]] = select i1 [[TMP4]], i1 [[TMP14]], i1 [[VEC_PHI]]
|
86 | 120 | ; CHECK-VF1IC2-NEXT: [[PREDPHI5]] = select i1 [[TMP5]], i1 [[TMP15]], i1 [[VEC_PHI2]]
|
87 |
| -; CHECK-VF1IC2: br i1 {{%.*}}, label %middle.block, label %vector.body |
88 |
| -; CHECK-VF1IC2: middle.block: |
| 121 | +; CHECK-VF1IC2-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 2 |
| 122 | +; CHECK-VF1IC2-NEXT: [[TMP18:%.*]] = icmp eq i64 [[INDEX_NEXT]], [[N_VEC]] |
| 123 | +; CHECK-VF1IC2-NEXT: br i1 [[TMP18]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP0:![0-9]+]] |
| 124 | +; CHECK-VF1IC2: [[MIDDLE_BLOCK]]: |
89 | 125 | ; CHECK-VF1IC2-NEXT: [[OR:%.*]] = or i1 [[PREDPHI5]], [[PREDPHI]]
|
90 | 126 | ; CHECK-VF1IC2-NEXT: [[FR_OR:%.*]] = freeze i1 [[OR]]
|
91 | 127 | ; CHECK-VF1IC2-NEXT: [[RDX_SELECT:%.*]] = select i1 [[FR_OR]], i32 1, i32 0
|
92 |
| -; CHECK-VF1IC2-NEXT: %cmp.n = icmp eq i64 %n, %n.vec |
93 |
| -; CHECK-VF1IC2: br i1 %cmp.n, label %for.end.loopexit, label %scalar.ph |
94 |
| -; CHECK-VF1IC2: scalar.ph: |
95 |
| -; CHECK-VF1IC2-NEXT: [[BC_RESUME_VAL:%.*]] = phi i64 [ {{%.*}}, %middle.block ], [ 0, %entry ] |
96 |
| -; CHECK-VF1IC2-NEXT: [[BC_MERGE_RDX:%.*]] = phi i32 [ [[RDX_SELECT]], %middle.block ], [ 0, %entry ] |
97 |
| -; CHECK-VF1IC2-NEXT: br label %for.body |
98 |
| -; CHECK-VF1IC2: for.body: |
99 |
| -; CHECK-VF1IC2-NEXT: [[I_013:%.*]] = phi i64 [ [[INC:%.*]], %for.inc ], [ [[BC_RESUME_VAL]], %scalar.ph ] |
100 |
| -; CHECK-VF1IC2-NEXT: [[R_012:%.*]] = phi i32 [ [[R_1:%.*]], %for.inc ], [ [[BC_MERGE_RDX]], %scalar.ph ] |
101 |
| -; CHECK-VF1IC2: [[TMP19:%.*]] = load i32, ptr {{%.*}}, align 4 |
| 128 | +; CHECK-VF1IC2-NEXT: [[CMP_N:%.*]] = icmp eq i64 [[N]], [[N_VEC]] |
| 129 | +; CHECK-VF1IC2-NEXT: br i1 [[CMP_N]], label %[[FOR_END_LOOPEXIT:.*]], label %[[SCALAR_PH]] |
| 130 | +; CHECK-VF1IC2: [[SCALAR_PH]]: |
| 131 | +; CHECK-VF1IC2-NEXT: [[BC_RESUME_VAL:%.*]] = phi i64 [ [[N_VEC]], %[[MIDDLE_BLOCK]] ], [ 0, %[[ENTRY]] ] |
| 132 | +; CHECK-VF1IC2-NEXT: [[BC_MERGE_RDX:%.*]] = phi i32 [ [[RDX_SELECT]], %[[MIDDLE_BLOCK]] ], [ 0, %[[ENTRY]] ] |
| 133 | +; CHECK-VF1IC2-NEXT: br label %[[FOR_BODY:.*]] |
| 134 | +; CHECK-VF1IC2: [[FOR_BODY]]: |
| 135 | +; CHECK-VF1IC2-NEXT: [[I_013:%.*]] = phi i64 [ [[INC:%.*]], %[[FOR_INC:.*]] ], [ [[BC_RESUME_VAL]], %[[SCALAR_PH]] ] |
| 136 | +; CHECK-VF1IC2-NEXT: [[R_012:%.*]] = phi i32 [ [[R_1:%.*]], %[[FOR_INC]] ], [ [[BC_MERGE_RDX]], %[[SCALAR_PH]] ] |
| 137 | +; CHECK-VF1IC2-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, ptr [[SRC1]], i64 [[I_013]] |
| 138 | +; CHECK-VF1IC2-NEXT: [[TMP19:%.*]] = load i32, ptr [[ARRAYIDX]], align 4 |
102 | 139 | ; CHECK-VF1IC2-NEXT: [[CMP1:%.*]] = icmp sgt i32 [[TMP19]], 35
|
103 |
| -; CHECK-VF1IC2-NEXT: br i1 [[CMP1]], label [[IF_THEN:%.*]], label %for.inc |
104 |
| -; CHECK-VF1IC2: if.then: |
105 |
| -; CHECK-VF1IC2: [[TMP20:%.*]] = load i32, ptr {{%.*}}, align 4 |
| 140 | +; CHECK-VF1IC2-NEXT: br i1 [[CMP1]], label %[[IF_THEN:.*]], label %[[FOR_INC]] |
| 141 | +; CHECK-VF1IC2: [[IF_THEN]]: |
| 142 | +; CHECK-VF1IC2-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds i32, ptr [[SRC2]], i64 [[I_013]] |
| 143 | +; CHECK-VF1IC2-NEXT: [[TMP20:%.*]] = load i32, ptr [[ARRAYIDX2]], align 4 |
106 | 144 | ; CHECK-VF1IC2-NEXT: [[CMP3:%.*]] = icmp eq i32 [[TMP20]], 2
|
107 | 145 | ; CHECK-VF1IC2-NEXT: [[SPEC_SELECT:%.*]] = select i1 [[CMP3]], i32 1, i32 [[R_012]]
|
108 |
| -; CHECK-VF1IC2-NEXT: br label %for.inc |
109 |
| -; CHECK-VF1IC2: for.inc: |
110 |
| -; CHECK-VF1IC2-NEXT: [[R_1]] = phi i32 [ [[R_012]], %for.body ], [ [[SPEC_SELECT]], %if.then ] |
111 |
| -; CHECK-VF1IC2: br i1 {{%.*}}, label %for.end.loopexit, label %for.body |
112 |
| -; CHECK-VF1IC2: for.end.loopexit: |
113 |
| -; CHECK-VF1IC2-NEXT: [[R_1_LCSSA:%.*]] = phi i32 [ [[R_1]], %for.inc ], [ [[RDX_SELECT]], %middle.block ] |
| 146 | +; CHECK-VF1IC2-NEXT: br label %[[FOR_INC]] |
| 147 | +; CHECK-VF1IC2: [[FOR_INC]]: |
| 148 | +; CHECK-VF1IC2-NEXT: [[R_1]] = phi i32 [ [[R_012]], %[[FOR_BODY]] ], [ [[SPEC_SELECT]], %[[IF_THEN]] ] |
| 149 | +; CHECK-VF1IC2-NEXT: [[INC]] = add nuw nsw i64 [[I_013]], 1 |
| 150 | +; CHECK-VF1IC2-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[INC]], [[N]] |
| 151 | +; CHECK-VF1IC2-NEXT: br i1 [[EXITCOND_NOT]], label %[[FOR_END_LOOPEXIT]], label %[[FOR_BODY]], !llvm.loop [[LOOP3:![0-9]+]] |
| 152 | +; CHECK-VF1IC2: [[FOR_END_LOOPEXIT]]: |
| 153 | +; CHECK-VF1IC2-NEXT: [[R_1_LCSSA:%.*]] = phi i32 [ [[R_1]], %[[FOR_INC]] ], [ [[RDX_SELECT]], %[[MIDDLE_BLOCK]] ] |
114 | 154 | ; CHECK-VF1IC2-NEXT: ret i32 [[R_1_LCSSA]]
|
115 | 155 | ;
|
116 | 156 | entry:
|
@@ -141,3 +181,14 @@ for.end.loopexit: ; preds = %for.inc
|
141 | 181 | %r.1.lcssa = phi i32 [ %r.1, %for.inc ]
|
142 | 182 | ret i32 %r.1.lcssa
|
143 | 183 | }
|
| 184 | +;. |
| 185 | +; CHECK-VF2IC1: [[LOOP0]] = distinct !{[[LOOP0]], [[META1:![0-9]+]], [[META2:![0-9]+]]} |
| 186 | +; CHECK-VF2IC1: [[META1]] = !{!"llvm.loop.isvectorized", i32 1} |
| 187 | +; CHECK-VF2IC1: [[META2]] = !{!"llvm.loop.unroll.runtime.disable"} |
| 188 | +; CHECK-VF2IC1: [[LOOP3]] = distinct !{[[LOOP3]], [[META2]], [[META1]]} |
| 189 | +;. |
| 190 | +; CHECK-VF1IC2: [[LOOP0]] = distinct !{[[LOOP0]], [[META1:![0-9]+]], [[META2:![0-9]+]]} |
| 191 | +; CHECK-VF1IC2: [[META1]] = !{!"llvm.loop.isvectorized", i32 1} |
| 192 | +; CHECK-VF1IC2: [[META2]] = !{!"llvm.loop.unroll.runtime.disable"} |
| 193 | +; CHECK-VF1IC2: [[LOOP3]] = distinct !{[[LOOP3]], [[META1]]} |
| 194 | +;. |
0 commit comments