Skip to content

Commit 150a7ec

Browse files
committed
[InstCombine] Handle vector gep with scalar argument in evaluateInDifferentElementOrder
Summary: This fixes PR41270. The recursive function evaluateInDifferentElementOrder expects to be called on a vector Value, so when we call it on a vector GEP's arguments, we must first check that the argument is indeed a vector. Reviewers: reames, spatel Reviewed By: spatel Subscribers: llvm-commits Tags: #llvm Differential Revision: https://reviews.llvm.org/D60058 llvm-svn: 357389
1 parent ebf90db commit 150a7ec

File tree

2 files changed

+24
-1
lines changed

2 files changed

+24
-1
lines changed

llvm/lib/Transforms/InstCombine/InstCombineVectorOps.cpp

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1171,7 +1171,14 @@ static Value *evaluateInDifferentElementOrder(Value *V, ArrayRef<int> Mask) {
11711171
SmallVector<Value*, 8> NewOps;
11721172
bool NeedsRebuild = (Mask.size() != I->getType()->getVectorNumElements());
11731173
for (int i = 0, e = I->getNumOperands(); i != e; ++i) {
1174-
Value *V = evaluateInDifferentElementOrder(I->getOperand(i), Mask);
1174+
Value *V;
1175+
// Recursively call evaluateInDifferentElementOrder on vector arguments
1176+
// as well. E.g. GetElementPtr may have scalar operands even if the
1177+
// return value is a vector, so we need to examine the operand type.
1178+
if (I->getOperand(i)->getType()->isVectorTy())
1179+
V = evaluateInDifferentElementOrder(I->getOperand(i), Mask);
1180+
else
1181+
V = I->getOperand(i);
11751182
NewOps.push_back(V);
11761183
NeedsRebuild |= (V != I->getOperand(i));
11771184
}
Lines changed: 16 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,16 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
2+
; RUN: opt -instcombine -S < %s | FileCheck %s
3+
4+
define <4 x i16*> @PR41270([4 x i16]* %x) {
5+
; CHECK-LABEL: @PR41270(
6+
; CHECK-NEXT: [[TMP1:%.*]] = insertelement <4 x [4 x i16]*> undef, [4 x i16]* [[X:%.*]], i32 0
7+
; CHECK-NEXT: [[TMP2:%.*]] = getelementptr inbounds [4 x i16], <4 x [4 x i16]*> [[TMP1]], i64 0, i64 3
8+
; CHECK-NEXT: ret <4 x i16*> [[TMP2]]
9+
;
10+
%ins = insertelement <4 x [4 x i16]*> undef, [4 x i16]* %x, i32 0
11+
%splat = shufflevector <4 x [4 x i16]*> %ins, <4 x [4 x i16]*> undef, <4 x i32> zeroinitializer
12+
%t2 = getelementptr inbounds [4 x i16], <4 x [4 x i16]*> %splat, i32 0, i32 3
13+
%t3 = extractelement <4 x i16*> %t2, i32 3
14+
%ins2 = insertelement <4 x i16*> undef, i16* %t3, i32 0
15+
ret <4 x i16*> %ins2
16+
}

0 commit comments

Comments
 (0)