Skip to content

Commit 691badc

Browse files
[InstCombine] C - ctpop(a) -> ctpop(~a) if C is bitwidth (PR50104)
Proof: https://alive2.llvm.org/ce/z/mncA9K
Solves https://bugs.llvm.org/show_bug.cgi?id=50104
Reviewed By: spatel
Differential Revision: https://reviews.llvm.org/D101257
1 parent 8705399 commit 691badc

File tree

3 files changed

+18
-11
lines changed

3 files changed

+18
-11
lines changed

llvm/lib/Transforms/InstCombine/InstCombineAddSub.cpp

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2112,6 +2112,13 @@ Instruction *InstCombinerImpl::visitSub(BinaryOperator &I) {
21122112
return replaceInstUsesWith(
21132113
I, Builder.CreateIntrinsic(Intrinsic::umin, {I.getType()}, {Op0, Y}));
21142114

2115+
// C - ctpop(X) => ctpop(~X) if C is bitwidth
2116+
if (match(Op0, m_SpecificInt(Ty->getScalarSizeInBits())) &&
2117+
match(Op1, m_OneUse(m_Intrinsic<Intrinsic::ctpop>(m_Value(X)))))
2118+
return replaceInstUsesWith(
2119+
I, Builder.CreateIntrinsic(Intrinsic::ctpop, {I.getType()},
2120+
{Builder.CreateNot(X)}));
2121+
21152122
return TryToNarrowDeduceFlags();
21162123
}
21172124

llvm/test/Transforms/InstCombine/ctpop-cttz.ll

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,7 @@ declare <2 x i32> @llvm.ctpop.v2i32(<2 x i32>)
88
; __builtin_popcount(i | -i) -> 32 - __builtin_cttz(i, false)
99
define i32 @ctpop1(i32 %0) {
1010
; CHECK-LABEL: @ctpop1(
11-
; CHECK-NEXT: [[TMP2:%.*]] = call i32 @llvm.cttz.i32(i32 [[TMP0:%.*]], i1 false), !range !0
11+
; CHECK-NEXT: [[TMP2:%.*]] = call i32 @llvm.cttz.i32(i32 [[TMP0:%.*]], i1 false), !range [[RNG0:![0-9]+]]
1212
; CHECK-NEXT: ret i32 [[TMP2]]
1313
;
1414
%2 = sub i32 0, %0
@@ -34,8 +34,8 @@ define i32 @ctpop1_multiuse(i32 %0) {
3434
; CHECK-LABEL: @ctpop1_multiuse(
3535
; CHECK-NEXT: [[TMP2:%.*]] = sub i32 0, [[TMP0:%.*]]
3636
; CHECK-NEXT: [[TMP3:%.*]] = or i32 [[TMP2]], [[TMP0]]
37-
; CHECK-NEXT: [[TMP4:%.*]] = tail call i32 @llvm.ctpop.i32(i32 [[TMP3]]), !range !0
38-
; CHECK-NEXT: [[TMP5:%.*]] = sub nuw nsw i32 32, [[TMP4]]
37+
; CHECK-NEXT: [[TMP4:%.*]] = xor i32 [[TMP3]], -1
38+
; CHECK-NEXT: [[TMP5:%.*]] = call i32 @llvm.ctpop.i32(i32 [[TMP4]]), !range [[RNG0]]
3939
; CHECK-NEXT: [[TMP6:%.*]] = add i32 [[TMP5]], [[TMP3]]
4040
; CHECK-NEXT: ret i32 [[TMP6]]
4141
;
@@ -51,7 +51,7 @@ define i32 @ctpop1_multiuse(i32 %0) {
5151
; __builtin_popcount(~i & (i-1)) -> __builtin_cttz(i, false)
5252
define i32 @ctpop2(i32 %0) {
5353
; CHECK-LABEL: @ctpop2(
54-
; CHECK-NEXT: [[TMP2:%.*]] = call i32 @llvm.cttz.i32(i32 [[TMP0:%.*]], i1 false), !range !0
54+
; CHECK-NEXT: [[TMP2:%.*]] = call i32 @llvm.cttz.i32(i32 [[TMP0:%.*]], i1 false), !range [[RNG0]]
5555
; CHECK-NEXT: ret i32 [[TMP2]]
5656
;
5757
%2 = xor i32 %0, -1
@@ -78,7 +78,7 @@ define i32 @ctpop2_multiuse(i32 %0) {
7878
; CHECK-NEXT: [[TMP2:%.*]] = xor i32 [[TMP0:%.*]], -1
7979
; CHECK-NEXT: [[TMP3:%.*]] = add i32 [[TMP0]], -1
8080
; CHECK-NEXT: [[TMP4:%.*]] = and i32 [[TMP3]], [[TMP2]]
81-
; CHECK-NEXT: [[TMP5:%.*]] = call i32 @llvm.cttz.i32(i32 [[TMP0]], i1 false), !range !0
81+
; CHECK-NEXT: [[TMP5:%.*]] = call i32 @llvm.cttz.i32(i32 [[TMP0]], i1 false), !range [[RNG0]]
8282
; CHECK-NEXT: [[TMP6:%.*]] = add i32 [[TMP5]], [[TMP4]]
8383
; CHECK-NEXT: ret i32 [[TMP6]]
8484
;

llvm/test/Transforms/InstCombine/ctpop.ll

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -292,9 +292,9 @@ declare i8 @llvm.fshr.i8(i8, i8, i8)
292292

293293
define i8 @sub_ctpop(i8 %a) {
294294
; CHECK-LABEL: @sub_ctpop(
295-
; CHECK-NEXT: [[CNT:%.*]] = tail call i8 @llvm.ctpop.i8(i8 [[A:%.*]]), !range [[RNG0]]
296-
; CHECK-NEXT: [[RES:%.*]] = sub nuw nsw i8 8, [[CNT]]
297-
; CHECK-NEXT: ret i8 [[RES]]
295+
; CHECK-NEXT: [[TMP1:%.*]] = xor i8 [[A:%.*]], -1
296+
; CHECK-NEXT: [[TMP2:%.*]] = call i8 @llvm.ctpop.i8(i8 [[TMP1]]), !range [[RNG0]]
297+
; CHECK-NEXT: ret i8 [[TMP2]]
298298
;
299299
%cnt = tail call i8 @llvm.ctpop.i8(i8 %a)
300300
%res = sub i8 8, %cnt
@@ -325,9 +325,9 @@ define i8 @sub_ctpop_unknown(i8 %a, i8 %b) {
325325

326326
define <2 x i32> @sub_ctpop_vec(<2 x i32> %a) {
327327
; CHECK-LABEL: @sub_ctpop_vec(
328-
; CHECK-NEXT: [[CNT:%.*]] = tail call <2 x i32> @llvm.ctpop.v2i32(<2 x i32> [[A:%.*]])
329-
; CHECK-NEXT: [[RES:%.*]] = sub nuw nsw <2 x i32> <i32 32, i32 32>, [[CNT]]
330-
; CHECK-NEXT: ret <2 x i32> [[RES]]
328+
; CHECK-NEXT: [[TMP1:%.*]] = xor <2 x i32> [[A:%.*]], <i32 -1, i32 -1>
329+
; CHECK-NEXT: [[TMP2:%.*]] = call <2 x i32> @llvm.ctpop.v2i32(<2 x i32> [[TMP1]])
330+
; CHECK-NEXT: ret <2 x i32> [[TMP2]]
331331
;
332332
%cnt = tail call <2 x i32> @llvm.ctpop.v2i32(<2 x i32> %a)
333333
%res = sub <2 x i32> <i32 32, i32 32>, %cnt

0 commit comments

Comments
 (0)