diff --git a/llvm/lib/Transforms/InstCombine/InstCombineAddSub.cpp b/llvm/lib/Transforms/InstCombine/InstCombineAddSub.cpp
--- a/llvm/lib/Transforms/InstCombine/InstCombineAddSub.cpp
+++ b/llvm/lib/Transforms/InstCombine/InstCombineAddSub.cpp
@@ -2112,6 +2112,15 @@
     return replaceInstUsesWith(
         I, Builder.CreateIntrinsic(Intrinsic::umin, {I.getType()}, {Op0, Y}));
 
+  // C - ctpop(X) => ctpop(~X) if C is bitwidth
+  // Every bit is set in exactly one of X and ~X, so
+  // ctpop(X) + ctpop(~X) == bitwidth. Only fold a single-use ctpop so the
+  // rewrite trades sub+ctpop for not+ctpop instead of adding a second ctpop.
+  if (match(Op0, m_SpecificInt(Ty->getScalarSizeInBits())) &&
+      match(Op1, m_OneUse(m_Intrinsic<Intrinsic::ctpop>(m_Value(X)))))
+    return replaceInstUsesWith(
+        I, Builder.CreateIntrinsic(Intrinsic::ctpop, {I.getType()},
+                                   {Builder.CreateNot(X)}));
+
   return TryToNarrowDeduceFlags();
 }
 
diff --git a/llvm/test/Transforms/InstCombine/ctpop.ll b/llvm/test/Transforms/InstCombine/ctpop.ll
--- a/llvm/test/Transforms/InstCombine/ctpop.ll
+++ b/llvm/test/Transforms/InstCombine/ctpop.ll
@@ -292,9 +292,9 @@
 
 define i8 @sub_ctpop(i8 %a) {
 ; CHECK-LABEL: @sub_ctpop(
-; CHECK-NEXT:    [[CNT:%.*]] = tail call i8 @llvm.ctpop.i8(i8 [[A:%.*]]), !range [[RNG0]]
-; CHECK-NEXT:    [[RES:%.*]] = sub nuw nsw i8 8, [[CNT]]
-; CHECK-NEXT:    ret i8 [[RES]]
+; CHECK-NEXT:    [[TMP1:%.*]] = xor i8 [[A:%.*]], -1
+; CHECK-NEXT:    [[TMP2:%.*]] = call i8 @llvm.ctpop.i8(i8 [[TMP1]]), !range [[RNG0]]
+; CHECK-NEXT:    ret i8 [[TMP2]]
 ;
   %cnt = tail call i8 @llvm.ctpop.i8(i8 %a)
   %res = sub i8 8, %cnt
@@ -325,9 +325,9 @@
 
 define <2 x i32> @sub_ctpop_vec(<2 x i32> %a) {
 ; CHECK-LABEL: @sub_ctpop_vec(
-; CHECK-NEXT:    [[CNT:%.*]] = tail call <2 x i32> @llvm.ctpop.v2i32(<2 x i32> [[A:%.*]])
-; CHECK-NEXT:    [[RES:%.*]] = sub nuw nsw <2 x i32> <i32 32, i32 32>, [[CNT]]
-; CHECK-NEXT:    ret <2 x i32> [[RES]]
+; CHECK-NEXT:    [[TMP1:%.*]] = xor <2 x i32> [[A:%.*]], <i32 -1, i32 -1>
+; CHECK-NEXT:    [[TMP2:%.*]] = call <2 x i32> @llvm.ctpop.v2i32(<2 x i32> [[TMP1]])
+; CHECK-NEXT:    ret <2 x i32> [[TMP2]]
 ;
   %cnt = tail call <2 x i32> @llvm.ctpop.v2i32(<2 x i32> %a)
   %res = sub <2 x i32> <i32 32, i32 32>, %cnt