Index: lib/Analysis/ValueTracking.cpp =================================================================== --- lib/Analysis/ValueTracking.cpp +++ lib/Analysis/ValueTracking.cpp @@ -4073,29 +4073,45 @@ RHS = FalseVal; // Recognize variations of: - // CLAMP(v,l,h) ==> ((v) < (l) ? (l) : ((v) > (h) ? (h) : (v))) + // + // CLAMP(v,l,h) ==> ((v) < (l) ? (l) : ((v) > (h) ? (h) : (v))) + // + // We don't want to break the canonical form for further matchers in this + // function. That is why just create new pointers to false, true values and + // new predicate so that we can match only one order of select values to + // recognize clamp. const APInt *C1; - if (CmpRHS == TrueVal && match(CmpRHS, m_APInt(C1))) { + Value *TrueValPtr = TrueVal, *FalseValPtr = FalseVal; + CmpInst::Predicate NewPred = Pred; + if (CmpRHS != TrueVal) { + std::swap(TrueValPtr, FalseValPtr); + NewPred = CmpInst::getInversePredicate(Pred); + } + if (CmpRHS == TrueValPtr && match(CmpRHS, m_APInt(C1))) { const APInt *C2; // (X SMAX(SMIN(X, C2), C1) - if (match(FalseVal, m_SMin(m_Specific(CmpLHS), m_APInt(C2))) && - C1->slt(*C2) && Pred == CmpInst::ICMP_SLT) + // (X <=s C1) ? C1 : SMIN(X, C2) ==> SMAX(SMIN(X, C2), C1) + if (match(FalseValPtr, m_SMin(m_Specific(CmpLHS), m_APInt(C2))) && + C1->slt(*C2) && (NewPred == CmpInst::ICMP_SLT || NewPred == CmpInst::ICMP_SLE)) return {SPF_SMAX, SPNB_NA, false}; // (X >s C1) ? C1 : SMAX(X, C2) ==> SMIN(SMAX(X, C2), C1) - if (match(FalseVal, m_SMax(m_Specific(CmpLHS), m_APInt(C2))) && - C1->sgt(*C2) && Pred == CmpInst::ICMP_SGT) + // (X >=s C1) ? C1 : SMAX(X, C2) ==> SMIN(SMAX(X, C2), C1) + if (match(FalseValPtr, m_SMax(m_Specific(CmpLHS), m_APInt(C2))) && + C1->sgt(*C2) && (NewPred == CmpInst::ICMP_SGT || NewPred == CmpInst::ICMP_SGE)) return {SPF_SMIN, SPNB_NA, false}; // (X UMAX(UMIN(X, C2), C1) - if (match(FalseVal, m_UMin(m_Specific(CmpLHS), m_APInt(C2))) && - C1->ult(*C2) && Pred == CmpInst::ICMP_ULT) + // (X <=u C1) ? C1 : UMIN(X, C2) ==> UMAX(UMIN(X, C2), C1) + if (match(FalseValPtr, m_UMin(m_Specific(CmpLHS), m_APInt(C2))) && + C1->ult(*C2) && (NewPred == CmpInst::ICMP_ULT || NewPred == CmpInst::ICMP_ULE)) return {SPF_UMAX, SPNB_NA, false}; // (X >u C1) ? C1 : UMAX(X, C2) ==> UMIN(UMAX(X, C2), C1) - if (match(FalseVal, m_UMax(m_Specific(CmpLHS), m_APInt(C2))) && - C1->ugt(*C2) && Pred == CmpInst::ICMP_UGT) + // (X >=u C1) ? C1 : UMAX(X, C2) ==> UMIN(UMAX(X, C2), C1) + if (match(FalseValPtr, m_UMax(m_Specific(CmpLHS), m_APInt(C2))) && + C1->ugt(*C2) && (NewPred == CmpInst::ICMP_UGT || NewPred == CmpInst::ICMP_UGE)) return {SPF_UMIN, SPNB_NA, false}; } Index: test/CodeGen/NVPTX/minmax-negative.ll =================================================================== --- /dev/null +++ test/CodeGen/NVPTX/minmax-negative.ll @@ -0,0 +1,9 @@ +; RUN: llc < %s -march=nvptx -O0 | FileCheck %s + +define i16 @test1(i16* %sur1) { +; CHECK-NOT: mov.u16 %rs{{[0-9]+}}, 32767 + %_tmp21.i = icmp sle i16 0, 0 + %_tmp22.i = select i1 %_tmp21.i, i16 0, i16 32767 + store i16 %_tmp22.i, i16* %sur1 + ret i16 0 +} Index: test/Transforms/InstCombine/minmax-fold.ll =================================================================== --- test/Transforms/InstCombine/minmax-fold.ll +++ test/Transforms/InstCombine/minmax-fold.ll @@ -404,8 +404,8 @@ ; CHECK-LABEL: @clamp_signed3( ; CHECK-NEXT: [[CMP2:%.*]] = icmp slt i32 [[X:%.*]], 255 ; CHECK-NEXT: [[MIN:%.*]] = select i1 [[CMP2]], i32 [[X]], i32 255 -; CHECK-NEXT: [[CMP1:%.*]] = icmp sgt i32 [[X]], 15 -; CHECK-NEXT: [[R:%.*]] = select i1 [[CMP1]], i32 [[MIN]], i32 15 +; CHECK-NEXT: [[TMP1:%.*]] = icmp sgt i32 [[MIN]], 15 +; CHECK-NEXT: [[R:%.*]] = select i1 [[TMP1]], i32 [[MIN]], i32 15 ; CHECK-NEXT: ret i32 [[R]] ; %cmp2 = icmp slt i32 %x, 255 @@ -421,8 +421,8 @@ ; CHECK-LABEL: @clamp_signed4( ; CHECK-NEXT: [[CMP2:%.*]] = icmp sgt i32 [[X:%.*]], 15 ; CHECK-NEXT: [[MAX:%.*]] = select i1 [[CMP2]], i32 [[X]], i32 15 -; CHECK-NEXT: [[CMP1:%.*]] = icmp slt i32 [[X]], 255 -; CHECK-NEXT: [[R:%.*]] = select i1 [[CMP1]], i32 [[MAX]], i32 255 +; CHECK-NEXT: [[TMP1:%.*]] = icmp slt i32 [[MAX]], 255 +; CHECK-NEXT: [[R:%.*]] = select i1 [[TMP1]], i32 [[MAX]], i32 255 ; CHECK-NEXT: ret i32 [[R]] ; %cmp2 = icmp sgt i32 %x, 15 @@ -472,8 +472,8 @@ ; CHECK-LABEL: @clamp_unsigned3( ; CHECK-NEXT: [[CMP2:%.*]] = icmp ult i32 [[X:%.*]], 255 ; CHECK-NEXT: [[MIN:%.*]] = select i1 [[CMP2]], i32 [[X]], i32 255 -; CHECK-NEXT: [[CMP1:%.*]] = icmp ugt i32 [[X]], 15 -; CHECK-NEXT: [[R:%.*]] = select i1 [[CMP1]], i32 [[MIN]], i32 15 +; CHECK-NEXT: [[TMP1:%.*]] = icmp ugt i32 [[MIN]], 15 +; CHECK-NEXT: [[R:%.*]] = select i1 [[TMP1]], i32 [[MIN]], i32 15 ; CHECK-NEXT: ret i32 [[R]] ; %cmp2 = icmp ult i32 %x, 255 @@ -489,8 +489,8 @@ ; CHECK-LABEL: @clamp_unsigned4( ; CHECK-NEXT: [[CMP2:%.*]] = icmp ugt i32 [[X:%.*]], 15 ; CHECK-NEXT: [[MAX:%.*]] = select i1 [[CMP2]], i32 [[X]], i32 15 -; CHECK-NEXT: [[CMP1:%.*]] = icmp ult i32 [[X]], 255 -; CHECK-NEXT: [[R:%.*]] = select i1 [[CMP1]], i32 [[MAX]], i32 255 +; CHECK-NEXT: [[TMP1:%.*]] = icmp ult i32 [[MAX]], 255 +; CHECK-NEXT: [[R:%.*]] = select i1 [[TMP1]], i32 [[MAX]], i32 255 ; CHECK-NEXT: ret i32 [[R]] ; %cmp2 = icmp ugt i32 %x, 15 @@ -523,8 +523,8 @@ ; CHECK-LABEL: @clamp_check_for_no_infinite_loop2( ; CHECK-NEXT: [[CMP1:%.*]] = icmp sgt i32 [[I:%.*]], -255 ; CHECK-NEXT: [[SEL1:%.*]] = select i1 [[CMP1]], i32 [[I]], i32 -255 -; CHECK-NEXT: [[CMP2:%.*]] = icmp slt i32 [[I]], 0 -; CHECK-NEXT: [[RES:%.*]] = select i1 [[CMP2]], i32 [[SEL1]], i32 0 +; CHECK-NEXT: [[TMP1:%.*]] = icmp slt i32 [[SEL1]], 0 +; CHECK-NEXT: [[RES:%.*]] = select i1 [[TMP1]], i32 [[SEL1]], i32 0 ; CHECK-NEXT: ret i32 [[RES]] ; %cmp1 = icmp sgt i32 %i, -255