comparison lib/Transforms/InstCombine/InstCombineShifts.cpp @ 121:803732b1fca8

LLVM 5.0
author kono
date Fri, 27 Oct 2017 17:07:41 +0900
parents 1172e4bd9c6f
children 3a76565eade5
comparing parent 120:1172e4bd9c6f (left column) with 121:803732b1fca8 (right column)
20 using namespace PatternMatch; 20 using namespace PatternMatch;
21 21
22 #define DEBUG_TYPE "instcombine" 22 #define DEBUG_TYPE "instcombine"
23 23
24 Instruction *InstCombiner::commonShiftTransforms(BinaryOperator &I) { 24 Instruction *InstCombiner::commonShiftTransforms(BinaryOperator &I) {
25 assert(I.getOperand(1)->getType() == I.getOperand(0)->getType());
26 Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1); 25 Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
26 assert(Op0->getType() == Op1->getType());
27 27
28 // See if we can fold away this shift. 28 // See if we can fold away this shift.
29 if (SimplifyDemandedInstructionBits(I)) 29 if (SimplifyDemandedInstructionBits(I))
30 return &I; 30 return &I;
31 31
42 // (C1 shift (A add C2)) -> ((C1 shift C2) shift A) 42 // (C1 shift (A add C2)) -> ((C1 shift C2) shift A)
43 // iff A and C2 are both positive. 43 // iff A and C2 are both positive.
44 Value *A; 44 Value *A;
45 Constant *C; 45 Constant *C;
46 if (match(Op0, m_Constant()) && match(Op1, m_Add(m_Value(A), m_Constant(C)))) 46 if (match(Op0, m_Constant()) && match(Op1, m_Add(m_Value(A), m_Constant(C))))
47 if (isKnownNonNegative(A, DL) && isKnownNonNegative(C, DL)) 47 if (isKnownNonNegative(A, DL, 0, &AC, &I, &DT) &&
48 isKnownNonNegative(C, DL, 0, &AC, &I, &DT))
48 return BinaryOperator::Create( 49 return BinaryOperator::Create(
49 I.getOpcode(), Builder->CreateBinOp(I.getOpcode(), Op0, C), A); 50 I.getOpcode(), Builder.CreateBinOp(I.getOpcode(), Op0, C), A);
50 51
51 // X shift (A srem B) -> X shift (A and B-1) iff B is a power of 2. 52 // X shift (A srem B) -> X shift (A and B-1) iff B is a power of 2.
52 // Because shifts by negative values (which could occur if A were negative) 53 // Because shifts by negative values (which could occur if A were negative)
53 // are undefined. 54 // are undefined.
54 const APInt *B; 55 const APInt *B;
55 if (Op1->hasOneUse() && match(Op1, m_SRem(m_Value(A), m_Power2(B)))) { 56 if (Op1->hasOneUse() && match(Op1, m_SRem(m_Value(A), m_Power2(B)))) {
56 // FIXME: Should this get moved into SimplifyDemandedBits by saying we don't 57 // FIXME: Should this get moved into SimplifyDemandedBits by saying we don't
57 // demand the sign bit (and many others) here?? 58 // demand the sign bit (and many others) here??
58 Value *Rem = Builder->CreateAnd(A, ConstantInt::get(I.getType(), *B-1), 59 Value *Rem = Builder.CreateAnd(A, ConstantInt::get(I.getType(), *B - 1),
59 Op1->getName()); 60 Op1->getName());
60 I.setOperand(1, Rem); 61 I.setOperand(1, Rem);
61 return &I; 62 return &I;
62 } 63 }
63 64
64 return nullptr; 65 return nullptr;
65 } 66 }
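
A minimal IR sketch of the two folds performed above (function and value names are illustrative, not from the source; the rewritten forms shown in comments are what opt -instcombine is expected to produce for code of this vintage, and may differ slightly between versions):

  ; (C1 shift (A add C2)) --> ((C1 shift C2) shift A), when A and C2 are non-negative
  define i32 @shift_amount_is_add(i32 %a) {
    %nonneg = and i32 %a, 15         ; makes the added value provably non-negative
    %amt = add i32 %nonneg, 3
    %r = shl i32 4, %amt             ; expected: shl i32 32, %nonneg
    ret i32 %r
  }

  ; X shift (A srem B) --> X shift (A and B-1), when B is a power of 2
  define i32 @shift_amount_is_srem(i32 %x, i32 %a) {
    %rem = srem i32 %a, 8
    %r = lshr i32 %x, %rem           ; expected shift amount: and i32 %a, 7
    ret i32 %r
  }
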
66 67
67 /// Return true if we can simplify two logical (either left or right) shifts 68 /// Return true if we can simplify two logical (either left or right) shifts
68 /// that have constant shift amounts. 69 /// that have constant shift amounts: OuterShift (InnerShift X, C1), C2.
69 static bool canEvaluateShiftedShift(unsigned FirstShiftAmt, 70 static bool canEvaluateShiftedShift(unsigned OuterShAmt, bool IsOuterShl,
70 bool IsFirstShiftLeft, 71 Instruction *InnerShift, InstCombiner &IC,
71 Instruction *SecondShift, InstCombiner &IC,
72 Instruction *CxtI) { 72 Instruction *CxtI) {
73 assert(SecondShift->isLogicalShift() && "Unexpected instruction type"); 73 assert(InnerShift->isLogicalShift() && "Unexpected instruction type");
74 74
75 // We need constant shifts. 75 // We need constant scalar or constant splat shifts.
76 auto *SecondShiftConst = dyn_cast<ConstantInt>(SecondShift->getOperand(1)); 76 const APInt *InnerShiftConst;
77 if (!SecondShiftConst) 77 if (!match(InnerShift->getOperand(1), m_APInt(InnerShiftConst)))
78 return false; 78 return false;
79 79
80 unsigned SecondShiftAmt = SecondShiftConst->getZExtValue(); 80 // Two logical shifts in the same direction:
81 bool IsSecondShiftLeft = SecondShift->getOpcode() == Instruction::Shl; 81 // shl (shl X, C1), C2 --> shl X, C1 + C2
82 82 // lshr (lshr X, C1), C2 --> lshr X, C1 + C2
83 // We can always fold shl(c1) + shl(c2) -> shl(c1+c2). 83 bool IsInnerShl = InnerShift->getOpcode() == Instruction::Shl;
84 // We can always fold lshr(c1) + lshr(c2) -> lshr(c1+c2). 84 if (IsInnerShl == IsOuterShl)
85 if (IsFirstShiftLeft == IsSecondShiftLeft)
86 return true; 85 return true;
87 86
88 // We can always fold lshr(c) + shl(c) -> and(c2). 87 // Equal shift amounts in opposite directions become bitwise 'and':
89 // We can always fold shl(c) + lshr(c) -> and(c2). 88 // lshr (shl X, C), C --> and X, C'
90 if (FirstShiftAmt == SecondShiftAmt) 89 // shl (lshr X, C), C --> and X, C'
90 unsigned InnerShAmt = InnerShiftConst->getZExtValue();
91 if (InnerShAmt == OuterShAmt)
91 return true; 92 return true;
92 93
93 unsigned TypeWidth = SecondShift->getType()->getScalarSizeInBits();
94
95 // If the 2nd shift is bigger than the 1st, we can fold: 94 // If the 2nd shift is bigger than the 1st, we can fold:
96 // lshr(c1) + shl(c2) -> shl(c3) + and(c4) or 95 // lshr (shl X, C1), C2 --> and (shl X, C1 - C2), C3
97 // shl(c1) + lshr(c2) -> lshr(c3) + and(c4), 96 // shl (lshr X, C1), C2 --> and (lshr X, C1 - C2), C3
98 // but it isn't profitable unless we know the and'd out bits are already zero. 97 // but it isn't profitable unless we know the and'd out bits are already zero.
99 // Also check that the 2nd shift is valid (less than the type width) or we'll 98 // Also, check that the inner shift is valid (less than the type width) or
100 // crash trying to produce the bit mask for the 'and'. 99 // we'll crash trying to produce the bit mask for the 'and'.
101 if (SecondShiftAmt > FirstShiftAmt && SecondShiftAmt < TypeWidth) { 100 unsigned TypeWidth = InnerShift->getType()->getScalarSizeInBits();
102 unsigned MaskShift = IsSecondShiftLeft ? TypeWidth - SecondShiftAmt 101 if (InnerShAmt > OuterShAmt && InnerShAmt < TypeWidth) {
103 : SecondShiftAmt - FirstShiftAmt; 102 unsigned MaskShift =
104 APInt Mask = APInt::getLowBitsSet(TypeWidth, FirstShiftAmt) << MaskShift; 103 IsInnerShl ? TypeWidth - InnerShAmt : InnerShAmt - OuterShAmt;
105 if (IC.MaskedValueIsZero(SecondShift->getOperand(0), Mask, 0, CxtI)) 104 APInt Mask = APInt::getLowBitsSet(TypeWidth, OuterShAmt) << MaskShift;
105 if (IC.MaskedValueIsZero(InnerShift->getOperand(0), Mask, 0, CxtI))
106 return true; 106 return true;
107 } 107 }
108 108
109 return false; 109 return false;
110 } 110 }
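
A small worked example of the last case above (illustrative names; the zext is only there to make the masked-off bits provably zero): with a 32-bit type, an inner shl of 8 and an outer lshr of 3, the mask is the low 3 bits shifted up by 32 - 8 = 24, so bits 24..26 of the inner shift's operand must be known zero.

  define i32 @shl_then_lshr(i16 %x) {
    %z = zext i16 %x to i32          ; bits 16..31 of %z are zero, so bits 24..26 are zero
    %s = shl i32 %z, 8
    %r = lshr i32 %s, 3
    ret i32 %r                       ; can be computed as: shl i32 %z, 5 (no 'and' needed)
  }
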
111 111
112 /// See if we can compute the specified value, but shifted 112 /// See if we can compute the specified value, but shifted logically to the left
113 /// logically to the left or right by some number of bits. This should return 113 /// or right by some number of bits. This should return true if the expression
114 /// true if the expression can be computed for the same cost as the current 114 /// can be computed for the same cost as the current expression tree. This is
115 /// expression tree. This is used to eliminate extraneous shifting from things 115 /// used to eliminate extraneous shifting from things like:
116 /// like:
117 /// %C = shl i128 %A, 64 116 /// %C = shl i128 %A, 64
118 /// %D = shl i128 %B, 96 117 /// %D = shl i128 %B, 96
119 /// %E = or i128 %C, %D 118 /// %E = or i128 %C, %D
120 /// %F = lshr i128 %E, 64 119 /// %F = lshr i128 %E, 64
121 /// where the client will ask if E can be computed shifted right by 64-bits. If 120 /// where the client will ask if E can be computed shifted right by 64-bits. If
122 /// this succeeds, the GetShiftedValue function will be called to produce the 121 /// this succeeds, getShiftedValue() will be called to produce the value.
123 /// value. 122 static bool canEvaluateShifted(Value *V, unsigned NumBits, bool IsLeftShift,
124 static bool CanEvaluateShifted(Value *V, unsigned NumBits, bool IsLeftShift,
125 InstCombiner &IC, Instruction *CxtI) { 123 InstCombiner &IC, Instruction *CxtI) {
126 // We can always evaluate constants shifted. 124 // We can always evaluate constants shifted.
127 if (isa<Constant>(V)) 125 if (isa<Constant>(V))
128 return true; 126 return true;
129 127
163 default: return false; 161 default: return false;
164 case Instruction::And: 162 case Instruction::And:
165 case Instruction::Or: 163 case Instruction::Or:
166 case Instruction::Xor: 164 case Instruction::Xor:
167 // Bitwise operators can all be arbitrarily evaluated shifted. 165 // Bitwise operators can all be arbitrarily evaluated shifted.
168 return CanEvaluateShifted(I->getOperand(0), NumBits, IsLeftShift, IC, I) && 166 return canEvaluateShifted(I->getOperand(0), NumBits, IsLeftShift, IC, I) &&
169 CanEvaluateShifted(I->getOperand(1), NumBits, IsLeftShift, IC, I); 167 canEvaluateShifted(I->getOperand(1), NumBits, IsLeftShift, IC, I);
170 168
171 case Instruction::Shl: 169 case Instruction::Shl:
172 case Instruction::LShr: 170 case Instruction::LShr:
173 return canEvaluateShiftedShift(NumBits, IsLeftShift, I, IC, CxtI); 171 return canEvaluateShiftedShift(NumBits, IsLeftShift, I, IC, CxtI);
174 172
175 case Instruction::Select: { 173 case Instruction::Select: {
176 SelectInst *SI = cast<SelectInst>(I); 174 SelectInst *SI = cast<SelectInst>(I);
177 Value *TrueVal = SI->getTrueValue(); 175 Value *TrueVal = SI->getTrueValue();
178 Value *FalseVal = SI->getFalseValue(); 176 Value *FalseVal = SI->getFalseValue();
179 return CanEvaluateShifted(TrueVal, NumBits, IsLeftShift, IC, SI) && 177 return canEvaluateShifted(TrueVal, NumBits, IsLeftShift, IC, SI) &&
180 CanEvaluateShifted(FalseVal, NumBits, IsLeftShift, IC, SI); 178 canEvaluateShifted(FalseVal, NumBits, IsLeftShift, IC, SI);
181 } 179 }
182 case Instruction::PHI: { 180 case Instruction::PHI: {
183 // We can change a phi if we can change all operands. Note that we never 181 // We can change a phi if we can change all operands. Note that we never
184 // get into trouble with cyclic PHIs here because we only consider 182 // get into trouble with cyclic PHIs here because we only consider
185 // instructions with a single use. 183 // instructions with a single use.
186 PHINode *PN = cast<PHINode>(I); 184 PHINode *PN = cast<PHINode>(I);
187 for (Value *IncValue : PN->incoming_values()) 185 for (Value *IncValue : PN->incoming_values())
188 if (!CanEvaluateShifted(IncValue, NumBits, IsLeftShift, IC, PN)) 186 if (!canEvaluateShifted(IncValue, NumBits, IsLeftShift, IC, PN))
189 return false; 187 return false;
190 return true; 188 return true;
191 } 189 }
192 } 190 }
193 } 191 }
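
A sketch of the select case (illustrative names): the shift can be pushed into both arms of a single-use select, because each arm is itself evaluable shifted.

  define i32 @shift_through_select(i1 %c, i32 %x) {
    %s1 = shl i32 %x, 8
    %sel = select i1 %c, i32 %s1, i32 256
    %r = lshr i32 %sel, 8
    ; expected: the lshr disappears and %sel becomes a select between
    ; (and i32 %x, 16777215) and i32 1
    ret i32 %r
  }
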
194 192
195 /// When CanEvaluateShifted returned true for an expression, 193 /// Fold OuterShift (InnerShift X, C1), C2.
196 /// this value inserts the new computation that produces the shifted value. 194 /// See canEvaluateShiftedShift() for the constraints on these instructions.
197 static Value *GetShiftedValue(Value *V, unsigned NumBits, bool isLeftShift, 195 static Value *foldShiftedShift(BinaryOperator *InnerShift, unsigned OuterShAmt,
196 bool IsOuterShl,
197 InstCombiner::BuilderTy &Builder) {
198 bool IsInnerShl = InnerShift->getOpcode() == Instruction::Shl;
199 Type *ShType = InnerShift->getType();
200 unsigned TypeWidth = ShType->getScalarSizeInBits();
201
202 // We only accept shifts-by-a-constant in canEvaluateShifted().
203 const APInt *C1;
204 match(InnerShift->getOperand(1), m_APInt(C1));
205 unsigned InnerShAmt = C1->getZExtValue();
206
207 // Change the shift amount and clear the appropriate IR flags.
208 auto NewInnerShift = [&](unsigned ShAmt) {
209 InnerShift->setOperand(1, ConstantInt::get(ShType, ShAmt));
210 if (IsInnerShl) {
211 InnerShift->setHasNoUnsignedWrap(false);
212 InnerShift->setHasNoSignedWrap(false);
213 } else {
214 InnerShift->setIsExact(false);
215 }
216 return InnerShift;
217 };
218
219 // Two logical shifts in the same direction:
220 // shl (shl X, C1), C2 --> shl X, C1 + C2
221 // lshr (lshr X, C1), C2 --> lshr X, C1 + C2
222 if (IsInnerShl == IsOuterShl) {
223 // If this is an oversized composite shift, then unsigned shifts get 0.
224 if (InnerShAmt + OuterShAmt >= TypeWidth)
225 return Constant::getNullValue(ShType);
226
227 return NewInnerShift(InnerShAmt + OuterShAmt);
228 }
229
230 // Equal shift amounts in opposite directions become bitwise 'and':
231 // lshr (shl X, C), C --> and X, C'
232 // shl (lshr X, C), C --> and X, C'
233 if (InnerShAmt == OuterShAmt) {
234 APInt Mask = IsInnerShl
235 ? APInt::getLowBitsSet(TypeWidth, TypeWidth - OuterShAmt)
236 : APInt::getHighBitsSet(TypeWidth, TypeWidth - OuterShAmt);
237 Value *And = Builder.CreateAnd(InnerShift->getOperand(0),
238 ConstantInt::get(ShType, Mask));
239 if (auto *AndI = dyn_cast<Instruction>(And)) {
240 AndI->moveBefore(InnerShift);
241 AndI->takeName(InnerShift);
242 }
243 return And;
244 }
245
246 assert(InnerShAmt > OuterShAmt &&
247 "Unexpected opposite direction logical shift pair");
248
249 // In general, we would need an 'and' for this transform, but
250 // canEvaluateShiftedShift() guarantees that the masked-off bits are not used.
251 // lshr (shl X, C1), C2 --> shl X, C1 - C2
252 // shl (lshr X, C1), C2 --> lshr X, C1 - C2
253 return NewInnerShift(InnerShAmt - OuterShAmt);
254 }
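
Illustrative IR for the equal-amounts case handled above (names are mine, not from the source; expected results shown in the leading comments):

  ; lshr (shl X, 5), 5 --> and X, 134217727   (keeps the low 27 bits)
  define i32 @mask_low_bits(i32 %x) {
    %s = shl i32 %x, 5
    %r = lshr i32 %s, 5
    ret i32 %r
  }

  ; shl (lshr X, 5), 5 --> and X, -32          (clears the low 5 bits)
  define i32 @mask_high_bits(i32 %x) {
    %s = lshr i32 %x, 5
    %r = shl i32 %s, 5
    ret i32 %r
  }
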
255
256 /// When canEvaluateShifted() returns true for an expression, this function
257 /// inserts the new computation that produces the shifted value.
258 static Value *getShiftedValue(Value *V, unsigned NumBits, bool isLeftShift,
198 InstCombiner &IC, const DataLayout &DL) { 259 InstCombiner &IC, const DataLayout &DL) {
199 // We can always evaluate constants shifted. 260 // We can always evaluate constants shifted.
200 if (Constant *C = dyn_cast<Constant>(V)) { 261 if (Constant *C = dyn_cast<Constant>(V)) {
201 if (isLeftShift) 262 if (isLeftShift)
202 V = IC.Builder->CreateShl(C, NumBits); 263 V = IC.Builder.CreateShl(C, NumBits);
203 else 264 else
204 V = IC.Builder->CreateLShr(C, NumBits); 265 V = IC.Builder.CreateLShr(C, NumBits);
205 // If we got a constantexpr back, try to simplify it with TD info. 266 // If we got a constantexpr back, try to simplify it with TD info.
206 if (auto *C = dyn_cast<Constant>(V)) 267 if (auto *C = dyn_cast<Constant>(V))
207 if (auto *FoldedC = 268 if (auto *FoldedC =
208 ConstantFoldConstant(C, DL, &IC.getTargetLibraryInfo())) 269 ConstantFoldConstant(C, DL, &IC.getTargetLibraryInfo()))
209 V = FoldedC; 270 V = FoldedC;
218 case Instruction::And: 279 case Instruction::And:
219 case Instruction::Or: 280 case Instruction::Or:
220 case Instruction::Xor: 281 case Instruction::Xor:
221 // Bitwise operators can all be arbitrarily evaluated shifted. 282 // Bitwise operators can all be arbitrarily evaluated shifted.
222 I->setOperand( 283 I->setOperand(
223 0, GetShiftedValue(I->getOperand(0), NumBits, isLeftShift, IC, DL)); 284 0, getShiftedValue(I->getOperand(0), NumBits, isLeftShift, IC, DL));
224 I->setOperand( 285 I->setOperand(
225 1, GetShiftedValue(I->getOperand(1), NumBits, isLeftShift, IC, DL)); 286 1, getShiftedValue(I->getOperand(1), NumBits, isLeftShift, IC, DL));
226 return I; 287 return I;
227 288
228 case Instruction::Shl: { 289 case Instruction::Shl:
229 BinaryOperator *BO = cast<BinaryOperator>(I); 290 case Instruction::LShr:
230 unsigned TypeWidth = BO->getType()->getScalarSizeInBits(); 291 return foldShiftedShift(cast<BinaryOperator>(I), NumBits, isLeftShift,
231 292 IC.Builder);
232 // We only accept shifts-by-a-constant in CanEvaluateShifted.
233 ConstantInt *CI = cast<ConstantInt>(BO->getOperand(1));
234
235 // We can always fold shl(c1)+shl(c2) -> shl(c1+c2).
236 if (isLeftShift) {
237 // If this is oversized composite shift, then unsigned shifts get 0.
238 unsigned NewShAmt = NumBits+CI->getZExtValue();
239 if (NewShAmt >= TypeWidth)
240 return Constant::getNullValue(I->getType());
241
242 BO->setOperand(1, ConstantInt::get(BO->getType(), NewShAmt));
243 BO->setHasNoUnsignedWrap(false);
244 BO->setHasNoSignedWrap(false);
245 return I;
246 }
247
248 // We turn shl(c)+lshr(c) -> and(c2) if the input doesn't already have
249 // zeros.
250 if (CI->getValue() == NumBits) {
251 APInt Mask(APInt::getLowBitsSet(TypeWidth, TypeWidth - NumBits));
252 V = IC.Builder->CreateAnd(BO->getOperand(0),
253 ConstantInt::get(BO->getContext(), Mask));
254 if (Instruction *VI = dyn_cast<Instruction>(V)) {
255 VI->moveBefore(BO);
256 VI->takeName(BO);
257 }
258 return V;
259 }
260
261 // We turn shl(c1)+shr(c2) -> shl(c3)+and(c4), but only when we know that
262 // the and won't be needed.
263 assert(CI->getZExtValue() > NumBits);
264 BO->setOperand(1, ConstantInt::get(BO->getType(),
265 CI->getZExtValue() - NumBits));
266 BO->setHasNoUnsignedWrap(false);
267 BO->setHasNoSignedWrap(false);
268 return BO;
269 }
270 // FIXME: This is almost identical to the SHL case. Refactor both cases into
271 // a helper function.
272 case Instruction::LShr: {
273 BinaryOperator *BO = cast<BinaryOperator>(I);
274 unsigned TypeWidth = BO->getType()->getScalarSizeInBits();
275 // We only accept shifts-by-a-constant in CanEvaluateShifted.
276 ConstantInt *CI = cast<ConstantInt>(BO->getOperand(1));
277
278 // We can always fold lshr(c1)+lshr(c2) -> lshr(c1+c2).
279 if (!isLeftShift) {
280 // If this is oversized composite shift, then unsigned shifts get 0.
281 unsigned NewShAmt = NumBits+CI->getZExtValue();
282 if (NewShAmt >= TypeWidth)
283 return Constant::getNullValue(BO->getType());
284
285 BO->setOperand(1, ConstantInt::get(BO->getType(), NewShAmt));
286 BO->setIsExact(false);
287 return I;
288 }
289
290 // We turn lshr(c)+shl(c) -> and(c2) if the input doesn't already have
291 // zeros.
292 if (CI->getValue() == NumBits) {
293 APInt Mask(APInt::getHighBitsSet(TypeWidth, TypeWidth - NumBits));
294 V = IC.Builder->CreateAnd(I->getOperand(0),
295 ConstantInt::get(BO->getContext(), Mask));
296 if (Instruction *VI = dyn_cast<Instruction>(V)) {
297 VI->moveBefore(I);
298 VI->takeName(I);
299 }
300 return V;
301 }
302
303 // We turn lshr(c1)+shl(c2) -> lshr(c3)+and(c4), but only when we know that
304 // the and won't be needed.
305 assert(CI->getZExtValue() > NumBits);
306 BO->setOperand(1, ConstantInt::get(BO->getType(),
307 CI->getZExtValue() - NumBits));
308 BO->setIsExact(false);
309 return BO;
310 }
311 293
312 case Instruction::Select: 294 case Instruction::Select:
313 I->setOperand( 295 I->setOperand(
314 1, GetShiftedValue(I->getOperand(1), NumBits, isLeftShift, IC, DL)); 296 1, getShiftedValue(I->getOperand(1), NumBits, isLeftShift, IC, DL));
315 I->setOperand( 297 I->setOperand(
316 2, GetShiftedValue(I->getOperand(2), NumBits, isLeftShift, IC, DL)); 298 2, getShiftedValue(I->getOperand(2), NumBits, isLeftShift, IC, DL));
317 return I; 299 return I;
318 case Instruction::PHI: { 300 case Instruction::PHI: {
319 // We can change a phi if we can change all operands. Note that we never 301 // We can change a phi if we can change all operands. Note that we never
320 // get into trouble with cyclic PHIs here because we only consider 302 // get into trouble with cyclic PHIs here because we only consider
321 // instructions with a single use. 303 // instructions with a single use.
322 PHINode *PN = cast<PHINode>(I); 304 PHINode *PN = cast<PHINode>(I);
323 for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i) 305 for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i)
324 PN->setIncomingValue(i, GetShiftedValue(PN->getIncomingValue(i), NumBits, 306 PN->setIncomingValue(i, getShiftedValue(PN->getIncomingValue(i), NumBits,
325 isLeftShift, IC, DL)); 307 isLeftShift, IC, DL));
326 return PN; 308 return PN;
327 } 309 }
328 } 310 }
329 } 311 }
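
Putting canEvaluateShifted() and getShiftedValue() together, a narrower variant of the i128 example from the doc comment above (illustrative names; the zext keeps the second operand's masked-off bits known zero so the whole expression qualifies):

  define i32 @or_of_shifts(i32 %a, i8 %b) {
    %bz = zext i8 %b to i32
    %c = shl i32 %a, 16
    %d = shl i32 %bz, 24
    %e = or i32 %c, %d
    ; expected: the lshr below is eliminated and %e becomes
    ; or i32 (and i32 %a, 65535), (shl i32 %bz, 8)
    %f = lshr i32 %e, 16
    ret i32 %f
  }
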
330
331
332 312
333 Instruction *InstCombiner::FoldShiftByConstant(Value *Op0, Constant *Op1, 313 Instruction *InstCombiner::FoldShiftByConstant(Value *Op0, Constant *Op1,
334 BinaryOperator &I) { 314 BinaryOperator &I) {
335 bool isLeftShift = I.getOpcode() == Instruction::Shl; 315 bool isLeftShift = I.getOpcode() == Instruction::Shl;
336 316
337 ConstantInt *COp1 = nullptr; 317 const APInt *Op1C;
338 if (ConstantDataVector *CV = dyn_cast<ConstantDataVector>(Op1)) 318 if (!match(Op1, m_APInt(Op1C)))
339 COp1 = dyn_cast_or_null<ConstantInt>(CV->getSplatValue());
340 else if (ConstantVector *CV = dyn_cast<ConstantVector>(Op1))
341 COp1 = dyn_cast_or_null<ConstantInt>(CV->getSplatValue());
342 else
343 COp1 = dyn_cast<ConstantInt>(Op1);
344
345 if (!COp1)
346 return nullptr; 319 return nullptr;
347 320
348 // See if we can propagate this shift into the input, this covers the trivial 321 // See if we can propagate this shift into the input, this covers the trivial
349 // cast of lshr(shl(x,c1),c2) as well as other more complex cases. 322 // cast of lshr(shl(x,c1),c2) as well as other more complex cases.
350 if (I.getOpcode() != Instruction::AShr && 323 if (I.getOpcode() != Instruction::AShr &&
351 CanEvaluateShifted(Op0, COp1->getZExtValue(), isLeftShift, *this, &I)) { 324 canEvaluateShifted(Op0, Op1C->getZExtValue(), isLeftShift, *this, &I)) {
352 DEBUG(dbgs() << "ICE: GetShiftedValue propagating shift through expression" 325 DEBUG(dbgs() << "ICE: GetShiftedValue propagating shift through expression"
353 " to eliminate shift:\n IN: " << *Op0 << "\n SH: " << I <<"\n"); 326 " to eliminate shift:\n IN: " << *Op0 << "\n SH: " << I <<"\n");
354 327
355 return replaceInstUsesWith( 328 return replaceInstUsesWith(
356 I, GetShiftedValue(Op0, COp1->getZExtValue(), isLeftShift, *this, DL)); 329 I, getShiftedValue(Op0, Op1C->getZExtValue(), isLeftShift, *this, DL));
357 } 330 }
358 331
359 // See if we can simplify any instructions used by the instruction whose sole 332 // See if we can simplify any instructions used by the instruction whose sole
360 // purpose is to compute bits we don't care about. 333 // purpose is to compute bits we don't care about.
361 uint32_t TypeBits = Op0->getType()->getScalarSizeInBits(); 334 unsigned TypeBits = Op0->getType()->getScalarSizeInBits();
362 335
363 assert(!COp1->uge(TypeBits) && 336 assert(!Op1C->uge(TypeBits) &&
364 "Shift over the type width should have been removed already"); 337 "Shift over the type width should have been removed already");
365 338
366 // ((X*C1) << C2) == (X * (C1 << C2)) 339 if (Instruction *FoldedShift = foldOpWithConstantIntoOperand(I))
367 if (BinaryOperator *BO = dyn_cast<BinaryOperator>(Op0)) 340 return FoldedShift;
368 if (BO->getOpcode() == Instruction::Mul && isLeftShift)
369 if (Constant *BOOp = dyn_cast<Constant>(BO->getOperand(1)))
370 return BinaryOperator::CreateMul(BO->getOperand(0),
371 ConstantExpr::getShl(BOOp, Op1));
372
373 // Try to fold constant and into select arguments.
374 if (SelectInst *SI = dyn_cast<SelectInst>(Op0))
375 if (Instruction *R = FoldOpIntoSelect(I, SI))
376 return R;
377 if (isa<PHINode>(Op0))
378 if (Instruction *NV = FoldOpIntoPhi(I))
379 return NV;
380 341
381 // Fold shift2(trunc(shift1(x,c1)), c2) -> trunc(shift2(shift1(x,c1),c2)) 342 // Fold shift2(trunc(shift1(x,c1)), c2) -> trunc(shift2(shift1(x,c1),c2))
382 if (TruncInst *TI = dyn_cast<TruncInst>(Op0)) { 343 if (TruncInst *TI = dyn_cast<TruncInst>(Op0)) {
383 Instruction *TrOp = dyn_cast<Instruction>(TI->getOperand(0)); 344 Instruction *TrOp = dyn_cast<Instruction>(TI->getOperand(0));
384 // If 'shift2' is an ashr, we would have to get the sign bit into a funny 345 // If 'shift2' is an ashr, we would have to get the sign bit into a funny
387 // confidence that the shifts will get folded together. We could do this 348 // confidence that the shifts will get folded together. We could do this
388 // xform in more cases, but it is unlikely to be profitable. 349 // xform in more cases, but it is unlikely to be profitable.
389 if (TrOp && I.isLogicalShift() && TrOp->isShift() && 350 if (TrOp && I.isLogicalShift() && TrOp->isShift() &&
390 isa<ConstantInt>(TrOp->getOperand(1))) { 351 isa<ConstantInt>(TrOp->getOperand(1))) {
391 // Okay, we'll do this xform. Make the shift of shift. 352 // Okay, we'll do this xform. Make the shift of shift.
392 Constant *ShAmt = ConstantExpr::getZExt(COp1, TrOp->getType()); 353 Constant *ShAmt =
354 ConstantExpr::getZExt(cast<Constant>(Op1), TrOp->getType());
393 // (shift2 (shift1 & 0x00FF), c2) 355 // (shift2 (shift1 & 0x00FF), c2)
394 Value *NSh = Builder->CreateBinOp(I.getOpcode(), TrOp, ShAmt,I.getName()); 356 Value *NSh = Builder.CreateBinOp(I.getOpcode(), TrOp, ShAmt, I.getName());
395 357
396 // For logical shifts, the truncation has the effect of making the high 358 // For logical shifts, the truncation has the effect of making the high
397 // part of the register be zeros. Emulate this by inserting an AND to 359 // part of the register be zeros. Emulate this by inserting an AND to
398 // clear the top bits as needed. This 'and' will usually be zapped by 360 // clear the top bits as needed. This 'and' will usually be zapped by
399 // other xforms later if dead. 361 // other xforms later if dead.
404 // The mask we constructed says what the trunc would do if occurring 366 // The mask we constructed says what the trunc would do if occurring
405 // between the shifts. We want to know the effect *after* the second 367 // between the shifts. We want to know the effect *after* the second
406 // shift. We know that it is a logical shift by a constant, so adjust the 368 // shift. We know that it is a logical shift by a constant, so adjust the
407 // mask as appropriate. 369 // mask as appropriate.
408 if (I.getOpcode() == Instruction::Shl) 370 if (I.getOpcode() == Instruction::Shl)
409 MaskV <<= COp1->getZExtValue(); 371 MaskV <<= Op1C->getZExtValue();
410 else { 372 else {
411 assert(I.getOpcode() == Instruction::LShr && "Unknown logical shift"); 373 assert(I.getOpcode() == Instruction::LShr && "Unknown logical shift");
412 MaskV = MaskV.lshr(COp1->getZExtValue()); 374 MaskV.lshrInPlace(Op1C->getZExtValue());
413 } 375 }
414 376
415 // shift1 & 0x00FF 377 // shift1 & 0x00FF
416 Value *And = Builder->CreateAnd(NSh, 378 Value *And = Builder.CreateAnd(NSh,
417 ConstantInt::get(I.getContext(), MaskV), 379 ConstantInt::get(I.getContext(), MaskV),
418 TI->getName()); 380 TI->getName());
419 381
420 // Return the value truncated to the interesting size. 382 // Return the value truncated to the interesting size.
421 return new TruncInst(And, I.getType()); 383 return new TruncInst(And, I.getType());
422 } 384 }
423 } 385 }
437 // Turn (Y + (X >> C)) << C -> (X + (Y << C)) & (~0 << C) 399 // Turn (Y + (X >> C)) << C -> (X + (Y << C)) & (~0 << C)
438 if (isLeftShift && Op0BO->getOperand(1)->hasOneUse() && 400 if (isLeftShift && Op0BO->getOperand(1)->hasOneUse() &&
439 match(Op0BO->getOperand(1), m_Shr(m_Value(V1), 401 match(Op0BO->getOperand(1), m_Shr(m_Value(V1),
440 m_Specific(Op1)))) { 402 m_Specific(Op1)))) {
441 Value *YS = // (Y << C) 403 Value *YS = // (Y << C)
442 Builder->CreateShl(Op0BO->getOperand(0), Op1, Op0BO->getName()); 404 Builder.CreateShl(Op0BO->getOperand(0), Op1, Op0BO->getName());
443 // (X + (Y << C)) 405 // (X + (Y << C))
444 Value *X = Builder->CreateBinOp(Op0BO->getOpcode(), YS, V1, 406 Value *X = Builder.CreateBinOp(Op0BO->getOpcode(), YS, V1,
445 Op0BO->getOperand(1)->getName()); 407 Op0BO->getOperand(1)->getName());
446 uint32_t Op1Val = COp1->getLimitedValue(TypeBits); 408 unsigned Op1Val = Op1C->getLimitedValue(TypeBits);
447 409
448 APInt Bits = APInt::getHighBitsSet(TypeBits, TypeBits - Op1Val); 410 APInt Bits = APInt::getHighBitsSet(TypeBits, TypeBits - Op1Val);
449 Constant *Mask = ConstantInt::get(I.getContext(), Bits); 411 Constant *Mask = ConstantInt::get(I.getContext(), Bits);
450 if (VectorType *VT = dyn_cast<VectorType>(X->getType())) 412 if (VectorType *VT = dyn_cast<VectorType>(X->getType()))
451 Mask = ConstantVector::getSplat(VT->getNumElements(), Mask); 413 Mask = ConstantVector::getSplat(VT->getNumElements(), Mask);
457 if (isLeftShift && Op0BOOp1->hasOneUse() && 419 if (isLeftShift && Op0BOOp1->hasOneUse() &&
458 match(Op0BOOp1, 420 match(Op0BOOp1,
459 m_And(m_OneUse(m_Shr(m_Value(V1), m_Specific(Op1))), 421 m_And(m_OneUse(m_Shr(m_Value(V1), m_Specific(Op1))),
460 m_ConstantInt(CC)))) { 422 m_ConstantInt(CC)))) {
461 Value *YS = // (Y << C) 423 Value *YS = // (Y << C)
462 Builder->CreateShl(Op0BO->getOperand(0), Op1, 424 Builder.CreateShl(Op0BO->getOperand(0), Op1, Op0BO->getName());
463 Op0BO->getName());
464 // X & (CC << C) 425 // X & (CC << C)
465 Value *XM = Builder->CreateAnd(V1, ConstantExpr::getShl(CC, Op1), 426 Value *XM = Builder.CreateAnd(V1, ConstantExpr::getShl(CC, Op1),
466 V1->getName()+".mask"); 427 V1->getName()+".mask");
467 return BinaryOperator::Create(Op0BO->getOpcode(), YS, XM); 428 return BinaryOperator::Create(Op0BO->getOpcode(), YS, XM);
468 } 429 }
469 LLVM_FALLTHROUGH; 430 LLVM_FALLTHROUGH;
470 } 431 }
471 432
473 // Turn ((X >> C) + Y) << C -> (X + (Y << C)) & (~0 << C) 434 // Turn ((X >> C) + Y) << C -> (X + (Y << C)) & (~0 << C)
474 if (isLeftShift && Op0BO->getOperand(0)->hasOneUse() && 435 if (isLeftShift && Op0BO->getOperand(0)->hasOneUse() &&
475 match(Op0BO->getOperand(0), m_Shr(m_Value(V1), 436 match(Op0BO->getOperand(0), m_Shr(m_Value(V1),
476 m_Specific(Op1)))) { 437 m_Specific(Op1)))) {
477 Value *YS = // (Y << C) 438 Value *YS = // (Y << C)
478 Builder->CreateShl(Op0BO->getOperand(1), Op1, Op0BO->getName()); 439 Builder.CreateShl(Op0BO->getOperand(1), Op1, Op0BO->getName());
479 // (X + (Y << C)) 440 // (X + (Y << C))
480 Value *X = Builder->CreateBinOp(Op0BO->getOpcode(), V1, YS, 441 Value *X = Builder.CreateBinOp(Op0BO->getOpcode(), V1, YS,
481 Op0BO->getOperand(0)->getName()); 442 Op0BO->getOperand(0)->getName());
482 uint32_t Op1Val = COp1->getLimitedValue(TypeBits); 443 unsigned Op1Val = Op1C->getLimitedValue(TypeBits);
483 444
484 APInt Bits = APInt::getHighBitsSet(TypeBits, TypeBits - Op1Val); 445 APInt Bits = APInt::getHighBitsSet(TypeBits, TypeBits - Op1Val);
485 Constant *Mask = ConstantInt::get(I.getContext(), Bits); 446 Constant *Mask = ConstantInt::get(I.getContext(), Bits);
486 if (VectorType *VT = dyn_cast<VectorType>(X->getType())) 447 if (VectorType *VT = dyn_cast<VectorType>(X->getType()))
487 Mask = ConstantVector::getSplat(VT->getNumElements(), Mask); 448 Mask = ConstantVector::getSplat(VT->getNumElements(), Mask);
492 if (isLeftShift && Op0BO->getOperand(0)->hasOneUse() && 453 if (isLeftShift && Op0BO->getOperand(0)->hasOneUse() &&
493 match(Op0BO->getOperand(0), 454 match(Op0BO->getOperand(0),
494 m_And(m_OneUse(m_Shr(m_Value(V1), m_Value(V2))), 455 m_And(m_OneUse(m_Shr(m_Value(V1), m_Value(V2))),
495 m_ConstantInt(CC))) && V2 == Op1) { 456 m_ConstantInt(CC))) && V2 == Op1) {
496 Value *YS = // (Y << C) 457 Value *YS = // (Y << C)
497 Builder->CreateShl(Op0BO->getOperand(1), Op1, Op0BO->getName()); 458 Builder.CreateShl(Op0BO->getOperand(1), Op1, Op0BO->getName());
498 // X & (CC << C) 459 // X & (CC << C)
499 Value *XM = Builder->CreateAnd(V1, ConstantExpr::getShl(CC, Op1), 460 Value *XM = Builder.CreateAnd(V1, ConstantExpr::getShl(CC, Op1),
500 V1->getName()+".mask"); 461 V1->getName()+".mask");
501 462
502 return BinaryOperator::Create(Op0BO->getOpcode(), XM, YS); 463 return BinaryOperator::Create(Op0BO->getOpcode(), XM, YS);
503 } 464 }
504 465
505 break; 466 break;
507 } 468 }
508 469
509 470
510 // If the operand is a bitwise operator with a constant RHS, and the 471 // If the operand is a bitwise operator with a constant RHS, and the
511 // shift is the only use, we can pull it out of the shift. 472 // shift is the only use, we can pull it out of the shift.
512 if (ConstantInt *Op0C = dyn_cast<ConstantInt>(Op0BO->getOperand(1))) { 473 const APInt *Op0C;
474 if (match(Op0BO->getOperand(1), m_APInt(Op0C))) {
513 bool isValid = true; // Valid only for And, Or, Xor 475 bool isValid = true; // Valid only for And, Or, Xor
514 bool highBitSet = false; // Transform if high bit of constant set? 476 bool highBitSet = false; // Transform if high bit of constant set?
515 477
516 switch (Op0BO->getOpcode()) { 478 switch (Op0BO->getOpcode()) {
517 default: isValid = false; break; // Do not perform transform! 479 default: isValid = false; break; // Do not perform transform!
532 // The highBitSet boolean indicates the value of the high bit of 494 // The highBitSet boolean indicates the value of the high bit of
533 // the constant which would cause it to be modified for this 495 // the constant which would cause it to be modified for this
534 // operation. 496 // operation.
535 // 497 //
536 if (isValid && I.getOpcode() == Instruction::AShr) 498 if (isValid && I.getOpcode() == Instruction::AShr)
537 isValid = Op0C->getValue()[TypeBits-1] == highBitSet; 499 isValid = Op0C->isNegative() == highBitSet;
538 500
539 if (isValid) { 501 if (isValid) {
540 Constant *NewRHS = ConstantExpr::get(I.getOpcode(), Op0C, Op1); 502 Constant *NewRHS = ConstantExpr::get(I.getOpcode(),
503 cast<Constant>(Op0BO->getOperand(1)), Op1);
541 504
542 Value *NewShift = 505 Value *NewShift =
543 Builder->CreateBinOp(I.getOpcode(), Op0BO->getOperand(0), Op1); 506 Builder.CreateBinOp(I.getOpcode(), Op0BO->getOperand(0), Op1);
544 NewShift->takeName(Op0BO); 507 NewShift->takeName(Op0BO);
545 508
546 return BinaryOperator::Create(Op0BO->getOpcode(), NewShift, 509 return BinaryOperator::Create(Op0BO->getOpcode(), NewShift,
547 NewRHS); 510 NewRHS);
548 } 511 }
549 } 512 }
550 } 513
551 } 514 // If the operand is a subtract with a constant LHS, and the shift
552 515 // is the only use, we can pull it out of the shift.
553 // Find out if this is a shift of a shift by a constant. 516 // This folds (shl (sub C1, X), C2) -> (sub (C1 << C2), (shl X, C2))
554 BinaryOperator *ShiftOp = dyn_cast<BinaryOperator>(Op0); 517 if (isLeftShift && Op0BO->getOpcode() == Instruction::Sub &&
555 if (ShiftOp && !ShiftOp->isShift()) 518 match(Op0BO->getOperand(0), m_APInt(Op0C))) {
556 ShiftOp = nullptr; 519 Constant *NewRHS = ConstantExpr::get(I.getOpcode(),
557 520 cast<Constant>(Op0BO->getOperand(0)), Op1);
558 if (ShiftOp && isa<ConstantInt>(ShiftOp->getOperand(1))) { 521
559 522 Value *NewShift = Builder.CreateShl(Op0BO->getOperand(1), Op1);
560 // This is a constant shift of a constant shift. Be careful about hiding 523 NewShift->takeName(Op0BO);
561 // shl instructions behind bit masks. They are used to represent multiplies 524
562 // by a constant, and it is important that simple arithmetic expressions 525 return BinaryOperator::CreateSub(NewRHS, NewShift);
563 // are still recognizable by scalar evolution. 526 }
564 // 527 }
565 // The transforms applied to shl are very similar to the transforms applied 528 }
566 // to mul by constant. We can be more aggressive about optimizing right 529
567 // shifts. 530 return nullptr;
568 // 531 }
569 // Combinations of right and left shifts will still be optimized in 532
570 // DAGCombine where scalar evolution no longer applies. 533 Instruction *InstCombiner::visitShl(BinaryOperator &I) {
571 534 if (Value *V = SimplifyVectorOp(I))
572 ConstantInt *ShiftAmt1C = cast<ConstantInt>(ShiftOp->getOperand(1)); 535 return replaceInstUsesWith(I, V);
573 uint32_t ShiftAmt1 = ShiftAmt1C->getLimitedValue(TypeBits); 536
574 uint32_t ShiftAmt2 = COp1->getLimitedValue(TypeBits); 537 Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
575 assert(ShiftAmt2 != 0 && "Should have been simplified earlier"); 538 if (Value *V =
576 if (ShiftAmt1 == 0) return nullptr; // Will be simplified in the future. 539 SimplifyShlInst(Op0, Op1, I.hasNoSignedWrap(), I.hasNoUnsignedWrap(),
577 Value *X = ShiftOp->getOperand(0); 540 SQ.getWithInstruction(&I)))
578 541 return replaceInstUsesWith(I, V);
579 IntegerType *Ty = cast<IntegerType>(I.getType()); 542
580 543 if (Instruction *V = commonShiftTransforms(I))
581 // Check for (X << c1) << c2 and (X >> c1) >> c2 544 return V;
582 if (I.getOpcode() == ShiftOp->getOpcode()) { 545
583 uint32_t AmtSum = ShiftAmt1+ShiftAmt2; // Fold into one big shift. 546 const APInt *ShAmtAPInt;
584 // If this is oversized composite shift, then unsigned shifts get 0, ashr 547 if (match(Op1, m_APInt(ShAmtAPInt))) {
585 // saturates. 548 unsigned ShAmt = ShAmtAPInt->getZExtValue();
586 if (AmtSum >= TypeBits) { 549 unsigned BitWidth = I.getType()->getScalarSizeInBits();
587 if (I.getOpcode() != Instruction::AShr) 550 Type *Ty = I.getType();
588 return replaceInstUsesWith(I, Constant::getNullValue(I.getType())); 551
589 AmtSum = TypeBits-1; // Saturate to 31 for i32 ashr. 552 // shl (zext X), ShAmt --> zext (shl X, ShAmt)
590 } 553 // This is only valid if X would have zeros shifted out.
591 554 Value *X;
592 return BinaryOperator::Create(I.getOpcode(), X, 555 if (match(Op0, m_ZExt(m_Value(X)))) {
593 ConstantInt::get(Ty, AmtSum)); 556 unsigned SrcWidth = X->getType()->getScalarSizeInBits();
594 } 557 if (ShAmt < SrcWidth &&
595 558 MaskedValueIsZero(X, APInt::getHighBitsSet(SrcWidth, ShAmt), 0, &I))
596 if (ShiftAmt1 == ShiftAmt2) { 559 return new ZExtInst(Builder.CreateShl(X, ShAmt), Ty);
597 // If we have ((X << C) >>u C), turn this into X & (-1 >>u C). 560 }
598 if (I.getOpcode() == Instruction::LShr && 561
599 ShiftOp->getOpcode() == Instruction::Shl) { 562 // (X >> C) << C --> X & (-1 << C)
600 APInt Mask(APInt::getLowBitsSet(TypeBits, TypeBits - ShiftAmt1)); 563 if (match(Op0, m_Shr(m_Value(X), m_Specific(Op1)))) {
601 return BinaryOperator::CreateAnd(X, 564 APInt Mask(APInt::getHighBitsSet(BitWidth, BitWidth - ShAmt));
602 ConstantInt::get(I.getContext(), Mask)); 565 return BinaryOperator::CreateAnd(X, ConstantInt::get(Ty, Mask));
603 } 566 }
604 } else if (ShiftAmt1 < ShiftAmt2) { 567
605 uint32_t ShiftDiff = ShiftAmt2-ShiftAmt1; 568 // Be careful about hiding shl instructions behind bit masks. They are used
606 569 // to represent multiplies by a constant, and it is important that simple
607 // (X >>?,exact C1) << C2 --> X << (C2-C1) 570 // arithmetic expressions are still recognizable by scalar evolution.
608 // The inexact version is deferred to DAGCombine so we don't hide shl 571 // The inexact versions are deferred to DAGCombine, so we don't hide shl
609 // behind a bit mask. 572 // behind a bit mask.
610 if (I.getOpcode() == Instruction::Shl && 573 const APInt *ShOp1;
611 ShiftOp->getOpcode() != Instruction::Shl && 574 if (match(Op0, m_Exact(m_Shr(m_Value(X), m_APInt(ShOp1))))) {
612 ShiftOp->isExact()) { 575 unsigned ShrAmt = ShOp1->getZExtValue();
613 assert(ShiftOp->getOpcode() == Instruction::LShr || 576 if (ShrAmt < ShAmt) {
614 ShiftOp->getOpcode() == Instruction::AShr); 577 // If C1 < C2: (X >>?,exact C1) << C2 --> X << (C2 - C1)
615 ConstantInt *ShiftDiffCst = ConstantInt::get(Ty, ShiftDiff); 578 Constant *ShiftDiff = ConstantInt::get(Ty, ShAmt - ShrAmt);
616 BinaryOperator *NewShl = BinaryOperator::Create(Instruction::Shl, 579 auto *NewShl = BinaryOperator::CreateShl(X, ShiftDiff);
617 X, ShiftDiffCst);
618 NewShl->setHasNoUnsignedWrap(I.hasNoUnsignedWrap()); 580 NewShl->setHasNoUnsignedWrap(I.hasNoUnsignedWrap());
619 NewShl->setHasNoSignedWrap(I.hasNoSignedWrap()); 581 NewShl->setHasNoSignedWrap(I.hasNoSignedWrap());
620 return NewShl; 582 return NewShl;
621 } 583 }
622 584 if (ShrAmt > ShAmt) {
623 // (X << C1) >>u C2 --> X >>u (C2-C1) & (-1 >> C2) 585 // If C1 > C2: (X >>?exact C1) << C2 --> X >>?exact (C1 - C2)
624 if (I.getOpcode() == Instruction::LShr && 586 Constant *ShiftDiff = ConstantInt::get(Ty, ShrAmt - ShAmt);
625 ShiftOp->getOpcode() == Instruction::Shl) { 587 auto *NewShr = BinaryOperator::Create(
626 ConstantInt *ShiftDiffCst = ConstantInt::get(Ty, ShiftDiff); 588 cast<BinaryOperator>(Op0)->getOpcode(), X, ShiftDiff);
627 // (X <<nuw C1) >>u C2 --> X >>u (C2-C1) 589 NewShr->setIsExact(true);
628 if (ShiftOp->hasNoUnsignedWrap()) { 590 return NewShr;
629 BinaryOperator *NewLShr = BinaryOperator::Create(Instruction::LShr, 591 }
630 X, ShiftDiffCst); 592 }
593
594 if (match(Op0, m_Shl(m_Value(X), m_APInt(ShOp1)))) {
595 unsigned AmtSum = ShAmt + ShOp1->getZExtValue();
596 // Oversized shifts are simplified to zero in InstSimplify.
597 if (AmtSum < BitWidth)
598 // (X << C1) << C2 --> X << (C1 + C2)
599 return BinaryOperator::CreateShl(X, ConstantInt::get(Ty, AmtSum));
600 }
601
602 // If the shifted-out value is known-zero, then this is a NUW shift.
603 if (!I.hasNoUnsignedWrap() &&
604 MaskedValueIsZero(Op0, APInt::getHighBitsSet(BitWidth, ShAmt), 0, &I)) {
605 I.setHasNoUnsignedWrap();
606 return &I;
607 }
608
609 // If the shifted-out value is all signbits, then this is a NSW shift.
610 if (!I.hasNoSignedWrap() && ComputeNumSignBits(Op0, 0, &I) > ShAmt) {
611 I.setHasNoSignedWrap();
612 return &I;
613 }
614 }
615
616 Constant *C1;
617 if (match(Op1, m_Constant(C1))) {
618 Constant *C2;
619 Value *X;
620 // (C2 << X) << C1 --> (C2 << C1) << X
621 if (match(Op0, m_OneUse(m_Shl(m_Constant(C2), m_Value(X)))))
622 return BinaryOperator::CreateShl(ConstantExpr::getShl(C2, C1), X);
623
624 // (X * C2) << C1 --> X * (C2 << C1)
625 if (match(Op0, m_Mul(m_Value(X), m_Constant(C2))))
626 return BinaryOperator::CreateMul(X, ConstantExpr::getShl(C2, C1));
627 }
628
629 return nullptr;
630 }
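
Two small examples of the constant-shift folds in the new visitShl() (illustrative names; results in comments are the expected instcombine output):

  ; (X * C2) << C1 --> X * (C2 << C1)
  define i32 @mul_then_shl(i32 %x) {
    %m = mul i32 %x, 3
    %r = shl i32 %m, 4               ; expected: mul i32 %x, 48
    ret i32 %r
  }

  ; (X >> C) << C --> X & (-1 << C)
  define i32 @shr_then_shl(i32 %x) {
    %s = lshr i32 %x, 6
    %r = shl i32 %s, 6               ; expected: and i32 %x, -64
    ret i32 %r
  }
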
631
632 Instruction *InstCombiner::visitLShr(BinaryOperator &I) {
633 if (Value *V = SimplifyVectorOp(I))
634 return replaceInstUsesWith(I, V);
635
636 Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
637 if (Value *V =
638 SimplifyLShrInst(Op0, Op1, I.isExact(), SQ.getWithInstruction(&I)))
639 return replaceInstUsesWith(I, V);
640
641 if (Instruction *R = commonShiftTransforms(I))
642 return R;
643
644 Type *Ty = I.getType();
645 const APInt *ShAmtAPInt;
646 if (match(Op1, m_APInt(ShAmtAPInt))) {
647 unsigned ShAmt = ShAmtAPInt->getZExtValue();
648 unsigned BitWidth = Ty->getScalarSizeInBits();
649 auto *II = dyn_cast<IntrinsicInst>(Op0);
650 if (II && isPowerOf2_32(BitWidth) && Log2_32(BitWidth) == ShAmt &&
651 (II->getIntrinsicID() == Intrinsic::ctlz ||
652 II->getIntrinsicID() == Intrinsic::cttz ||
653 II->getIntrinsicID() == Intrinsic::ctpop)) {
654 // ctlz.i32(x)>>5 --> zext(x == 0)
655 // cttz.i32(x)>>5 --> zext(x == 0)
656 // ctpop.i32(x)>>5 --> zext(x == -1)
657 bool IsPop = II->getIntrinsicID() == Intrinsic::ctpop;
658 Constant *RHS = ConstantInt::getSigned(Ty, IsPop ? -1 : 0);
659 Value *Cmp = Builder.CreateICmpEQ(II->getArgOperand(0), RHS);
660 return new ZExtInst(Cmp, Ty);
661 }
662
663 Value *X;
664 const APInt *ShOp1;
665 if (match(Op0, m_Shl(m_Value(X), m_APInt(ShOp1)))) {
666 unsigned ShlAmt = ShOp1->getZExtValue();
667 if (ShlAmt < ShAmt) {
668 Constant *ShiftDiff = ConstantInt::get(Ty, ShAmt - ShlAmt);
669 if (cast<BinaryOperator>(Op0)->hasNoUnsignedWrap()) {
670 // (X <<nuw C1) >>u C2 --> X >>u (C2 - C1)
671 auto *NewLShr = BinaryOperator::CreateLShr(X, ShiftDiff);
631 NewLShr->setIsExact(I.isExact()); 672 NewLShr->setIsExact(I.isExact());
632 return NewLShr; 673 return NewLShr;
633 } 674 }
634 Value *Shift = Builder->CreateLShr(X, ShiftDiffCst); 675 // (X << C1) >>u C2 --> (X >>u (C2 - C1)) & (-1 >> C2)
635 676 Value *NewLShr = Builder.CreateLShr(X, ShiftDiff, "", I.isExact());
636 APInt Mask(APInt::getLowBitsSet(TypeBits, TypeBits - ShiftAmt2)); 677 APInt Mask(APInt::getLowBitsSet(BitWidth, BitWidth - ShAmt));
637 return BinaryOperator::CreateAnd(Shift, 678 return BinaryOperator::CreateAnd(NewLShr, ConstantInt::get(Ty, Mask));
638 ConstantInt::get(I.getContext(),Mask)); 679 }
639 } 680 if (ShlAmt > ShAmt) {
640 681 Constant *ShiftDiff = ConstantInt::get(Ty, ShlAmt - ShAmt);
641 // We can't handle (X << C1) >>s C2, it shifts arbitrary bits in. However, 682 if (cast<BinaryOperator>(Op0)->hasNoUnsignedWrap()) {
642 // we can handle (X <<nsw C1) >>s C2 since it only shifts in sign bits. 683 // (X <<nuw C1) >>u C2 --> X <<nuw (C1 - C2)
643 if (I.getOpcode() == Instruction::AShr && 684 auto *NewShl = BinaryOperator::CreateShl(X, ShiftDiff);
644 ShiftOp->getOpcode() == Instruction::Shl) {
645 if (ShiftOp->hasNoSignedWrap()) {
646 // (X <<nsw C1) >>s C2 --> X >>s (C2-C1)
647 ConstantInt *ShiftDiffCst = ConstantInt::get(Ty, ShiftDiff);
648 BinaryOperator *NewAShr = BinaryOperator::Create(Instruction::AShr,
649 X, ShiftDiffCst);
650 NewAShr->setIsExact(I.isExact());
651 return NewAShr;
652 }
653 }
654 } else {
655 assert(ShiftAmt2 < ShiftAmt1);
656 uint32_t ShiftDiff = ShiftAmt1-ShiftAmt2;
657
658 // (X >>?exact C1) << C2 --> X >>?exact (C1-C2)
659 // The inexact version is deferred to DAGCombine so we don't hide shl
660 // behind a bit mask.
661 if (I.getOpcode() == Instruction::Shl &&
662 ShiftOp->getOpcode() != Instruction::Shl &&
663 ShiftOp->isExact()) {
664 ConstantInt *ShiftDiffCst = ConstantInt::get(Ty, ShiftDiff);
665 BinaryOperator *NewShr = BinaryOperator::Create(ShiftOp->getOpcode(),
666 X, ShiftDiffCst);
667 NewShr->setIsExact(true);
668 return NewShr;
669 }
670
671 // (X << C1) >>u C2 --> X << (C1-C2) & (-1 >> C2)
672 if (I.getOpcode() == Instruction::LShr &&
673 ShiftOp->getOpcode() == Instruction::Shl) {
674 ConstantInt *ShiftDiffCst = ConstantInt::get(Ty, ShiftDiff);
675 if (ShiftOp->hasNoUnsignedWrap()) {
676 // (X <<nuw C1) >>u C2 --> X <<nuw (C1-C2)
677 BinaryOperator *NewShl = BinaryOperator::Create(Instruction::Shl,
678 X, ShiftDiffCst);
679 NewShl->setHasNoUnsignedWrap(true); 685 NewShl->setHasNoUnsignedWrap(true);
680 return NewShl; 686 return NewShl;
681 } 687 }
682 Value *Shift = Builder->CreateShl(X, ShiftDiffCst); 688 // (X << C1) >>u C2 --> X << (C1 - C2) & (-1 >> C2)
683 689 Value *NewShl = Builder.CreateShl(X, ShiftDiff);
684 APInt Mask(APInt::getLowBitsSet(TypeBits, TypeBits - ShiftAmt2)); 690 APInt Mask(APInt::getLowBitsSet(BitWidth, BitWidth - ShAmt));
685 return BinaryOperator::CreateAnd(Shift, 691 return BinaryOperator::CreateAnd(NewShl, ConstantInt::get(Ty, Mask));
686 ConstantInt::get(I.getContext(),Mask)); 692 }
687 } 693 assert(ShlAmt == ShAmt);
688 694 // (X << C) >>u C --> X & (-1 >>u C)
689 // We can't handle (X << C1) >>s C2, it shifts arbitrary bits in. However, 695 APInt Mask(APInt::getLowBitsSet(BitWidth, BitWidth - ShAmt));
690 // we can handle (X <<nsw C1) >>s C2 since it only shifts in sign bits. 696 return BinaryOperator::CreateAnd(X, ConstantInt::get(Ty, Mask));
691 if (I.getOpcode() == Instruction::AShr && 697 }
692 ShiftOp->getOpcode() == Instruction::Shl) { 698
693 if (ShiftOp->hasNoSignedWrap()) { 699 if (match(Op0, m_OneUse(m_ZExt(m_Value(X)))) &&
694 // (X <<nsw C1) >>s C2 --> X <<nsw (C1-C2) 700 (!Ty->isIntegerTy() || shouldChangeType(Ty, X->getType()))) {
695 ConstantInt *ShiftDiffCst = ConstantInt::get(Ty, ShiftDiff); 701 assert(ShAmt < X->getType()->getScalarSizeInBits() &&
696 BinaryOperator *NewShl = BinaryOperator::Create(Instruction::Shl, 702 "Big shift not simplified to zero?");
697 X, ShiftDiffCst); 703 // lshr (zext iM X to iN), C --> zext (lshr X, C) to iN
698 NewShl->setHasNoSignedWrap(true); 704 Value *NewLShr = Builder.CreateLShr(X, ShAmt);
699 return NewShl; 705 return new ZExtInst(NewLShr, Ty);
706 }
707
708 if (match(Op0, m_SExt(m_Value(X))) &&
709 (!Ty->isIntegerTy() || shouldChangeType(Ty, X->getType()))) {
710 // Are we moving the sign bit to the low bit and widening with high zeros?
711 unsigned SrcTyBitWidth = X->getType()->getScalarSizeInBits();
712 if (ShAmt == BitWidth - 1) {
713 // lshr (sext i1 X to iN), N-1 --> zext X to iN
714 if (SrcTyBitWidth == 1)
715 return new ZExtInst(X, Ty);
716
717 // lshr (sext iM X to iN), N-1 --> zext (lshr X, M-1) to iN
718 if (Op0->hasOneUse()) {
719 Value *NewLShr = Builder.CreateLShr(X, SrcTyBitWidth - 1);
720 return new ZExtInst(NewLShr, Ty);
700 } 721 }
701 } 722 }
702 } 723
703 } 724 // lshr (sext iM X to iN), N-M --> zext (ashr X, min(N-M, M-1)) to iN
704 return nullptr; 725 if (ShAmt == BitWidth - SrcTyBitWidth && Op0->hasOneUse()) {
705 } 726 // The new shift amount can't be more than the narrow source type.
706 727 unsigned NewShAmt = std::min(ShAmt, SrcTyBitWidth - 1);
707 Instruction *InstCombiner::visitShl(BinaryOperator &I) { 728 Value *AShr = Builder.CreateAShr(X, NewShAmt);
708 if (Value *V = SimplifyVectorOp(I)) 729 return new ZExtInst(AShr, Ty);
709 return replaceInstUsesWith(I, V); 730 }
710 731 }
711 if (Value *V = 732
712 SimplifyShlInst(I.getOperand(0), I.getOperand(1), I.hasNoSignedWrap(), 733 if (match(Op0, m_LShr(m_Value(X), m_APInt(ShOp1)))) {
713 I.hasNoUnsignedWrap(), DL, &TLI, &DT, &AC)) 734 unsigned AmtSum = ShAmt + ShOp1->getZExtValue();
714 return replaceInstUsesWith(I, V); 735 // Oversized shifts are simplified to zero in InstSimplify.
715 736 if (AmtSum < BitWidth)
716 if (Instruction *V = commonShiftTransforms(I)) 737 // (X >>u C1) >>u C2 --> X >>u (C1 + C2)
717 return V; 738 return BinaryOperator::CreateLShr(X, ConstantInt::get(Ty, AmtSum));
718
719 if (ConstantInt *Op1C = dyn_cast<ConstantInt>(I.getOperand(1))) {
720 unsigned ShAmt = Op1C->getZExtValue();
721
722 // If the shifted-out value is known-zero, then this is a NUW shift.
723 if (!I.hasNoUnsignedWrap() &&
724 MaskedValueIsZero(I.getOperand(0),
725 APInt::getHighBitsSet(Op1C->getBitWidth(), ShAmt), 0,
726 &I)) {
727 I.setHasNoUnsignedWrap();
728 return &I;
729 }
730
731 // If the shifted out value is all signbits, this is a NSW shift.
732 if (!I.hasNoSignedWrap() &&
733 ComputeNumSignBits(I.getOperand(0), 0, &I) > ShAmt) {
734 I.setHasNoSignedWrap();
735 return &I;
736 }
737 }
738
739 // (C1 << A) << C2 -> (C1 << C2) << A
740 Constant *C1, *C2;
741 Value *A;
742 if (match(I.getOperand(0), m_OneUse(m_Shl(m_Constant(C1), m_Value(A)))) &&
743 match(I.getOperand(1), m_Constant(C2)))
744 return BinaryOperator::CreateShl(ConstantExpr::getShl(C1, C2), A);
745
746 return nullptr;
747 }
748
749 Instruction *InstCombiner::visitLShr(BinaryOperator &I) {
750 if (Value *V = SimplifyVectorOp(I))
751 return replaceInstUsesWith(I, V);
752
753 if (Value *V = SimplifyLShrInst(I.getOperand(0), I.getOperand(1), I.isExact(),
754 DL, &TLI, &DT, &AC))
755 return replaceInstUsesWith(I, V);
756
757 if (Instruction *R = commonShiftTransforms(I))
758 return R;
759
760 Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
761
762 if (ConstantInt *Op1C = dyn_cast<ConstantInt>(Op1)) {
763 unsigned ShAmt = Op1C->getZExtValue();
764
765 if (IntrinsicInst *II = dyn_cast<IntrinsicInst>(Op0)) {
766 unsigned BitWidth = Op0->getType()->getScalarSizeInBits();
767 // ctlz.i32(x)>>5 --> zext(x == 0)
768 // cttz.i32(x)>>5 --> zext(x == 0)
769 // ctpop.i32(x)>>5 --> zext(x == -1)
770 if ((II->getIntrinsicID() == Intrinsic::ctlz ||
771 II->getIntrinsicID() == Intrinsic::cttz ||
772 II->getIntrinsicID() == Intrinsic::ctpop) &&
773 isPowerOf2_32(BitWidth) && Log2_32(BitWidth) == ShAmt) {
774 bool isCtPop = II->getIntrinsicID() == Intrinsic::ctpop;
775 Constant *RHS = ConstantInt::getSigned(Op0->getType(), isCtPop ? -1:0);
776 Value *Cmp = Builder->CreateICmpEQ(II->getArgOperand(0), RHS);
777 return new ZExtInst(Cmp, II->getType());
778 }
779 } 739 }
780 740
781 // If the shifted-out value is known-zero, then this is an exact shift. 741 // If the shifted-out value is known-zero, then this is an exact shift.
782 if (!I.isExact() && 742 if (!I.isExact() &&
783 MaskedValueIsZero(Op0, APInt::getLowBitsSet(Op1C->getBitWidth(), ShAmt), 743 MaskedValueIsZero(Op0, APInt::getLowBitsSet(BitWidth, ShAmt), 0, &I)) {
784 0, &I)){
785 I.setIsExact(); 744 I.setIsExact();
786 return &I; 745 return &I;
787 } 746 }
788 } 747 }
789
790 return nullptr; 748 return nullptr;
791 } 749 }
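
A sketch of the bit-counting fold in the new visitLShr() (illustrative function name; the intrinsic declaration is the standard one):

  declare i32 @llvm.ctlz.i32(i32, i1)

  ; ctlz.i32(x) >> 5 --> zext(x == 0)
  define i32 @is_zero(i32 %x) {
    %c = call i32 @llvm.ctlz.i32(i32 %x, i1 false)
    %r = lshr i32 %c, 5              ; expected: zext (icmp eq i32 %x, 0) to i32
    ret i32 %r
  }
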
792 750
793 Instruction *InstCombiner::visitAShr(BinaryOperator &I) { 751 Instruction *InstCombiner::visitAShr(BinaryOperator &I) {
794 if (Value *V = SimplifyVectorOp(I)) 752 if (Value *V = SimplifyVectorOp(I))
795 return replaceInstUsesWith(I, V); 753 return replaceInstUsesWith(I, V);
796 754
797 if (Value *V = SimplifyAShrInst(I.getOperand(0), I.getOperand(1), I.isExact(), 755 Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
798 DL, &TLI, &DT, &AC)) 756 if (Value *V =
757 SimplifyAShrInst(Op0, Op1, I.isExact(), SQ.getWithInstruction(&I)))
799 return replaceInstUsesWith(I, V); 758 return replaceInstUsesWith(I, V);
800 759
801 if (Instruction *R = commonShiftTransforms(I)) 760 if (Instruction *R = commonShiftTransforms(I))
802 return R; 761 return R;
803 762
804 Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1); 763 Type *Ty = I.getType();
805 764 unsigned BitWidth = Ty->getScalarSizeInBits();
806 if (ConstantInt *Op1C = dyn_cast<ConstantInt>(Op1)) { 765 const APInt *ShAmtAPInt;
807 unsigned ShAmt = Op1C->getZExtValue(); 766 if (match(Op1, m_APInt(ShAmtAPInt))) {
808 767 unsigned ShAmt = ShAmtAPInt->getZExtValue();
809 // If the input is a SHL by the same constant (ashr (shl X, C), C), then we 768
810 // have a sign-extend idiom. 769 // If the shift amount equals the difference in width of the destination
770 // and source scalar types:
771 // ashr (shl (zext X), C), C --> sext X
811 Value *X; 772 Value *X;
812 if (match(Op0, m_Shl(m_Value(X), m_Specific(Op1)))) { 773 if (match(Op0, m_Shl(m_ZExt(m_Value(X)), m_Specific(Op1))) &&
813 // If the input is an extension from the shifted amount value, e.g. 774 ShAmt == BitWidth - X->getType()->getScalarSizeInBits())
814 // %x = zext i8 %A to i32 775 return new SExtInst(X, Ty);
815 // %y = shl i32 %x, 24 776
816 // %z = ashr %y, 24 777 // We can't handle (X << C1) >>s C2. It shifts arbitrary bits in. However,
817 // then turn this into "z = sext i8 A to i32". 778 // we can handle (X <<nsw C1) >>s C2 since it only shifts in sign bits.
818 if (ZExtInst *ZI = dyn_cast<ZExtInst>(X)) { 779 const APInt *ShOp1;
819 uint32_t SrcBits = ZI->getOperand(0)->getType()->getScalarSizeInBits(); 780 if (match(Op0, m_NSWShl(m_Value(X), m_APInt(ShOp1)))) {
820 uint32_t DestBits = ZI->getType()->getScalarSizeInBits(); 781 unsigned ShlAmt = ShOp1->getZExtValue();
821 if (Op1C->getZExtValue() == DestBits-SrcBits) 782 if (ShlAmt < ShAmt) {
822 return new SExtInst(ZI->getOperand(0), ZI->getType()); 783 // (X <<nsw C1) >>s C2 --> X >>s (C2 - C1)
823 } 784 Constant *ShiftDiff = ConstantInt::get(Ty, ShAmt - ShlAmt);
785 auto *NewAShr = BinaryOperator::CreateAShr(X, ShiftDiff);
786 NewAShr->setIsExact(I.isExact());
787 return NewAShr;
788 }
789 if (ShlAmt > ShAmt) {
790 // (X <<nsw C1) >>s C2 --> X <<nsw (C1 - C2)
791 Constant *ShiftDiff = ConstantInt::get(Ty, ShlAmt - ShAmt);
792 auto *NewShl = BinaryOperator::Create(Instruction::Shl, X, ShiftDiff);
793 NewShl->setHasNoSignedWrap(true);
794 return NewShl;
795 }
796 }
797
798 if (match(Op0, m_AShr(m_Value(X), m_APInt(ShOp1)))) {
799 unsigned AmtSum = ShAmt + ShOp1->getZExtValue();
800 // Oversized arithmetic shifts replicate the sign bit.
801 AmtSum = std::min(AmtSum, BitWidth - 1);
802 // (X >>s C1) >>s C2 --> X >>s (C1 + C2)
803 return BinaryOperator::CreateAShr(X, ConstantInt::get(Ty, AmtSum));
804 }
805
806 if (match(Op0, m_OneUse(m_SExt(m_Value(X)))) &&
807 (Ty->isVectorTy() || shouldChangeType(Ty, X->getType()))) {
808 // ashr (sext X), C --> sext (ashr X, C')
809 Type *SrcTy = X->getType();
810 ShAmt = std::min(ShAmt, SrcTy->getScalarSizeInBits() - 1);
811 Value *NewSh = Builder.CreateAShr(X, ConstantInt::get(SrcTy, ShAmt));
812 return new SExtInst(NewSh, Ty);
824 } 813 }
825 814
826 // If the shifted-out value is known-zero, then this is an exact shift. 815 // If the shifted-out value is known-zero, then this is an exact shift.
827 if (!I.isExact() && 816 if (!I.isExact() &&
828 MaskedValueIsZero(Op0, APInt::getLowBitsSet(Op1C->getBitWidth(), ShAmt), 817 MaskedValueIsZero(Op0, APInt::getLowBitsSet(BitWidth, ShAmt), 0, &I)) {
829 0, &I)) {
830 I.setIsExact(); 818 I.setIsExact();
831 return &I; 819 return &I;
832 } 820 }
833 } 821 }
834 822
835 // See if we can turn a signed shr into an unsigned shr. 823 // See if we can turn a signed shr into an unsigned shr.
836 if (MaskedValueIsZero(Op0, 824 if (MaskedValueIsZero(Op0, APInt::getSignMask(BitWidth), 0, &I))
837 APInt::getSignBit(I.getType()->getScalarSizeInBits()),
838 0, &I))
839 return BinaryOperator::CreateLShr(Op0, Op1); 825 return BinaryOperator::CreateLShr(Op0, Op1);
840 826
841 return nullptr; 827 return nullptr;
842 } 828 }
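
Two closing examples for visitAShr() (illustrative names; rewrites shown in comments are the expected results):

  ; ashr (shl (zext X), C), C --> sext X, when C equals the width difference
  define i32 @sext_idiom(i8 %x) {
    %z = zext i8 %x to i32
    %s = shl i32 %z, 24
    %r = ashr i32 %s, 24             ; expected: sext i8 %x to i32
    ret i32 %r
  }

  ; an ashr of a value whose sign bit is known zero becomes an lshr
  define i32 @ashr_to_lshr(i32 %x) {
    %p = lshr i32 %x, 1              ; sign bit of %p is known zero
    %r = ashr i32 %p, 3              ; expected: lshr, which then folds to lshr i32 %x, 4
    ret i32 %r
  }
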