LLVM: lib/Transforms/InstCombine/InstCombineCompares.cpp Source File

//===- InstCombineCompares.cpp --------------------------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file implements the visitICmp and visitFCmp functions.

//

//===----------------------------------------------------------------------===//


#include "InstCombineInternal.h"

#include "llvm/ADT/APFloat.h"

#include "llvm/ADT/APSInt.h"

#include "llvm/ADT/SetVector.h"

#include "llvm/ADT/Statistic.h"

#include "llvm/Analysis/CaptureTracking.h"

#include "llvm/Analysis/CmpInstAnalysis.h"

#include "llvm/Analysis/ConstantFolding.h"

#include "llvm/Analysis/InstructionSimplify.h"

#include "llvm/Analysis/Loads.h"

#include "llvm/Analysis/Utils/Local.h"

#include "llvm/Analysis/VectorUtils.h"

#include "llvm/IR/ConstantRange.h"

#include "llvm/IR/Constants.h"

#include "llvm/IR/DataLayout.h"

#include "llvm/IR/InstrTypes.h"

#include "llvm/IR/Instructions.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/PatternMatch.h"

#include "llvm/Support/KnownBits.h"

#include "llvm/Transforms/InstCombine/InstCombiner.h"

#include <bitset>


using namespace llvm;

using namespace PatternMatch;


#define DEBUG_TYPE "instcombine"


// How many times is a select replaced by one of its operands?

STATISTIC(NumSel, "Number of select opts");


/// Compute Result = In1+In2, returning true if the result overflowed for this

/// type.


static bool addWithOverflow(APInt &Result, const APInt &In1, const APInt &In2,

                            bool IsSigned = false) {

  bool Overflow;

  if (IsSigned)

    Result = In1.sadd_ov(In2, Overflow);

  else

    Result = In1.uadd_ov(In2, Overflow);


  return Overflow;

}


/// Compute Result = In1-In2, returning true if the result overflowed for this

/// type.


static bool subWithOverflow(APInt &Result, const APInt &In1, const APInt &In2,

                            bool IsSigned = false) {

  bool Overflow;

  if (IsSigned)

    Result = In1.ssub_ov(In2, Overflow);

  else

    Result = In1.usub_ov(In2, Overflow);


  return Overflow;

}


/// Given an icmp instruction, return true if any use of this comparison is a

/// branch on sign bit comparison.


static bool hasBranchUse(ICmpInst &I) {

  for (auto *U : I.users())

    if (isa<BranchInst>(U))

      return true;

  return false;

}


/// Returns true if the exploded icmp can be expressed as a signed comparison

/// to zero and updates the predicate accordingly.

/// The signedness of the comparison is preserved.

/// TODO: Refactor with decomposeBitTestICmp()?


static bool isSignTest(ICmpInst::Predicate &Pred, const APInt &C) {

  if (!ICmpInst::isSigned(Pred))

    return false;


  if (C.isZero())

    return ICmpInst::isRelational(Pred);


  if (C.isOne()) {

    if (Pred == ICmpInst::ICMP_SLT) {

      Pred = ICmpInst::ICMP_SLE;

      return true;

    }

  } else if (C.isAllOnes()) {

    if (Pred == ICmpInst::ICMP_SGT) {

      Pred = ICmpInst::ICMP_SGE;

      return true;

    }

  }


  return false;

}


/// This is called when we see this pattern:

///   cmp pred (load (gep GV, ...)), cmpcst

/// where GV is a global variable with a constant initializer. Try to simplify

/// this into some simple computation that does not need the load. For example

/// we can optimize "icmp eq (load (gep "foo", 0, i)), 0" into "icmp eq i, 3".

///

/// If AndCst is non-null, then the loaded value is masked with that constant

/// before doing the comparison. This handles cases like "A[i]&4 == 0".


Instruction *InstCombinerImpl::foldCmpLoadFromIndexedGlobal(

    LoadInst *LI, GetElementPtrInst *GEP, CmpInst &ICI, ConstantInt *AndCst) {

  auto *GV = dyn_cast<GlobalVariable>(getUnderlyingObject(GEP));

  if (LI->isVolatile() || !GV || !GV->isConstant() ||

      !GV->hasDefinitiveInitializer())

    return nullptr;


  Type *EltTy = LI->getType();

  TypeSize EltSize = DL.getTypeStoreSize(EltTy);

  if (EltSize.isScalable())

    return nullptr;


  LinearExpression Expr = decomposeLinearExpression(DL, GEP);

  if (!Expr.Index || Expr.BasePtr != GV || Expr.Offset.getBitWidth() > 64)

    return nullptr;


  Constant *Init = GV->getInitializer();

  TypeSize GlobalSize = DL.getTypeAllocSize(Init->getType());


  Value *Idx = Expr.Index;

  const APInt &Stride = Expr.Scale;

  const APInt &ConstOffset = Expr.Offset;


  // Allow an additional context offset, but only within the stride.

  if (!ConstOffset.ult(Stride))

    return nullptr;


  // Don't handle overlapping loads for now.

  if (!Stride.uge(EltSize.getFixedValue()))

    return nullptr;


  // Don't blow up on huge arrays.

  uint64_t ArrayElementCount =

      divideCeil((GlobalSize.getFixedValue() - ConstOffset.getZExtValue()),

                 Stride.getZExtValue());

  if (ArrayElementCount > MaxArraySizeForCombine)

    return nullptr;


  enum { Overdefined = -3, Undefined = -2 };


  // Variables for our state machines.


  // FirstTrueElement/SecondTrueElement - Used to emit a comparison of the form

  // "i == 47 | i == 87", where 47 is the first index the condition is true for,

  // and 87 is the second (and last) index.  FirstTrueElement is -2 when

  // undefined, otherwise set to the first true element.  SecondTrueElement is

  // -2 when undefined, -3 when overdefined and >= 0 when that index is true.

  int FirstTrueElement = Undefined, SecondTrueElement = Undefined;


  // FirstFalseElement/SecondFalseElement - Used to emit a comparison of the

  // form "i != 47 & i != 87".  Same state transitions as for true elements.

  int FirstFalseElement = Undefined, SecondFalseElement = Undefined;


  /// TrueRangeEnd/FalseRangeEnd - In conjunction with First*Element, these

  /// define a state machine that triggers for ranges of values that the index

  /// is true or false for.  This triggers on things like "abbbbc"[i] == 'b'.

  /// This is -2 when undefined, -3 when overdefined, and otherwise the last

  /// index in the range (inclusive).  We use -2 for undefined here because we

  /// use relative comparisons and don't want 0-1 to match -1.

  int TrueRangeEnd = Undefined, FalseRangeEnd = Undefined;


  // MagicBitvector - This is a magic bitvector where we set a bit if the

  // comparison is true for element 'i'.  If there are 64 elements or less in

  // the array, this will fully represent all the comparison results.

  uint64_t MagicBitvector = 0;


  // Scan the array and see if one of our patterns matches.

  Constant *CompareRHS = cast<Constant>(ICI.getOperand(1));

  APInt Offset = ConstOffset;

  for (unsigned i = 0, e = ArrayElementCount; i != e; ++i, Offset += Stride) {

    Constant *Elt = ConstantFoldLoadFromConst(Init, EltTy, Offset, DL);

    if (!Elt)

      return nullptr;


    // If the element is masked, handle it.

    if (AndCst) {

      Elt = ConstantFoldBinaryOpOperands(Instruction::And, Elt, AndCst, DL);

      if (!Elt)

        return nullptr;

    }


    // Find out if the comparison would be true or false for the i'th element.

    Constant *C = ConstantFoldCompareInstOperands(ICI.getPredicate(), Elt,

                                                  CompareRHS, DL, &TLI);

    if (!C)

      return nullptr;


    // If the result is undef for this element, ignore it.

    if (isa<UndefValue>(C)) {

      // Extend range state machines to cover this element in case there is an

      // undef in the middle of the range.

      if (TrueRangeEnd == (int)i - 1)

        TrueRangeEnd = i;

      if (FalseRangeEnd == (int)i - 1)

        FalseRangeEnd = i;

      continue;

    }


    // If we can't compute the result for any of the elements, we have to give

    // up evaluating the entire conditional.

    if (!isa<ConstantInt>(C))

      return nullptr;


    // Otherwise, we know if the comparison is true or false for this element,

    // update our state machines.

    bool IsTrueForElt = !cast<ConstantInt>(C)->isZero();


    // State machine for single/double/range index comparison.

    if (IsTrueForElt) {

      // Update the TrueElement state machine.

      if (FirstTrueElement == Undefined)

        FirstTrueElement = TrueRangeEnd = i; // First true element.

      else {

        // Update double-compare state machine.

        if (SecondTrueElement == Undefined)

          SecondTrueElement = i;

        else

          SecondTrueElement = Overdefined;


        // Update range state machine.

        if (TrueRangeEnd == (int)i - 1)

          TrueRangeEnd = i;

        else

          TrueRangeEnd = Overdefined;

      }

    } else {

      // Update the FalseElement state machine.

      if (FirstFalseElement == Undefined)

        FirstFalseElement = FalseRangeEnd = i; // First false element.

      else {

        // Update double-compare state machine.

        if (SecondFalseElement == Undefined)

          SecondFalseElement = i;

        else

          SecondFalseElement = Overdefined;


        // Update range state machine.

        if (FalseRangeEnd == (int)i - 1)

          FalseRangeEnd = i;

        else

          FalseRangeEnd = Overdefined;

      }

    }


    // If this element is in range, update our magic bitvector.

    if (i < 64 && IsTrueForElt)

      MagicBitvector |= 1ULL << i;


    // If all of our states become overdefined, bail out early.  Since the

    // predicate is expensive, only check it every 8 elements.  This is only

    // really useful for really huge arrays.

    if ((i & 8) == 0 && i >= 64 && SecondTrueElement == Overdefined &&

        SecondFalseElement == Overdefined && TrueRangeEnd == Overdefined &&

        FalseRangeEnd == Overdefined)

      return nullptr;

  }


  // Now that we've scanned the entire array, emit our new comparison(s).  We

  // order the state machines in complexity of the generated code.


  // If inbounds keyword is not present, Idx * Stride can overflow.

  // Let's assume that Stride is 2 and the wanted value is at offset 0.

  // Then, there are two possible values for Idx to match offset 0:

  // 0x00..00, 0x80..00.

  // Emitting 'icmp eq Idx, 0' isn't correct in this case because the

  // comparison is false if Idx was 0x80..00.

  // We need to erase the highest countTrailingZeros(ElementSize) bits of Idx.

  auto MaskIdx = [&](Value *Idx) {

    if (!Expr.Flags.isInBounds() && Stride.countr_zero() != 0) {

      Value *Mask = Constant::getAllOnesValue(Idx->getType());

      Mask = Builder.CreateLShr(Mask, Stride.countr_zero());

      Idx = Builder.CreateAnd(Idx, Mask);

    }

    return Idx;

  };


  // If the comparison is only true for one or two elements, emit direct

  // comparisons.

  if (SecondTrueElement != Overdefined) {

    Idx = MaskIdx(Idx);

    // None true -> false.

    if (FirstTrueElement == Undefined)

      return replaceInstUsesWith(ICI, Builder.getFalse());


    Value *FirstTrueIdx = ConstantInt::get(Idx->getType(), FirstTrueElement);


    // True for one element -> 'i == 47'.

    if (SecondTrueElement == Undefined)

      return new ICmpInst(ICmpInst::ICMP_EQ, Idx, FirstTrueIdx);


    // True for two elements -> 'i == 47 | i == 72'.

    Value *C1 = Builder.CreateICmpEQ(Idx, FirstTrueIdx);

    Value *SecondTrueIdx = ConstantInt::get(Idx->getType(), SecondTrueElement);

    Value *C2 = Builder.CreateICmpEQ(Idx, SecondTrueIdx);

    return BinaryOperator::CreateOr(C1, C2);

  }


  // If the comparison is only false for one or two elements, emit direct

  // comparisons.

  if (SecondFalseElement != Overdefined) {

    Idx = MaskIdx(Idx);

    // None false -> true.

    if (FirstFalseElement == Undefined)

      return replaceInstUsesWith(ICI, Builder.getTrue());


    Value *FirstFalseIdx = ConstantInt::get(Idx->getType(), FirstFalseElement);


    // False for one element -> 'i != 47'.

    if (SecondFalseElement == Undefined)

      return new ICmpInst(ICmpInst::ICMP_NE, Idx, FirstFalseIdx);


    // False for two elements -> 'i != 47 & i != 72'.

    Value *C1 = Builder.CreateICmpNE(Idx, FirstFalseIdx);

    Value *SecondFalseIdx =

        ConstantInt::get(Idx->getType(), SecondFalseElement);

    Value *C2 = Builder.CreateICmpNE(Idx, SecondFalseIdx);

    return BinaryOperator::CreateAnd(C1, C2);

  }


  // If the comparison can be replaced with a range comparison for the elements

  // where it is true, emit the range check.

  if (TrueRangeEnd != Overdefined) {

    assert(TrueRangeEnd != FirstTrueElement && "Should emit single compare");

    Idx = MaskIdx(Idx);


    // Generate (i-FirstTrue) <u (TrueRangeEnd-FirstTrue+1).

    if (FirstTrueElement) {

      Value *Offs = ConstantInt::get(Idx->getType(), -FirstTrueElement);

      Idx = Builder.CreateAdd(Idx, Offs);

    }


    Value *End =

        ConstantInt::get(Idx->getType(), TrueRangeEnd - FirstTrueElement + 1);

    return new ICmpInst(ICmpInst::ICMP_ULT, Idx, End);

  }


  // False range check.

  if (FalseRangeEnd != Overdefined) {

    assert(FalseRangeEnd != FirstFalseElement && "Should emit single compare");

    Idx = MaskIdx(Idx);

    // Generate (i-FirstFalse) >u (FalseRangeEnd-FirstFalse).

    if (FirstFalseElement) {

      Value *Offs = ConstantInt::get(Idx->getType(), -FirstFalseElement);

      Idx = Builder.CreateAdd(Idx, Offs);

    }


    Value *End =

        ConstantInt::get(Idx->getType(), FalseRangeEnd - FirstFalseElement);

    return new ICmpInst(ICmpInst::ICMP_UGT, Idx, End);

  }


  // If a magic bitvector captures the entire comparison state

  // of this load, replace it with computation that does:

  //   ((magic_cst >> i) & 1) != 0

  {

    Type *Ty = nullptr;


    // Look for an appropriate type:

    // - The type of Idx if the magic fits

    // - The smallest fitting legal type

    if (ArrayElementCount <= Idx->getType()->getIntegerBitWidth())

      Ty = Idx->getType();

    else

      Ty = DL.getSmallestLegalIntType(Init->getContext(), ArrayElementCount);


    if (Ty) {

      Idx = MaskIdx(Idx);

      Value *V = Builder.CreateIntCast(Idx, Ty, false);

      V = Builder.CreateLShr(ConstantInt::get(Ty, MagicBitvector), V);

      V = Builder.CreateAnd(ConstantInt::get(Ty, 1), V);

      return new ICmpInst(ICmpInst::ICMP_NE, V, ConstantInt::get(Ty, 0));

    }

  }


  return nullptr;

}


/// Returns true if we can rewrite Start as a GEP with pointer Base

/// and some integer offset. The nodes that need to be re-written

/// for this transformation will be added to Explored.


static bool canRewriteGEPAsOffset(Value *Start, Value *Base, GEPNoWrapFlags &NW,

                                  const DataLayout &DL,

                                  SetVector<Value *> &Explored) {

  SmallVector<Value *, 16> WorkList(1, Start);

  Explored.insert(Base);


  // The following traversal gives us an order which can be used

  // when doing the final transformation. Since in the final

  // transformation we create the PHI replacement instructions first,

  // we don't have to get them in any particular order.

  //

  // However, for other instructions we will have to traverse the

  // operands of an instruction first, which means that we have to

  // do a post-order traversal.

  while (!WorkList.empty()) {

    SetVector<PHINode *> PHIs;


    while (!WorkList.empty()) {

      if (Explored.size() >= 100)

        return false;


      Value *V = WorkList.back();


      if (Explored.contains(V)) {

        WorkList.pop_back();

        continue;

      }


      if (!isa<GetElementPtrInst>(V) && !isa<PHINode>(V))

        // We've found some value that we can't explore which is different from

        // the base. Therefore we can't do this transformation.

        return false;


      if (auto *GEP = dyn_cast<GEPOperator>(V)) {

        // Only allow inbounds GEPs with at most one variable offset.

        auto IsNonConst = [](Value *V) { return !isa<ConstantInt>(V); };

        if (!GEP->isInBounds() || count_if(GEP->indices(), IsNonConst) > 1)

          return false;


        NW = NW.intersectForOffsetAdd(GEP->getNoWrapFlags());

        if (!Explored.contains(GEP->getOperand(0)))

          WorkList.push_back(GEP->getOperand(0));

      }


      if (WorkList.back() == V) {

        WorkList.pop_back();

        // We've finished visiting this node, mark it as such.

        Explored.insert(V);

      }


      if (auto *PN = dyn_cast<PHINode>(V)) {

        // We cannot transform PHIs on unsplittable basic blocks.

        if (isa<CatchSwitchInst>(PN->getParent()->getTerminator()))

          return false;

        Explored.insert(PN);

        PHIs.insert(PN);

      }

    }


    // Explore the PHI nodes further.

    for (auto *PN : PHIs)

      for (Value *Op : PN->incoming_values())

        if (!Explored.contains(Op))

          WorkList.push_back(Op);

  }


  // Make sure that we can do this. Since we can't insert GEPs in a basic

  // block before a PHI node, we can't easily do this transformation if

  // we have PHI node users of transformed instructions.

  for (Value *Val : Explored) {

    for (Value *Use : Val->uses()) {


      auto *PHI = dyn_cast<PHINode>(Use);

      auto *Inst = dyn_cast<Instruction>(Val);


      if (Inst == Base || Inst == PHI || !Inst || !PHI ||

          !Explored.contains(PHI))

        continue;


      if (PHI->getParent() == Inst->getParent())

        return false;

    }

  }

  return true;

}


// Sets the appropriate insert point on Builder where we can add

// a replacement Instruction for V (if that is possible).


static void setInsertionPoint(IRBuilder<> &Builder, Value *V,

                              bool Before = true) {

  if (auto *PHI = dyn_cast<PHINode>(V)) {

    BasicBlock *Parent = PHI->getParent();

    Builder.SetInsertPoint(Parent, Parent->getFirstInsertionPt());

    return;

  }

  if (auto *I = dyn_cast<Instruction>(V)) {

    if (!Before)

      I = &*std::next(I->getIterator());

    Builder.SetInsertPoint(I);

    return;

  }

  if (auto *A = dyn_cast<Argument>(V)) {

    // Set the insertion point in the entry block.

    BasicBlock &Entry = A->getParent()->getEntryBlock();

    Builder.SetInsertPoint(&Entry, Entry.getFirstInsertionPt());

    return;

  }

  // Otherwise, this is a constant and we don't need to set a new

  // insertion point.

  assert(isa<Constant>(V) && "Setting insertion point for unknown value!");

}


/// Returns a re-written value of Start as an indexed GEP using Base as a

/// pointer.


static Value *rewriteGEPAsOffset(Value *Start, Value *Base, GEPNoWrapFlags NW,

                                 const DataLayout &DL,

                                 SetVector<Value *> &Explored,

                                 InstCombiner &IC) {

  // Perform all the substitutions. This is a bit tricky because we can

  // have cycles in our use-def chains.

  // 1. Create the PHI nodes without any incoming values.

  // 2. Create all the other values.

  // 3. Add the edges for the PHI nodes.

  // 4. Emit GEPs to get the original pointers.

  // 5. Remove the original instructions.

  Type *IndexType = IntegerType::get(

      Base->getContext(), DL.getIndexTypeSizeInBits(Start->getType()));


  DenseMap<Value *, Value *> NewInsts;

  NewInsts[Base] = ConstantInt::getNullValue(IndexType);


  // Create the new PHI nodes, without adding any incoming values.

  for (Value *Val : Explored) {

    if (Val == Base)

      continue;

    // Create empty phi nodes. This avoids cyclic dependencies when creating

    // the remaining instructions.

    if (auto *PHI = dyn_cast<PHINode>(Val))

      NewInsts[PHI] =

          PHINode::Create(IndexType, PHI->getNumIncomingValues(),

                          PHI->getName() + ".idx", PHI->getIterator());

  }

  IRBuilder<> Builder(Base->getContext());


  // Create all the other instructions.

  for (Value *Val : Explored) {

    if (NewInsts.contains(Val))

      continue;


    if (auto *GEP = dyn_cast<GEPOperator>(Val)) {

      setInsertionPoint(Builder, GEP);

      Value *Op = NewInsts[GEP->getOperand(0)];

      Value *OffsetV = emitGEPOffset(&Builder, DL, GEP);

      if (isa<ConstantInt>(Op) && cast<ConstantInt>(Op)->isZero())

        NewInsts[GEP] = OffsetV;

      else

        NewInsts[GEP] = Builder.CreateAdd(

            Op, OffsetV, GEP->getOperand(0)->getName() + ".add",

            /*NUW=*/NW.hasNoUnsignedWrap(),

            /*NSW=*/NW.hasNoUnsignedSignedWrap());

      continue;

    }

    if (isa<PHINode>(Val))

      continue;


    llvm_unreachable("Unexpected instruction type");

  }


  // Add the incoming values to the PHI nodes.

  for (Value *Val : Explored) {

    if (Val == Base)

      continue;

    // All the instructions have been created, we can now add edges to the

    // phi nodes.

    if (auto *PHI = dyn_cast<PHINode>(Val)) {

      PHINode *NewPhi = static_cast<PHINode *>(NewInsts[PHI]);

      for (unsigned I = 0, E = PHI->getNumIncomingValues(); I < E; ++I) {

        Value *NewIncoming = PHI->getIncomingValue(I);


        auto It = NewInsts.find(NewIncoming);

        if (It != NewInsts.end())

          NewIncoming = It->second;


        NewPhi->addIncoming(NewIncoming, PHI->getIncomingBlock(I));

      }

    }

  }


  for (Value *Val : Explored) {

    if (Val == Base)

      continue;


    setInsertionPoint(Builder, Val, false);

    // Create GEP for external users.

    Value *NewVal = Builder.CreateGEP(Builder.getInt8Ty(), Base, NewInsts[Val],

                                      Val->getName() + ".ptr", NW);

    IC.replaceInstUsesWith(*cast<Instruction>(Val), NewVal);

    // Add old instruction to worklist for DCE. We don't directly remove it

    // here because the original compare is one of the users.

    IC.addToWorklist(cast<Instruction>(Val));

  }


  return NewInsts[Start];

}


/// Converts (CMP GEPLHS, RHS) if this change would make RHS a constant.

/// We can look through PHIs, GEPs and casts in order to determine a common base

/// between GEPLHS and RHS.


static Instruction *transformToIndexedCompare(GEPOperator *GEPLHS, Value *RHS,

                                              CmpPredicate Cond,

                                              const DataLayout &DL,

                                              InstCombiner &IC) {

  // FIXME: Support vector of pointers.

  if (GEPLHS->getType()->isVectorTy())

    return nullptr;


  if (!GEPLHS->hasAllConstantIndices())

    return nullptr;


  APInt Offset(DL.getIndexTypeSizeInBits(GEPLHS->getType()), 0);

  Value *PtrBase =

      GEPLHS->stripAndAccumulateConstantOffsets(DL, Offset,

                                                /*AllowNonInbounds*/ false);


  // Bail if we looked through addrspacecast.

  if (PtrBase->getType() != GEPLHS->getType())

    return nullptr;


  // The set of nodes that will take part in this transformation.

  SetVector<Value *> Nodes;

  GEPNoWrapFlags NW = GEPLHS->getNoWrapFlags();

  if (!canRewriteGEPAsOffset(RHS, PtrBase, NW, DL, Nodes))

    return nullptr;


  // We know we can re-write this as

  //  ((gep Ptr, OFFSET1) cmp (gep Ptr, OFFSET2)

  // Since we've only looked through inbouds GEPs we know that we

  // can't have overflow on either side. We can therefore re-write

  // this as:

  //   OFFSET1 cmp OFFSET2

  Value *NewRHS = rewriteGEPAsOffset(RHS, PtrBase, NW, DL, Nodes, IC);


  // RewriteGEPAsOffset has replaced RHS and all of its uses with a re-written

  // GEP having PtrBase as the pointer base, and has returned in NewRHS the

  // offset. Since Index is the offset of LHS to the base pointer, we will now

  // compare the offsets instead of comparing the pointers.

  return new ICmpInst(ICmpInst::getSignedPredicate(Cond),

                      IC.Builder.getInt(Offset), NewRHS);

}


/// Fold comparisons between a GEP instruction and something else. At this point

/// we know that the GEP is on the LHS of the comparison.


Instruction *InstCombinerImpl::foldGEPICmp(GEPOperator *GEPLHS, Value *RHS,

                                           CmpPredicate Cond, Instruction &I) {

  // Don't transform signed compares of GEPs into index compares. Even if the

  // GEP is inbounds, the final add of the base pointer can have signed overflow

  // and would change the result of the icmp.

  // e.g. "&foo[0] <s &foo[1]" can't be folded to "true" because "foo" could be

  // the maximum signed value for the pointer type.

  if (ICmpInst::isSigned(Cond))

    return nullptr;


  // Look through bitcasts and addrspacecasts. We do not however want to remove

  // 0 GEPs.

  if (!isa<GetElementPtrInst>(RHS))

    RHS = RHS->stripPointerCasts();


  auto CanFold = [Cond](GEPNoWrapFlags NW) {

    if (ICmpInst::isEquality(Cond))

      return true;


    // Unsigned predicates can be folded if the GEPs have *any* nowrap flags.

    assert(ICmpInst::isUnsigned(Cond));

    return NW != GEPNoWrapFlags::none();

  };


  auto NewICmp = [Cond](GEPNoWrapFlags NW, Value *Op1, Value *Op2) {

    if (!NW.hasNoUnsignedWrap()) {

      // Convert signed to unsigned comparison.

      return new ICmpInst(ICmpInst::getSignedPredicate(Cond), Op1, Op2);

    }


    auto *I = new ICmpInst(Cond, Op1, Op2);

    I->setSameSign(NW.hasNoUnsignedSignedWrap());

    return I;

  };


  CommonPointerBase Base = CommonPointerBase::compute(GEPLHS, RHS);

  if (Base.Ptr == RHS && CanFold(Base.LHSNW) && !Base.isExpensive()) {

    // ((gep Ptr, OFFSET) cmp Ptr)   ---> (OFFSET cmp 0).

    Type *IdxTy = DL.getIndexType(GEPLHS->getType());

    Value *Offset =

        EmitGEPOffsets(Base.LHSGEPs, Base.LHSNW, IdxTy, /*RewriteGEPs=*/true);

    return NewICmp(Base.LHSNW, Offset,

                   Constant::getNullValue(Offset->getType()));

  }


  if (GEPLHS->isInBounds() && ICmpInst::isEquality(Cond) &&

      isa<Constant>(RHS) && cast<Constant>(RHS)->isNullValue() &&

      !NullPointerIsDefined(I.getFunction(),

                            RHS->getType()->getPointerAddressSpace())) {

    // For most address spaces, an allocation can't be placed at null, but null

    // itself is treated as a 0 size allocation in the in bounds rules.  Thus,

    // the only valid inbounds address derived from null, is null itself.

    // Thus, we have four cases to consider:

    // 1) Base == nullptr, Offset == 0 -> inbounds, null

    // 2) Base == nullptr, Offset != 0 -> poison as the result is out of bounds

    // 3) Base != nullptr, Offset == (-base) -> poison (crossing allocations)

    // 4) Base != nullptr, Offset != (-base) -> nonnull (and possibly poison)

    //

    // (Note if we're indexing a type of size 0, that simply collapses into one

    //  of the buckets above.)

    //

    // In general, we're allowed to make values less poison (i.e. remove

    //   sources of full UB), so in this case, we just select between the two

    //   non-poison cases (1 and 4 above).

    //

    // For vectors, we apply the same reasoning on a per-lane basis.

    auto *Base = GEPLHS->getPointerOperand();

    if (GEPLHS->getType()->isVectorTy() && Base->getType()->isPointerTy()) {

      auto EC = cast<VectorType>(GEPLHS->getType())->getElementCount();

      Base = Builder.CreateVectorSplat(EC, Base);

    }

    return new ICmpInst(Cond, Base,

                        ConstantExpr::getPointerBitCastOrAddrSpaceCast(

                            cast<Constant>(RHS), Base->getType()));

  } else if (GEPOperator *GEPRHS = dyn_cast<GEPOperator>(RHS)) {

    GEPNoWrapFlags NW = GEPLHS->getNoWrapFlags() & GEPRHS->getNoWrapFlags();


    // If the base pointers are different, but the indices are the same, just

    // compare the base pointer.

    if (GEPLHS->getOperand(0) != GEPRHS->getOperand(0)) {

      bool IndicesTheSame =

          GEPLHS->getNumOperands() == GEPRHS->getNumOperands() &&

          GEPLHS->getPointerOperand()->getType() ==

              GEPRHS->getPointerOperand()->getType() &&

          GEPLHS->getSourceElementType() == GEPRHS->getSourceElementType();

      if (IndicesTheSame)

        for (unsigned i = 1, e = GEPLHS->getNumOperands(); i != e; ++i)

          if (GEPLHS->getOperand(i) != GEPRHS->getOperand(i)) {

            IndicesTheSame = false;

            break;

          }


      // If all indices are the same, just compare the base pointers.

      Type *BaseType = GEPLHS->getOperand(0)->getType();

      if (IndicesTheSame &&

          CmpInst::makeCmpResultType(BaseType) == I.getType() && CanFold(NW))

        return new ICmpInst(Cond, GEPLHS->getOperand(0), GEPRHS->getOperand(0));


      // If we're comparing GEPs with two base pointers that only differ in type

      // and both GEPs have only constant indices or just one use, then fold

      // the compare with the adjusted indices.

      // FIXME: Support vector of pointers.

      if (GEPLHS->isInBounds() && GEPRHS->isInBounds() &&

          (GEPLHS->hasAllConstantIndices() || GEPLHS->hasOneUse()) &&

          (GEPRHS->hasAllConstantIndices() || GEPRHS->hasOneUse()) &&

          GEPLHS->getOperand(0)->stripPointerCasts() ==

              GEPRHS->getOperand(0)->stripPointerCasts() &&

          !GEPLHS->getType()->isVectorTy()) {

        Value *LOffset = EmitGEPOffset(GEPLHS);

        Value *ROffset = EmitGEPOffset(GEPRHS);


        // If we looked through an addrspacecast between different sized address

        // spaces, the LHS and RHS pointers are different sized

        // integers. Truncate to the smaller one.

        Type *LHSIndexTy = LOffset->getType();

        Type *RHSIndexTy = ROffset->getType();

        if (LHSIndexTy != RHSIndexTy) {

          if (LHSIndexTy->getPrimitiveSizeInBits().getFixedValue() <

              RHSIndexTy->getPrimitiveSizeInBits().getFixedValue()) {

            ROffset = Builder.CreateTrunc(ROffset, LHSIndexTy);

          } else

            LOffset = Builder.CreateTrunc(LOffset, RHSIndexTy);

        }


        Value *Cmp = Builder.CreateICmp(ICmpInst::getSignedPredicate(Cond),

                                        LOffset, ROffset);

        return replaceInstUsesWith(I, Cmp);

      }

    }


    if (GEPLHS->getOperand(0) == GEPRHS->getOperand(0) &&

        GEPLHS->getNumOperands() == GEPRHS->getNumOperands() &&

        GEPLHS->getSourceElementType() == GEPRHS->getSourceElementType()) {

      // If the GEPs only differ by one index, compare it.

      unsigned NumDifferences = 0; // Keep track of # differences.

      unsigned DiffOperand = 0;    // The operand that differs.

      for (unsigned i = 1, e = GEPRHS->getNumOperands(); i != e; ++i)

        if (GEPLHS->getOperand(i) != GEPRHS->getOperand(i)) {

          Type *LHSType = GEPLHS->getOperand(i)->getType();

          Type *RHSType = GEPRHS->getOperand(i)->getType();

          // FIXME: Better support for vector of pointers.

          if (LHSType->getPrimitiveSizeInBits() !=

                  RHSType->getPrimitiveSizeInBits() ||

              (GEPLHS->getType()->isVectorTy() &&

               (!LHSType->isVectorTy() || !RHSType->isVectorTy()))) {

            // Irreconcilable differences.

            NumDifferences = 2;

            break;

          }


          if (NumDifferences++)

            break;

          DiffOperand = i;

        }


      if (NumDifferences == 0) // SAME GEP?

        return replaceInstUsesWith(

            I, // No comparison is needed here.

            ConstantInt::get(I.getType(), ICmpInst::isTrueWhenEqual(Cond)));

      // If two GEPs only differ by an index, compare them.

      // Note that nowrap flags are always needed when comparing two indices.

      else if (NumDifferences == 1 && NW != GEPNoWrapFlags::none()) {

        Value *LHSV = GEPLHS->getOperand(DiffOperand);

        Value *RHSV = GEPRHS->getOperand(DiffOperand);

        return NewICmp(NW, LHSV, RHSV);

      }

    }


    if (Base.Ptr && CanFold(Base.LHSNW & Base.RHSNW) && !Base.isExpensive()) {

      // ((gep Ptr, OFFSET1) cmp (gep Ptr, OFFSET2)  --->  (OFFSET1 cmp OFFSET2)

      Type *IdxTy = DL.getIndexType(GEPLHS->getType());

      Value *L =

          EmitGEPOffsets(Base.LHSGEPs, Base.LHSNW, IdxTy, /*RewriteGEP=*/true);

      Value *R =

          EmitGEPOffsets(Base.RHSGEPs, Base.RHSNW, IdxTy, /*RewriteGEP=*/true);

      return NewICmp(Base.LHSNW & Base.RHSNW, L, R);

    }

  }


  // Try convert this to an indexed compare by looking through PHIs/casts as a

  // last resort.

  return transformToIndexedCompare(GEPLHS, RHS, Cond, DL, *this);

}


bool InstCombinerImpl::foldAllocaCmp(AllocaInst *Alloca) {

  // It would be tempting to fold away comparisons between allocas and any

  // pointer not based on that alloca (e.g. an argument). However, even

  // though such pointers cannot alias, they can still compare equal.

  //

  // But LLVM doesn't specify where allocas get their memory, so if the alloca

  // doesn't escape we can argue that it's impossible to guess its value, and we

  // can therefore act as if any such guesses are wrong.

  //

  // However, we need to ensure that this folding is consistent: We can't fold

  // one comparison to false, and then leave a different comparison against the

  // same value alone (as it might evaluate to true at runtime, leading to a

  // contradiction). As such, this code ensures that all comparisons are folded

  // at the same time, and there are no other escapes.


  struct CmpCaptureTracker : public CaptureTracker {

    AllocaInst *Alloca;

    bool Captured = false;

    /// The value of the map is a bit mask of which icmp operands the alloca is

    /// used in.

    SmallMapVector<ICmpInst *, unsigned, 4> ICmps;


    CmpCaptureTracker(AllocaInst *Alloca) : Alloca(Alloca) {}


    void tooManyUses() override { Captured = true; }


    Action captured(const Use *U, UseCaptureInfo CI) override {

      // TODO(captures): Use UseCaptureInfo.

      auto *ICmp = dyn_cast<ICmpInst>(U->getUser());

      // We need to check that U is based *only* on the alloca, and doesn't

      // have other contributions from a select/phi operand.

      // TODO: We could check whether getUnderlyingObjects() reduces to one

      // object, which would allow looking through phi nodes.

      if (ICmp && ICmp->isEquality() && getUnderlyingObject(*U) == Alloca) {

        // Collect equality icmps of the alloca, and don't treat them as

        // captures.

        ICmps[ICmp] |= 1u << U->getOperandNo();

        return Continue;

      }


      Captured = true;

      return Stop;

    }

  };


  CmpCaptureTracker Tracker(Alloca);

  PointerMayBeCaptured(Alloca, &Tracker);

  if (Tracker.Captured)

    return false;


  bool Changed = false;

  for (auto [ICmp, Operands] : Tracker.ICmps) {

    switch (Operands) {

    case 1:

    case 2: {

      // The alloca is only used in one icmp operand. Assume that the

      // equality is false.

      auto *Res = ConstantInt::get(ICmp->getType(),

                                   ICmp->getPredicate() == ICmpInst::ICMP_NE);

      replaceInstUsesWith(*ICmp, Res);

      eraseInstFromFunction(*ICmp);

      Changed = true;

      break;

    }

    case 3:

      // Both icmp operands are based on the alloca, so this is comparing

      // pointer offsets, without leaking any information about the address

      // of the alloca. Ignore such comparisons.

      break;

    default:

      llvm_unreachable("Cannot happen");

    }

  }


  return Changed;

}


/// Fold "icmp pred (X+C), X".


Instruction *InstCombinerImpl::foldICmpAddOpConst(Value *X, const APInt &C,

                                                  CmpPredicate Pred) {

  // From this point on, we know that (X+C <= X) --> (X+C < X) because C != 0,

  // so the values can never be equal.  Similarly for all other "or equals"

  // operators.

  assert(!!C && "C should not be zero!");


  // (X+1) <u X        --> X >u (MAXUINT-1)        --> X == 255

  // (X+2) <u X        --> X >u (MAXUINT-2)        --> X > 253

  // (X+MAXUINT) <u X  --> X >u (MAXUINT-MAXUINT)  --> X != 0

  if (Pred == ICmpInst::ICMP_ULT || Pred == ICmpInst::ICMP_ULE) {

    Constant *R =

        ConstantInt::get(X->getType(), APInt::getMaxValue(C.getBitWidth()) - C);

    return new ICmpInst(ICmpInst::ICMP_UGT, X, R);

  }


  // (X+1) >u X        --> X <u (0-1)        --> X != 255

  // (X+2) >u X        --> X <u (0-2)        --> X <u 254

  // (X+MAXUINT) >u X  --> X <u (0-MAXUINT)  --> X <u 1  --> X == 0

  if (Pred == ICmpInst::ICMP_UGT || Pred == ICmpInst::ICMP_UGE)

    return new ICmpInst(ICmpInst::ICMP_ULT, X,

                        ConstantInt::get(X->getType(), -C));


  APInt SMax = APInt::getSignedMaxValue(C.getBitWidth());


  // (X+ 1) <s X       --> X >s (MAXSINT-1)          --> X == 127

  // (X+ 2) <s X       --> X >s (MAXSINT-2)          --> X >s 125

  // (X+MAXSINT) <s X  --> X >s (MAXSINT-MAXSINT)    --> X >s 0

  // (X+MINSINT) <s X  --> X >s (MAXSINT-MINSINT)    --> X >s -1

  // (X+ -2) <s X      --> X >s (MAXSINT- -2)        --> X >s 126

  // (X+ -1) <s X      --> X >s (MAXSINT- -1)        --> X != 127

  if (Pred == ICmpInst::ICMP_SLT || Pred == ICmpInst::ICMP_SLE)

    return new ICmpInst(ICmpInst::ICMP_SGT, X,

                        ConstantInt::get(X->getType(), SMax - C));


  // (X+ 1) >s X       --> X <s (MAXSINT-(1-1))       --> X != 127

  // (X+ 2) >s X       --> X <s (MAXSINT-(2-1))       --> X <s 126

  // (X+MAXSINT) >s X  --> X <s (MAXSINT-(MAXSINT-1)) --> X <s 1

  // (X+MINSINT) >s X  --> X <s (MAXSINT-(MINSINT-1)) --> X <s -2

  // (X+ -2) >s X      --> X <s (MAXSINT-(-2-1))      --> X <s -126

  // (X+ -1) >s X      --> X <s (MAXSINT-(-1-1))      --> X == -128


  assert(Pred == ICmpInst::ICMP_SGT || Pred == ICmpInst::ICMP_SGE);

  return new ICmpInst(ICmpInst::ICMP_SLT, X,

                      ConstantInt::get(X->getType(), SMax - (C - 1)));

}


/// Handle "(icmp eq/ne (ashr/lshr AP2, A), AP1)" ->

/// (icmp eq/ne A, Log2(AP2/AP1)) ->

/// (icmp eq/ne A, Log2(AP2) - Log2(AP1)).


Instruction *InstCombinerImpl::foldICmpShrConstConst(ICmpInst &I, Value *A,

                                                     const APInt &AP1,

                                                     const APInt &AP2) {

  assert(I.isEquality() && "Cannot fold icmp gt/lt");


  auto getICmp = [&I](CmpInst::Predicate Pred, Value *LHS, Value *RHS) {

    if (I.getPredicate() == I.ICMP_NE)

      Pred = CmpInst::getInversePredicate(Pred);

    return new ICmpInst(Pred, LHS, RHS);

  };


  // Don't bother doing any work for cases which InstSimplify handles.

  if (AP2.isZero())

    return nullptr;


  bool IsAShr = isa<AShrOperator>(I.getOperand(0));

  if (IsAShr) {

    if (AP2.isAllOnes())

      return nullptr;

    if (AP2.isNegative() != AP1.isNegative())

      return nullptr;

    if (AP2.sgt(AP1))

      return nullptr;

  }


  if (!AP1)

    // 'A' must be large enough to shift out the highest set bit.

    return getICmp(I.ICMP_UGT, A,

                   ConstantInt::get(A->getType(), AP2.logBase2()));


  if (AP1 == AP2)

    return getICmp(I.ICMP_EQ, A, ConstantInt::getNullValue(A->getType()));


  int Shift;

  if (IsAShr && AP1.isNegative())

    Shift = AP1.countl_one() - AP2.countl_one();

  else

    Shift = AP1.countl_zero() - AP2.countl_zero();


  if (Shift > 0) {

    if (IsAShr && AP1 == AP2.ashr(Shift)) {

      // There are multiple solutions if we are comparing against -1 and the LHS

      // of the ashr is not a power of two.

      if (AP1.isAllOnes() && !AP2.isPowerOf2())

        return getICmp(I.ICMP_UGE, A, ConstantInt::get(A->getType(), Shift));

      return getICmp(I.ICMP_EQ, A, ConstantInt::get(A->getType(), Shift));

    } else if (AP1 == AP2.lshr(Shift)) {

      return getICmp(I.ICMP_EQ, A, ConstantInt::get(A->getType(), Shift));

    }

  }


  // Shifting const2 will never be equal to const1.

  // FIXME: This should always be handled by InstSimplify?

  auto *TorF = ConstantInt::get(I.getType(), I.getPredicate() == I.ICMP_NE);

  return replaceInstUsesWith(I, TorF);

}


/// Handle "(icmp eq/ne (shl AP2, A), AP1)" ->

/// (icmp eq/ne A, TrailingZeros(AP1) - TrailingZeros(AP2)).


Instruction *InstCombinerImpl::foldICmpShlConstConst(ICmpInst &I, Value *A,

                                                     const APInt &AP1,

                                                     const APInt &AP2) {

  assert(I.isEquality() && "Cannot fold icmp gt/lt");


  auto getICmp = [&I](CmpInst::Predicate Pred, Value *LHS, Value *RHS) {

    if (I.getPredicate() == I.ICMP_NE)

      Pred = CmpInst::getInversePredicate(Pred);

    return new ICmpInst(Pred, LHS, RHS);

  };


  // Don't bother doing any work for cases which InstSimplify handles.

  if (AP2.isZero())

    return nullptr;


  unsigned AP2TrailingZeros = AP2.countr_zero();


  if (!AP1 && AP2TrailingZeros != 0)

    return getICmp(

        I.ICMP_UGE, A,

        ConstantInt::get(A->getType(), AP2.getBitWidth() - AP2TrailingZeros));


  if (AP1 == AP2)

    return getICmp(I.ICMP_EQ, A, ConstantInt::getNullValue(A->getType()));


  // Get the distance between the lowest bits that are set.

  int Shift = AP1.countr_zero() - AP2TrailingZeros;


  if (Shift > 0 && AP2.shl(Shift) == AP1)

    return getICmp(I.ICMP_EQ, A, ConstantInt::get(A->getType(), Shift));


  // Shifting const2 will never be equal to const1.

  // FIXME: This should always be handled by InstSimplify?

  auto *TorF = ConstantInt::get(I.getType(), I.getPredicate() == I.ICMP_NE);

  return replaceInstUsesWith(I, TorF);

}


/// The caller has matched a pattern of the form:

///   I = icmp ugt (add (add A, B), CI2), CI1

/// If this is of the form:

///   sum = a + b

///   if (sum+128 >u 255)

/// Then replace it with llvm.sadd.with.overflow.i8.

///


static Instruction *processUGT_ADDCST_ADD(ICmpInst &I, Value *A, Value *B,

                                          ConstantInt *CI2, ConstantInt *CI1,

                                          InstCombinerImpl &IC) {

  // The transformation we're trying to do here is to transform this into an

  // llvm.sadd.with.overflow.  To do this, we have to replace the original add

  // with a narrower add, and discard the add-with-constant that is part of the

  // range check (if we can't eliminate it, this isn't profitable).


  // In order to eliminate the add-with-constant, the compare can be its only

  // use.

  Instruction *AddWithCst = cast<Instruction>(I.getOperand(0));

  if (!AddWithCst->hasOneUse())

    return nullptr;


  // If CI2 is 2^7, 2^15, 2^31, then it might be an sadd.with.overflow.

  if (!CI2->getValue().isPowerOf2())

    return nullptr;

  unsigned NewWidth = CI2->getValue().countr_zero();

  if (NewWidth != 7 && NewWidth != 15 && NewWidth != 31)

    return nullptr;


  // The width of the new add formed is 1 more than the bias.

  ++NewWidth;


  // Check to see that CI1 is an all-ones value with NewWidth bits.

  if (CI1->getBitWidth() == NewWidth ||

      CI1->getValue() != APInt::getLowBitsSet(CI1->getBitWidth(), NewWidth))

    return nullptr;


  // This is only really a signed overflow check if the inputs have been

  // sign-extended; check for that condition. For example, if CI2 is 2^31 and

  // the operands of the add are 64 bits wide, we need at least 33 sign bits.

  if (IC.ComputeMaxSignificantBits(A, &I) > NewWidth ||

      IC.ComputeMaxSignificantBits(B, &I) > NewWidth)

    return nullptr;


  // In order to replace the original add with a narrower

  // llvm.sadd.with.overflow, the only uses allowed are the add-with-constant

  // and truncates that discard the high bits of the add.  Verify that this is

  // the case.

  Instruction *OrigAdd = cast<Instruction>(AddWithCst->getOperand(0));

  for (User *U : OrigAdd->users()) {

    if (U == AddWithCst)

      continue;


    // Only accept truncates for now.  We would really like a nice recursive

    // predicate like SimplifyDemandedBits, but which goes downwards the use-def

    // chain to see which bits of a value are actually demanded.  If the

    // original add had another add which was then immediately truncated, we

    // could still do the transformation.

    TruncInst *TI = dyn_cast<TruncInst>(U);

    if (!TI || TI->getType()->getPrimitiveSizeInBits() > NewWidth)

      return nullptr;

  }


  // If the pattern matches, truncate the inputs to the narrower type and

  // use the sadd_with_overflow intrinsic to efficiently compute both the

  // result and the overflow bit.

  Type *NewType = IntegerType::get(OrigAdd->getContext(), NewWidth);

  Function *F = Intrinsic::getOrInsertDeclaration(

      I.getModule(), Intrinsic::sadd_with_overflow, NewType);


  InstCombiner::BuilderTy &Builder = IC.Builder;


  // Put the new code above the original add, in case there are any uses of the

  // add between the add and the compare.

  Builder.SetInsertPoint(OrigAdd);


  Value *TruncA = Builder.CreateTrunc(A, NewType, A->getName() + ".trunc");

  Value *TruncB = Builder.CreateTrunc(B, NewType, B->getName() + ".trunc");

  CallInst *Call = Builder.CreateCall(F, {TruncA, TruncB}, "sadd");

  Value *Add = Builder.CreateExtractValue(Call, 0, "sadd.result");

  Value *ZExt = Builder.CreateZExt(Add, OrigAdd->getType());


  // The inner add was the result of the narrow add, zero extended to the

  // wider type.  Replace it with the result computed by the intrinsic.

  IC.replaceInstUsesWith(*OrigAdd, ZExt);

  IC.eraseInstFromFunction(*OrigAdd);


  // The original icmp gets replaced with the overflow value.

  return ExtractValueInst::Create(Call, 1, "sadd.overflow");

}


/// If we have:

///   icmp eq/ne (urem/srem %x, %y), 0

/// iff %y is a power-of-two, we can replace this with a bit test:

///   icmp eq/ne (and %x, (add %y, -1)), 0


Instruction *InstCombinerImpl::foldIRemByPowerOfTwoToBitTest(ICmpInst &I) {

  // This fold is only valid for equality predicates.

  if (!I.isEquality())

    return nullptr;

  CmpPredicate Pred;

  Value *X, *Y, *Zero;

  if (!match(&I, m_ICmp(Pred, m_OneUse(m_IRem(m_Value(X), m_Value(Y))),

                        m_CombineAnd(m_Zero(), m_Value(Zero)))))

    return nullptr;

  if (!isKnownToBeAPowerOfTwo(Y, /*OrZero*/ true, &I))

    return nullptr;

  // This may increase instruction count, we don't enforce that Y is a constant.

  Value *Mask = Builder.CreateAdd(Y, Constant::getAllOnesValue(Y->getType()));

  Value *Masked = Builder.CreateAnd(X, Mask);

  return ICmpInst::Create(Instruction::ICmp, Pred, Masked, Zero);

}


/// Fold equality-comparison between zero and any (maybe truncated) right-shift

/// by one-less-than-bitwidth into a sign test on the original value.


Instruction *InstCombinerImpl::foldSignBitTest(ICmpInst &I) {

  Instruction *Val;

  CmpPredicate Pred;

  if (!I.isEquality() || !match(&I, m_ICmp(Pred, m_Instruction(Val), m_Zero())))

    return nullptr;


  Value *X;

  Type *XTy;


  Constant *C;

  if (match(Val, m_TruncOrSelf(m_Shr(m_Value(X), m_Constant(C))))) {

    XTy = X->getType();

    unsigned XBitWidth = XTy->getScalarSizeInBits();

    if (!match(C, m_SpecificInt_ICMP(ICmpInst::Predicate::ICMP_EQ,

                                     APInt(XBitWidth, XBitWidth - 1))))

      return nullptr;

  } else if (isa<BinaryOperator>(Val) &&

             (X = reassociateShiftAmtsOfTwoSameDirectionShifts(

                  cast<BinaryOperator>(Val), SQ.getWithInstruction(Val),

                  /*AnalyzeForSignBitExtraction=*/true))) {

    XTy = X->getType();

  } else

    return nullptr;


  return ICmpInst::Create(Instruction::ICmp,

                          Pred == ICmpInst::ICMP_EQ ? ICmpInst::ICMP_SGE

                                                    : ICmpInst::ICMP_SLT,

                          X, ConstantInt::getNullValue(XTy));

}


// Handle  icmp pred X, 0


Instruction *InstCombinerImpl::foldICmpWithZero(ICmpInst &Cmp) {

  CmpInst::Predicate Pred = Cmp.getPredicate();

  if (!match(Cmp.getOperand(1), m_Zero()))

    return nullptr;


  // (icmp sgt smin(PosA, B) 0) -> (icmp sgt B 0)

  if (Pred == ICmpInst::ICMP_SGT) {

    Value *A, *B;

    if (match(Cmp.getOperand(0), m_SMin(m_Value(A), m_Value(B)))) {

      if (isKnownPositive(A, SQ.getWithInstruction(&Cmp)))

        return new ICmpInst(Pred, B, Cmp.getOperand(1));

      if (isKnownPositive(B, SQ.getWithInstruction(&Cmp)))

        return new ICmpInst(Pred, A, Cmp.getOperand(1));

    }

  }


  if (Instruction *New = foldIRemByPowerOfTwoToBitTest(Cmp))

    return New;


  // Given:

  //   icmp eq/ne (urem %x, %y), 0

  // Iff %x has 0 or 1 bits set, and %y has at least 2 bits set, omit 'urem':

  //   icmp eq/ne %x, 0

  Value *X, *Y;

  if (match(Cmp.getOperand(0), m_URem(m_Value(X), m_Value(Y))) &&

      ICmpInst::isEquality(Pred)) {

    KnownBits XKnown = computeKnownBits(X, &Cmp);

    KnownBits YKnown = computeKnownBits(Y, &Cmp);

    if (XKnown.countMaxPopulation() == 1 && YKnown.countMinPopulation() >= 2)

      return new ICmpInst(Pred, X, Cmp.getOperand(1));

  }


  // (icmp eq/ne (mul X Y)) -> (icmp eq/ne X/Y) if we know about whether X/Y are

  // odd/non-zero/there is no overflow.

  if (match(Cmp.getOperand(0), m_Mul(m_Value(X), m_Value(Y))) &&

      ICmpInst::isEquality(Pred)) {


    KnownBits XKnown = computeKnownBits(X, &Cmp);

    // if X % 2 != 0

    //    (icmp eq/ne Y)

    if (XKnown.countMaxTrailingZeros() == 0)

      return new ICmpInst(Pred, Y, Cmp.getOperand(1));


    KnownBits YKnown = computeKnownBits(Y, &Cmp);

    // if Y % 2 != 0

    //    (icmp eq/ne X)

    if (YKnown.countMaxTrailingZeros() == 0)

      return new ICmpInst(Pred, X, Cmp.getOperand(1));


    auto *BO0 = cast<OverflowingBinaryOperator>(Cmp.getOperand(0));

    if (BO0->hasNoUnsignedWrap() || BO0->hasNoSignedWrap()) {

      const SimplifyQuery Q = SQ.getWithInstruction(&Cmp);

      // `isKnownNonZero` does more analysis than just `!KnownBits.One.isZero()`

      // but to avoid unnecessary work, first just if this is an obvious case.


      // if X non-zero and NoOverflow(X * Y)

      //    (icmp eq/ne Y)

      if (!XKnown.One.isZero() || isKnownNonZero(X, Q))

        return new ICmpInst(Pred, Y, Cmp.getOperand(1));


      // if Y non-zero and NoOverflow(X * Y)

      //    (icmp eq/ne X)

      if (!YKnown.One.isZero() || isKnownNonZero(Y, Q))

        return new ICmpInst(Pred, X, Cmp.getOperand(1));

    }

    // Note, we are skipping cases:

    //      if Y % 2 != 0 AND X % 2 != 0

    //          (false/true)

    //      if X non-zero and Y non-zero and NoOverflow(X * Y)

    //          (false/true)

    // Those can be simplified later as we would have already replaced the (icmp

    // eq/ne (mul X, Y)) with (icmp eq/ne X/Y) and if X/Y is known non-zero that

    // will fold to a constant elsewhere.

  }


  // (icmp eq/ne f(X), 0) -> (icmp eq/ne X, 0)

  // where f(X) == 0 if and only if X == 0

  if (ICmpInst::isEquality(Pred))

    if (Value *Stripped = stripNullTest(Cmp.getOperand(0)))

      return new ICmpInst(Pred, Stripped,

                          Constant::getNullValue(Stripped->getType()));


  return nullptr;

}


/// Fold icmp eq (num + mask) & ~mask, num

///      to

///      icmp eq (and num, mask), 0

/// Where mask is a low bit mask.


Instruction *InstCombinerImpl::foldIsMultipleOfAPowerOfTwo(ICmpInst &Cmp) {

  Value *Num;

  CmpPredicate Pred;

  const APInt *Mask, *Neg;


  if (!match(&Cmp,

             m_c_ICmp(Pred, m_Value(Num),

                      m_OneUse(m_c_And(m_OneUse(m_c_Add(m_Deferred(Num),

                                                        m_LowBitMask(Mask))),

                                       m_APInt(Neg))))))

    return nullptr;


  if (*Neg != ~*Mask)

    return nullptr;


  if (!ICmpInst::isEquality(Pred))

    return nullptr;


  // Create new icmp eq (num & mask), 0

  auto *NewAnd = Builder.CreateAnd(Num, *Mask);

  auto *Zero = Constant::getNullValue(Num->getType());


  return new ICmpInst(Pred, NewAnd, Zero);

}


/// Fold icmp Pred X, C.

/// TODO: This code structure does not make sense. The saturating add fold

/// should be moved to some other helper and extended as noted below (it is also

/// possible that code has been made unnecessary - do we canonicalize IR to

/// overflow/saturating intrinsics or not?).


Instruction *InstCombinerImpl::foldICmpWithConstant(ICmpInst &Cmp) {

  // Match the following pattern, which is a common idiom when writing

  // overflow-safe integer arithmetic functions. The source performs an addition

  // in wider type and explicitly checks for overflow using comparisons against

  // INT_MIN and INT_MAX. Simplify by using the sadd_with_overflow intrinsic.

  //

  // TODO: This could probably be generalized to handle other overflow-safe

  // operations if we worked out the formulas to compute the appropriate magic

  // constants.

  //

  // sum = a + b

  // if (sum+128 >u 255)  ...  -> llvm.sadd.with.overflow.i8

  CmpInst::Predicate Pred = Cmp.getPredicate();

  Value *Op0 = Cmp.getOperand(0), *Op1 = Cmp.getOperand(1);

  Value *A, *B;

  ConstantInt *CI, *CI2; // I = icmp ugt (add (add A, B), CI2), CI

  if (Pred == ICmpInst::ICMP_UGT && match(Op1, m_ConstantInt(CI)) &&

      match(Op0, m_Add(m_Add(m_Value(A), m_Value(B)), m_ConstantInt(CI2))))

    if (Instruction *Res = processUGT_ADDCST_ADD(Cmp, A, B, CI2, CI, *this))

      return Res;


  // icmp(phi(C1, C2, ...), C) -> phi(icmp(C1, C), icmp(C2, C), ...).

  Constant *C = dyn_cast<Constant>(Op1);

  if (!C)

    return nullptr;


  if (auto *Phi = dyn_cast<PHINode>(Op0))

    if (all_of(Phi->operands(), [](Value *V) { return isa<Constant>(V); })) {

      SmallVector<Constant *> Ops;

      for (Value *V : Phi->incoming_values()) {

        Constant *Res =

            ConstantFoldCompareInstOperands(Pred, cast<Constant>(V), C, DL);

        if (!Res)

          return nullptr;

        Ops.push_back(Res);

      }

      Builder.SetInsertPoint(Phi);

      PHINode *NewPhi = Builder.CreatePHI(Cmp.getType(), Phi->getNumOperands());

      for (auto [V, Pred] : zip(Ops, Phi->blocks()))

        NewPhi->addIncoming(V, Pred);

      return replaceInstUsesWith(Cmp, NewPhi);

    }


  if (Instruction *R = tryFoldInstWithCtpopWithNot(&Cmp))

    return R;


  return nullptr;

}


/// Canonicalize icmp instructions based on dominating conditions.


Instruction *InstCombinerImpl::foldICmpWithDominatingICmp(ICmpInst &Cmp) {

  // We already checked simple implication in InstSimplify, only handle complex

  // cases here.

  Value *X = Cmp.getOperand(0), *Y = Cmp.getOperand(1);

  const APInt *C;

  if (!match(Y, m_APInt(C)))

    return nullptr;


  CmpInst::Predicate Pred = Cmp.getPredicate();

  ConstantRange CR = ConstantRange::makeExactICmpRegion(Pred, *C);


  auto handleDomCond = [&](ICmpInst::Predicate DomPred,

                           const APInt *DomC) -> Instruction * {

    // We have 2 compares of a variable with constants. Calculate the constant

    // ranges of those compares to see if we can transform the 2nd compare:

    // DomBB:

    //   DomCond = icmp DomPred X, DomC

    //   br DomCond, CmpBB, FalseBB

    // CmpBB:

    //   Cmp = icmp Pred X, C

    ConstantRange DominatingCR =

        ConstantRange::makeExactICmpRegion(DomPred, *DomC);

    ConstantRange Intersection = DominatingCR.intersectWith(CR);

    ConstantRange Difference = DominatingCR.difference(CR);

    if (Intersection.isEmptySet())

      return replaceInstUsesWith(Cmp, Builder.getFalse());

    if (Difference.isEmptySet())

      return replaceInstUsesWith(Cmp, Builder.getTrue());


    // Canonicalizing a sign bit comparison that gets used in a branch,

    // pessimizes codegen by generating branch on zero instruction instead

    // of a test and branch. So we avoid canonicalizing in such situations

    // because test and branch instruction has better branch displacement

    // than compare and branch instruction.

    bool UnusedBit;

    bool IsSignBit = isSignBitCheck(Pred, *C, UnusedBit);

    if (Cmp.isEquality() || (IsSignBit && hasBranchUse(Cmp)))

      return nullptr;


    // Avoid an infinite loop with min/max canonicalization.

    // TODO: This will be unnecessary if we canonicalize to min/max intrinsics.

    if (Cmp.hasOneUse() &&

        match(Cmp.user_back(), m_MaxOrMin(m_Value(), m_Value())))

      return nullptr;


    if (const APInt *EqC = Intersection.getSingleElement())

      return new ICmpInst(ICmpInst::ICMP_EQ, X, Builder.getInt(*EqC));

    if (const APInt *NeC = Difference.getSingleElement())

      return new ICmpInst(ICmpInst::ICMP_NE, X, Builder.getInt(*NeC));

    return nullptr;

  };


  for (BranchInst *BI : DC.conditionsFor(X)) {

    CmpPredicate DomPred;

    const APInt *DomC;

    if (!match(BI->getCondition(),

               m_ICmp(DomPred, m_Specific(X), m_APInt(DomC))))

      continue;


    BasicBlockEdge Edge0(BI->getParent(), BI->getSuccessor(0));

    if (DT.dominates(Edge0, Cmp.getParent())) {

      if (auto *V = handleDomCond(DomPred, DomC))

        return V;

    } else {

      BasicBlockEdge Edge1(BI->getParent(), BI->getSuccessor(1));

      if (DT.dominates(Edge1, Cmp.getParent()))

        if (auto *V =

                handleDomCond(CmpInst::getInversePredicate(DomPred), DomC))

          return V;

    }

  }


  return nullptr;

}


/// Fold icmp (trunc X), C.


Instruction *InstCombinerImpl::foldICmpTruncConstant(ICmpInst &Cmp,

                                                     TruncInst *Trunc,

                                                     const APInt &C) {

  ICmpInst::Predicate Pred = Cmp.getPredicate();

  Value *X = Trunc->getOperand(0);

  Type *SrcTy = X->getType();

  unsigned DstBits = Trunc->getType()->getScalarSizeInBits(),

           SrcBits = SrcTy->getScalarSizeInBits();


  // Match (icmp pred (trunc nuw/nsw X), C)

  // Which we can convert to (icmp pred X, (sext/zext C))

  if (shouldChangeType(Trunc->getType(), SrcTy)) {

    if (Trunc->hasNoSignedWrap())

      return new ICmpInst(Pred, X, ConstantInt::get(SrcTy, C.sext(SrcBits)));

    if (!Cmp.isSigned() && Trunc->hasNoUnsignedWrap())

      return new ICmpInst(Pred, X, ConstantInt::get(SrcTy, C.zext(SrcBits)));

  }


  if (C.isOne() && C.getBitWidth() > 1) {

    // icmp slt trunc(signum(V)) 1 --> icmp slt V, 1

    Value *V = nullptr;

    if (Pred == ICmpInst::ICMP_SLT && match(X, m_Signum(m_Value(V))))

      return new ICmpInst(ICmpInst::ICMP_SLT, V,

                          ConstantInt::get(V->getType(), 1));

  }


  // TODO: Handle any shifted constant by subtracting trailing zeros.

  // TODO: Handle non-equality predicates.

  Value *Y;

  if (Cmp.isEquality() && match(X, m_Shl(m_One(), m_Value(Y)))) {

    // (trunc (1 << Y) to iN) == 0 --> Y u>= N

    // (trunc (1 << Y) to iN) != 0 --> Y u<  N

    if (C.isZero()) {

      auto NewPred = (Pred == Cmp.ICMP_EQ) ? Cmp.ICMP_UGE : Cmp.ICMP_ULT;

      return new ICmpInst(NewPred, Y, ConstantInt::get(SrcTy, DstBits));

    }

    // (trunc (1 << Y) to iN) == 2**C --> Y == C

    // (trunc (1 << Y) to iN) != 2**C --> Y != C

    if (C.isPowerOf2())

      return new ICmpInst(Pred, Y, ConstantInt::get(SrcTy, C.logBase2()));

  }


  if (Cmp.isEquality() && Trunc->hasOneUse()) {

    // Canonicalize to a mask and wider compare if the wide type is suitable:

    // (trunc X to i8) == C --> (X & 0xff) == (zext C)

    if (!SrcTy->isVectorTy() && shouldChangeType(DstBits, SrcBits)) {

      Constant *Mask =

          ConstantInt::get(SrcTy, APInt::getLowBitsSet(SrcBits, DstBits));

      Value *And = Builder.CreateAnd(X, Mask);

      Constant *WideC = ConstantInt::get(SrcTy, C.zext(SrcBits));

      return new ICmpInst(Pred, And, WideC);

    }


    // Simplify icmp eq (trunc x to i8), 42 -> icmp eq x, 42|highbits if all

    // of the high bits truncated out of x are known.

    KnownBits Known = computeKnownBits(X, &Cmp);


    // If all the high bits are known, we can do this xform.

    if ((Known.Zero | Known.One).countl_one() >= SrcBits - DstBits) {

      // Pull in the high bits from known-ones set.

      APInt NewRHS = C.zext(SrcBits);

      NewRHS |= Known.One & APInt::getHighBitsSet(SrcBits, SrcBits - DstBits);

      return new ICmpInst(Pred, X, ConstantInt::get(SrcTy, NewRHS));

    }

  }


  // Look through truncated right-shift of the sign-bit for a sign-bit check:

  // trunc iN (ShOp >> ShAmtC) to i[N - ShAmtC] < 0  --> ShOp <  0

  // trunc iN (ShOp >> ShAmtC) to i[N - ShAmtC] > -1 --> ShOp > -1

  Value *ShOp;

  uint64_t ShAmt;

  bool TrueIfSigned;

  if (isSignBitCheck(Pred, C, TrueIfSigned) &&

      match(X, m_Shr(m_Value(ShOp), m_ConstantInt(ShAmt))) &&

      DstBits == SrcBits - ShAmt) {

    return TrueIfSigned ? new ICmpInst(ICmpInst::ICMP_SLT, ShOp,

                                       ConstantInt::getNullValue(SrcTy))

                        : new ICmpInst(ICmpInst::ICMP_SGT, ShOp,

                                       ConstantInt::getAllOnesValue(SrcTy));

  }


  return nullptr;

}


/// Fold icmp (trunc nuw/nsw X), (trunc nuw/nsw Y).

/// Fold icmp (trunc nuw/nsw X), (zext/sext Y).

Instruction *


InstCombinerImpl::foldICmpTruncWithTruncOrExt(ICmpInst &Cmp,

                                              const SimplifyQuery &Q) {

  Value *X, *Y;

  CmpPredicate Pred;

  bool YIsSExt = false;

  // Try to match icmp (trunc X), (trunc Y)

  if (match(&Cmp, m_ICmp(Pred, m_Trunc(m_Value(X)), m_Trunc(m_Value(Y))))) {

    unsigned NoWrapFlags = cast<TruncInst>(Cmp.getOperand(0))->getNoWrapKind() &

                           cast<TruncInst>(Cmp.getOperand(1))->getNoWrapKind();

    if (Cmp.isSigned()) {

      // For signed comparisons, both truncs must be nsw.

      if (!(NoWrapFlags & TruncInst::NoSignedWrap))

        return nullptr;

    } else {

      // For unsigned and equality comparisons, either both must be nuw or

      // both must be nsw, we don't care which.

      if (!NoWrapFlags)

        return nullptr;

    }


    if (X->getType() != Y->getType() &&

        (!Cmp.getOperand(0)->hasOneUse() || !Cmp.getOperand(1)->hasOneUse()))

      return nullptr;

    if (!isDesirableIntType(X->getType()->getScalarSizeInBits()) &&

        isDesirableIntType(Y->getType()->getScalarSizeInBits())) {

      std::swap(X, Y);

      Pred = Cmp.getSwappedPredicate(Pred);

    }

    YIsSExt = !(NoWrapFlags & TruncInst::NoUnsignedWrap);

  }

  // Try to match icmp (trunc nuw X), (zext Y)

  else if (!Cmp.isSigned() &&

           match(&Cmp, m_c_ICmp(Pred, m_NUWTrunc(m_Value(X)),

                                m_OneUse(m_ZExt(m_Value(Y)))))) {

    // Can fold trunc nuw + zext for unsigned and equality predicates.

  }

  // Try to match icmp (trunc nsw X), (sext Y)

  else if (match(&Cmp, m_c_ICmp(Pred, m_NSWTrunc(m_Value(X)),

                                m_OneUse(m_ZExtOrSExt(m_Value(Y)))))) {

    // Can fold trunc nsw + zext/sext for all predicates.

    YIsSExt =

        isa<SExtInst>(Cmp.getOperand(0)) || isa<SExtInst>(Cmp.getOperand(1));

  } else

    return nullptr;


  Type *TruncTy = Cmp.getOperand(0)->getType();

  unsigned TruncBits = TruncTy->getScalarSizeInBits();


  // If this transform will end up changing from desirable types -> undesirable

  // types skip it.

  if (isDesirableIntType(TruncBits) &&

      !isDesirableIntType(X->getType()->getScalarSizeInBits()))

    return nullptr;


  Value *NewY = Builder.CreateIntCast(Y, X->getType(), YIsSExt);

  return new ICmpInst(Pred, X, NewY);

}


/// Fold icmp (xor X, Y), C.


Instruction *InstCombinerImpl::foldICmpXorConstant(ICmpInst &Cmp,

                                                   BinaryOperator *Xor,

                                                   const APInt &C) {

  if (Instruction *I = foldICmpXorShiftConst(Cmp, Xor, C))

    return I;


  Value *X = Xor->getOperand(0);

  Value *Y = Xor->getOperand(1);

  const APInt *XorC;

  if (!match(Y, m_APInt(XorC)))

    return nullptr;


  // If this is a comparison that tests the signbit (X < 0) or (x > -1),

  // fold the xor.

  ICmpInst::Predicate Pred = Cmp.getPredicate();

  bool TrueIfSigned = false;

  if (isSignBitCheck(Cmp.getPredicate(), C, TrueIfSigned)) {


    // If the sign bit of the XorCst is not set, there is no change to

    // the operation, just stop using the Xor.

    if (!XorC->isNegative())

      return replaceOperand(Cmp, 0, X);


    // Emit the opposite comparison.

    if (TrueIfSigned)

      return new ICmpInst(ICmpInst::ICMP_SGT, X,

                          ConstantInt::getAllOnesValue(X->getType()));

    else

      return new ICmpInst(ICmpInst::ICMP_SLT, X,

                          ConstantInt::getNullValue(X->getType()));

  }


  if (Xor->hasOneUse()) {

    // (icmp u/s (xor X SignMask), C) -> (icmp s/u X, (xor C SignMask))

    if (!Cmp.isEquality() && XorC->isSignMask()) {

      Pred = Cmp.getFlippedSignednessPredicate();

      return new ICmpInst(Pred, X, ConstantInt::get(X->getType(), C ^ *XorC));

    }


    // (icmp u/s (xor X ~SignMask), C) -> (icmp s/u X, (xor C ~SignMask))

    if (!Cmp.isEquality() && XorC->isMaxSignedValue()) {

      Pred = Cmp.getFlippedSignednessPredicate();

      Pred = Cmp.getSwappedPredicate(Pred);

      return new ICmpInst(Pred, X, ConstantInt::get(X->getType(), C ^ *XorC));

    }

  }


  // Mask constant magic can eliminate an 'xor' with unsigned compares.

  if (Pred == ICmpInst::ICMP_UGT) {

    // (xor X, ~C) >u C --> X <u ~C (when C+1 is a power of 2)

    if (*XorC == ~C && (C + 1).isPowerOf2())

      return new ICmpInst(ICmpInst::ICMP_ULT, X, Y);

    // (xor X, C) >u C --> X >u C (when C+1 is a power of 2)

    if (*XorC == C && (C + 1).isPowerOf2())

      return new ICmpInst(ICmpInst::ICMP_UGT, X, Y);

  }

  if (Pred == ICmpInst::ICMP_ULT) {

    // (xor X, -C) <u C --> X >u ~C (when C is a power of 2)

    if (*XorC == -C && C.isPowerOf2())

      return new ICmpInst(ICmpInst::ICMP_UGT, X,

                          ConstantInt::get(X->getType(), ~C));

    // (xor X, C) <u C --> X >u ~C (when -C is a power of 2)

    if (*XorC == C && (-C).isPowerOf2())

      return new ICmpInst(ICmpInst::ICMP_UGT, X,

                          ConstantInt::get(X->getType(), ~C));

  }

  return nullptr;

}


/// For power-of-2 C:

/// ((X s>> ShiftC) ^ X) u< C --> (X + C) u< (C << 1)

/// ((X s>> ShiftC) ^ X) u> (C - 1) --> (X + C) u> ((C << 1) - 1)


Instruction *InstCombinerImpl::foldICmpXorShiftConst(ICmpInst &Cmp,

                                                     BinaryOperator *Xor,

                                                     const APInt &C) {

  CmpInst::Predicate Pred = Cmp.getPredicate();

  APInt PowerOf2;

  if (Pred == ICmpInst::ICMP_ULT)

    PowerOf2 = C;

  else if (Pred == ICmpInst::ICMP_UGT && !C.isMaxValue())

    PowerOf2 = C + 1;

  else

    return nullptr;

  if (!PowerOf2.isPowerOf2())

    return nullptr;

  Value *X;

  const APInt *ShiftC;

  if (!match(Xor, m_OneUse(m_c_Xor(m_Value(X),

                                   m_AShr(m_Deferred(X), m_APInt(ShiftC))))))

    return nullptr;

  uint64_t Shift = ShiftC->getLimitedValue();

  Type *XType = X->getType();

  if (Shift == 0 || PowerOf2.isMinSignedValue())

    return nullptr;

  Value *Add = Builder.CreateAdd(X, ConstantInt::get(XType, PowerOf2));

  APInt Bound =

      Pred == ICmpInst::ICMP_ULT ? PowerOf2 << 1 : ((PowerOf2 << 1) - 1);

  return new ICmpInst(Pred, Add, ConstantInt::get(XType, Bound));

}


/// Fold icmp (and (sh X, Y), C2), C1.


Instruction *InstCombinerImpl::foldICmpAndShift(ICmpInst &Cmp,

                                                BinaryOperator *And,

                                                const APInt &C1,

                                                const APInt &C2) {

  BinaryOperator *Shift = dyn_cast<BinaryOperator>(And->getOperand(0));

  if (!Shift || !Shift->isShift())

    return nullptr;


  // If this is: (X >> C3) & C2 != C1 (where any shift and any compare could

  // exist), turn it into (X & (C2 << C3)) != (C1 << C3). This happens a LOT in

  // code produced by the clang front-end, for bitfield access.

  // This seemingly simple opportunity to fold away a shift turns out to be

  // rather complicated. See PR17827 for details.

  unsigned ShiftOpcode = Shift->getOpcode();

  bool IsShl = ShiftOpcode == Instruction::Shl;

  const APInt *C3;

  if (match(Shift->getOperand(1), m_APInt(C3))) {

    APInt NewAndCst, NewCmpCst;

    bool AnyCmpCstBitsShiftedOut;

    if (ShiftOpcode == Instruction::Shl) {

      // For a left shift, we can fold if the comparison is not signed. We can

      // also fold a signed comparison if the mask value and comparison value

      // are not negative. These constraints may not be obvious, but we can

      // prove that they are correct using an SMT solver.

      if (Cmp.isSigned() && (C2.isNegative() || C1.isNegative()))

        return nullptr;


      NewCmpCst = C1.lshr(*C3);

      NewAndCst = C2.lshr(*C3);

      AnyCmpCstBitsShiftedOut = NewCmpCst.shl(*C3) != C1;

    } else if (ShiftOpcode == Instruction::LShr) {

      // For a logical right shift, we can fold if the comparison is not signed.

      // We can also fold a signed comparison if the shifted mask value and the

      // shifted comparison value are not negative. These constraints may not be

      // obvious, but we can prove that they are correct using an SMT solver.

      NewCmpCst = C1.shl(*C3);

      NewAndCst = C2.shl(*C3);

      AnyCmpCstBitsShiftedOut = NewCmpCst.lshr(*C3) != C1;

      if (Cmp.isSigned() && (NewAndCst.isNegative() || NewCmpCst.isNegative()))

        return nullptr;

    } else {

      // For an arithmetic shift, check that both constants don't use (in a

      // signed sense) the top bits being shifted out.

      assert(ShiftOpcode == Instruction::AShr && "Unknown shift opcode");

      NewCmpCst = C1.shl(*C3);

      NewAndCst = C2.shl(*C3);

      AnyCmpCstBitsShiftedOut = NewCmpCst.ashr(*C3) != C1;

      if (NewAndCst.ashr(*C3) != C2)

        return nullptr;

    }


    if (AnyCmpCstBitsShiftedOut) {

      // If we shifted bits out, the fold is not going to work out. As a

      // special case, check to see if this means that the result is always

      // true or false now.

      if (Cmp.getPredicate() == ICmpInst::ICMP_EQ)

        return replaceInstUsesWith(Cmp, ConstantInt::getFalse(Cmp.getType()));

      if (Cmp.getPredicate() == ICmpInst::ICMP_NE)

        return replaceInstUsesWith(Cmp, ConstantInt::getTrue(Cmp.getType()));

    } else {

      Value *NewAnd = Builder.CreateAnd(

          Shift->getOperand(0), ConstantInt::get(And->getType(), NewAndCst));

      return new ICmpInst(Cmp.getPredicate(), NewAnd,

                          ConstantInt::get(And->getType(), NewCmpCst));

    }

  }


  // Turn ((X >> Y) & C2) == 0  into  (X & (C2 << Y)) == 0.  The latter is

  // preferable because it allows the C2 << Y expression to be hoisted out of a

  // loop if Y is invariant and X is not.

  if (Shift->hasOneUse() && C1.isZero() && Cmp.isEquality() &&

      !Shift->isArithmeticShift() &&

      ((!IsShl && C2.isOne()) || !isa<Constant>(Shift->getOperand(0)))) {

    // Compute C2 << Y.

    Value *NewShift =

        IsShl ? Builder.CreateLShr(And->getOperand(1), Shift->getOperand(1))

              : Builder.CreateShl(And->getOperand(1), Shift->getOperand(1));


    // Compute X & (C2 << Y).

    Value *NewAnd = Builder.CreateAnd(Shift->getOperand(0), NewShift);

    return new ICmpInst(Cmp.getPredicate(), NewAnd, Cmp.getOperand(1));

  }


  return nullptr;

}


/// Fold icmp (and X, C2), C1.


Instruction *InstCombinerImpl::foldICmpAndConstConst(ICmpInst &Cmp,

                                                     BinaryOperator *And,

                                                     const APInt &C1) {

  bool isICMP_NE = Cmp.getPredicate() == ICmpInst::ICMP_NE;


  // For vectors: icmp ne (and X, 1), 0 --> trunc X to N x i1

  // TODO: We canonicalize to the longer form for scalars because we have

  // better analysis/folds for icmp, and codegen may be better with icmp.

  if (isICMP_NE && Cmp.getType()->isVectorTy() && C1.isZero() &&

      match(And->getOperand(1), m_One()))

    return new TruncInst(And->getOperand(0), Cmp.getType());


  const APInt *C2;

  Value *X;

  if (!match(And, m_And(m_Value(X), m_APInt(C2))))

    return nullptr;


  // (and X, highmask) s> [0, ~highmask] --> X s> ~highmask

  if (Cmp.getPredicate() == ICmpInst::ICMP_SGT && C1.ule(~*C2) &&

      C2->isNegatedPowerOf2())

    return new ICmpInst(ICmpInst::ICMP_SGT, X,

                        ConstantInt::get(X->getType(), ~*C2));

  // (and X, highmask) s< [1, -highmask] --> X s< -highmask

  if (Cmp.getPredicate() == ICmpInst::ICMP_SLT && !C1.isSignMask() &&

      (C1 - 1).ule(~*C2) && C2->isNegatedPowerOf2() && !C2->isSignMask())

    return new ICmpInst(ICmpInst::ICMP_SLT, X,

                        ConstantInt::get(X->getType(), -*C2));


  // Don't perform the following transforms if the AND has multiple uses

  if (!And->hasOneUse())

    return nullptr;


  if (Cmp.isEquality() && C1.isZero()) {

    // Restrict this fold to single-use 'and' (PR10267).

    // Replace (and X, (1 << size(X)-1) != 0) with X s< 0

    if (C2->isSignMask()) {

      Constant *Zero = Constant::getNullValue(X->getType());

      auto NewPred = isICMP_NE ? ICmpInst::ICMP_SLT : ICmpInst::ICMP_SGE;

      return new ICmpInst(NewPred, X, Zero);

    }


    APInt NewC2 = *C2;

    KnownBits Know = computeKnownBits(And->getOperand(0), And);

    // Set high zeros of C2 to allow matching negated power-of-2.

    NewC2 = *C2 | APInt::getHighBitsSet(C2->getBitWidth(),

                                        Know.countMinLeadingZeros());


    // Restrict this fold only for single-use 'and' (PR10267).

    // ((%x & C) == 0) --> %x u< (-C)  iff (-C) is power of two.

    if (NewC2.isNegatedPowerOf2()) {

      Constant *NegBOC = ConstantInt::get(And->getType(), -NewC2);

      auto NewPred = isICMP_NE ? ICmpInst::ICMP_UGE : ICmpInst::ICMP_ULT;

      return new ICmpInst(NewPred, X, NegBOC);

    }

  }


  // If the LHS is an 'and' of a truncate and we can widen the and/compare to

  // the input width without changing the value produced, eliminate the cast:

  //

  // icmp (and (trunc W), C2), C1 -> icmp (and W, C2'), C1'

  //

  // We can do this transformation if the constants do not have their sign bits

  // set or if it is an equality comparison. Extending a relational comparison

  // when we're checking the sign bit would not work.

  Value *W;

  if (match(And->getOperand(0), m_OneUse(m_Trunc(m_Value(W)))) &&

      (Cmp.isEquality() || (!C1.isNegative() && !C2->isNegative()))) {

    // TODO: Is this a good transform for vectors? Wider types may reduce

    // throughput. Should this transform be limited (even for scalars) by using

    // shouldChangeType()?

    if (!Cmp.getType()->isVectorTy()) {

      Type *WideType = W->getType();

      unsigned WideScalarBits = WideType->getScalarSizeInBits();

      Constant *ZextC1 = ConstantInt::get(WideType, C1.zext(WideScalarBits));

      Constant *ZextC2 = ConstantInt::get(WideType, C2->zext(WideScalarBits));

      Value *NewAnd = Builder.CreateAnd(W, ZextC2, And->getName());

      return new ICmpInst(Cmp.getPredicate(), NewAnd, ZextC1);

    }

  }


  if (Instruction *I = foldICmpAndShift(Cmp, And, C1, *C2))

    return I;


  // (icmp pred (and (or (lshr A, B), A), 1), 0) -->

  // (icmp pred (and A, (or (shl 1, B), 1), 0))

  //

  // iff pred isn't signed

  if (!Cmp.isSigned() && C1.isZero() && And->getOperand(0)->hasOneUse() &&

      match(And->getOperand(1), m_One())) {

    Constant *One = cast<Constant>(And->getOperand(1));

    Value *Or = And->getOperand(0);

    Value *A, *B, *LShr;

    if (match(Or, m_Or(m_Value(LShr), m_Value(A))) &&

        match(LShr, m_LShr(m_Specific(A), m_Value(B)))) {

      unsigned UsesRemoved = 0;

      if (And->hasOneUse())

        ++UsesRemoved;

      if (Or->hasOneUse())

        ++UsesRemoved;

      if (LShr->hasOneUse())

        ++UsesRemoved;


      // Compute A & ((1 << B) | 1)

      unsigned RequireUsesRemoved = match(B, m_ImmConstant()) ? 1 : 3;

      if (UsesRemoved >= RequireUsesRemoved) {

        Value *NewOr =

            Builder.CreateOr(Builder.CreateShl(One, B, LShr->getName(),

                                               /*HasNUW=*/true),

                             One, Or->getName());

        Value *NewAnd = Builder.CreateAnd(A, NewOr, And->getName());

        return new ICmpInst(Cmp.getPredicate(), NewAnd, Cmp.getOperand(1));

      }

    }

  }


  // (icmp eq (and (bitcast X to int), ExponentMask), ExponentMask) -->

  // llvm.is.fpclass(X, fcInf|fcNan)

  // (icmp ne (and (bitcast X to int), ExponentMask), ExponentMask) -->

  // llvm.is.fpclass(X, ~(fcInf|fcNan))

  // (icmp eq (and (bitcast X to int), ExponentMask), 0) -->

  // llvm.is.fpclass(X, fcSubnormal|fcZero)

  // (icmp ne (and (bitcast X to int), ExponentMask), 0) -->

  // llvm.is.fpclass(X, ~(fcSubnormal|fcZero))

  Value *V;

  if (!Cmp.getParent()->getParent()->hasFnAttribute(

          Attribute::NoImplicitFloat) &&

      Cmp.isEquality() &&

      match(X, m_OneUse(m_ElementWiseBitCast(m_Value(V))))) {

    Type *FPType = V->getType()->getScalarType();

    if (FPType->isIEEELikeFPTy() && (C1.isZero() || C1 == *C2)) {

      APInt ExponentMask =

          APFloat::getInf(FPType->getFltSemantics()).bitcastToAPInt();

      if (*C2 == ExponentMask) {

        unsigned Mask = C1.isZero()

                            ? FPClassTest::fcZero | FPClassTest::fcSubnormal

                            : FPClassTest::fcNan | FPClassTest::fcInf;

        if (isICMP_NE)

          Mask = ~Mask & fcAllFlags;

        return replaceInstUsesWith(Cmp, Builder.createIsFPClass(V, Mask));

      }

    }

  }


  return nullptr;

}


/// Fold icmp (and X, Y), C.


Instruction *InstCombinerImpl::foldICmpAndConstant(ICmpInst &Cmp,

                                                   BinaryOperator *And,

                                                   const APInt &C) {

  if (Instruction *I = foldICmpAndConstConst(Cmp, And, C))

    return I;


  const ICmpInst::Predicate Pred = Cmp.getPredicate();

  bool TrueIfNeg;

  if (isSignBitCheck(Pred, C, TrueIfNeg)) {

    // ((X - 1) & ~X) <  0 --> X == 0

    // ((X - 1) & ~X) >= 0 --> X != 0

    Value *X;

    if (match(And->getOperand(0), m_Add(m_Value(X), m_AllOnes())) &&

        match(And->getOperand(1), m_Not(m_Specific(X)))) {

      auto NewPred = TrueIfNeg ? CmpInst::ICMP_EQ : CmpInst::ICMP_NE;

      return new ICmpInst(NewPred, X, ConstantInt::getNullValue(X->getType()));

    }

    // (X & -X) <  0 --> X == MinSignedC

    // (X & -X) > -1 --> X != MinSignedC

    if (match(And, m_c_And(m_Neg(m_Value(X)), m_Deferred(X)))) {

      Constant *MinSignedC = ConstantInt::get(

          X->getType(),

          APInt::getSignedMinValue(X->getType()->getScalarSizeInBits()));

      auto NewPred = TrueIfNeg ? CmpInst::ICMP_EQ : CmpInst::ICMP_NE;

      return new ICmpInst(NewPred, X, MinSignedC);

    }

  }


  // TODO: These all require that Y is constant too, so refactor with the above.


  // Try to optimize things like "A[i] & 42 == 0" to index computations.

  Value *X = And->getOperand(0);

  Value *Y = And->getOperand(1);

  if (auto *C2 = dyn_cast<ConstantInt>(Y))

    if (auto *LI = dyn_cast<LoadInst>(X))

      if (auto *GEP = dyn_cast<GetElementPtrInst>(LI->getOperand(0)))

        if (Instruction *Res = foldCmpLoadFromIndexedGlobal(LI, GEP, Cmp, C2))

          return Res;


  if (!Cmp.isEquality())

    return nullptr;


  // X & -C == -C -> X >  u ~C

  // X & -C != -C -> X <= u ~C

  //   iff C is a power of 2

  if (Cmp.getOperand(1) == Y && C.isNegatedPowerOf2()) {

    auto NewPred =

        Pred == CmpInst::ICMP_EQ ? CmpInst::ICMP_UGT : CmpInst::ICMP_ULE;

    return new ICmpInst(NewPred, X, SubOne(cast<Constant>(Cmp.getOperand(1))));

  }


  // ((zext i1 X) & Y) == 0 --> !((trunc Y) & X)

  // ((zext i1 X) & Y) != 0 -->  ((trunc Y) & X)

  // ((zext i1 X) & Y) == 1 -->  ((trunc Y) & X)

  // ((zext i1 X) & Y) != 1 --> !((trunc Y) & X)

  if (match(And, m_OneUse(m_c_And(m_OneUse(m_ZExt(m_Value(X))), m_Value(Y)))) &&

      X->getType()->isIntOrIntVectorTy(1) && (C.isZero() || C.isOne())) {

    Value *TruncY = Builder.CreateTrunc(Y, X->getType());

    if (C.isZero() ^ (Pred == CmpInst::ICMP_NE)) {

      Value *And = Builder.CreateAnd(TruncY, X);

      return BinaryOperator::CreateNot(And);

    }

    return BinaryOperator::CreateAnd(TruncY, X);

  }


  // (icmp eq/ne (and (shl -1, X), Y), 0)

  //    -> (icmp eq/ne (lshr Y, X), 0)

  // We could technically handle any C == 0 or (C < 0 && isOdd(C)) but it seems

  // highly unlikely the non-zero case will ever show up in code.

  if (C.isZero() &&

      match(And, m_OneUse(m_c_And(m_OneUse(m_Shl(m_AllOnes(), m_Value(X))),

                                  m_Value(Y))))) {

    Value *LShr = Builder.CreateLShr(Y, X);

    return new ICmpInst(Pred, LShr, Constant::getNullValue(LShr->getType()));

  }


  // (icmp eq/ne (and (add A, Addend), Msk), C)

  //    -> (icmp eq/ne (and A, Msk), (and (sub C, Addend), Msk))

  {

    Value *A;

    const APInt *Addend, *Msk;

    if (match(And, m_And(m_OneUse(m_Add(m_Value(A), m_APInt(Addend))),

                         m_LowBitMask(Msk))) &&

        C.ule(*Msk)) {

      APInt NewComperand = (C - *Addend) & *Msk;

      Value *MaskA = Builder.CreateAnd(A, ConstantInt::get(A->getType(), *Msk));

      return new ICmpInst(Pred, MaskA,

                          ConstantInt::get(MaskA->getType(), NewComperand));

    }

  }


  return nullptr;

}


/// Fold icmp eq/ne (or (xor/sub (X1, X2), xor/sub (X3, X4))), 0.


static Value *foldICmpOrXorSubChain(ICmpInst &Cmp, BinaryOperator *Or,

                                    InstCombiner::BuilderTy &Builder) {

  // Are we using xors or subs to bitwise check for a pair or pairs of

  // (in)equalities? Convert to a shorter form that has more potential to be

  // folded even further.

  // ((X1 ^/- X2) || (X3 ^/- X4)) == 0 --> (X1 == X2) && (X3 == X4)

  // ((X1 ^/- X2) || (X3 ^/- X4)) != 0 --> (X1 != X2) || (X3 != X4)

  // ((X1 ^/- X2) || (X3 ^/- X4) || (X5 ^/- X6)) == 0 -->

  // (X1 == X2) && (X3 == X4) && (X5 == X6)

  // ((X1 ^/- X2) || (X3 ^/- X4) || (X5 ^/- X6)) != 0 -->

  // (X1 != X2) || (X3 != X4) || (X5 != X6)

  SmallVector<std::pair<Value *, Value *>, 2> CmpValues;

  SmallVector<Value *, 16> WorkList(1, Or);


  while (!WorkList.empty()) {

    auto MatchOrOperatorArgument = [&](Value *OrOperatorArgument) {

      Value *Lhs, *Rhs;


      if (match(OrOperatorArgument,

                m_OneUse(m_Xor(m_Value(Lhs), m_Value(Rhs))))) {

        CmpValues.emplace_back(Lhs, Rhs);

        return;

      }


      if (match(OrOperatorArgument,

                m_OneUse(m_Sub(m_Value(Lhs), m_Value(Rhs))))) {

        CmpValues.emplace_back(Lhs, Rhs);

        return;

      }


      WorkList.push_back(OrOperatorArgument);

    };


    Value *CurrentValue = WorkList.pop_back_val();

    Value *OrOperatorLhs, *OrOperatorRhs;


    if (!match(CurrentValue,

               m_Or(m_Value(OrOperatorLhs), m_Value(OrOperatorRhs)))) {

      return nullptr;

    }


    MatchOrOperatorArgument(OrOperatorRhs);

    MatchOrOperatorArgument(OrOperatorLhs);

  }


  ICmpInst::Predicate Pred = Cmp.getPredicate();

  auto BOpc = Pred == CmpInst::ICMP_EQ ? Instruction::And : Instruction::Or;

  Value *LhsCmp = Builder.CreateICmp(Pred, CmpValues.rbegin()->first,

                                     CmpValues.rbegin()->second);


  for (auto It = CmpValues.rbegin() + 1; It != CmpValues.rend(); ++It) {

    Value *RhsCmp = Builder.CreateICmp(Pred, It->first, It->second);

    LhsCmp = Builder.CreateBinOp(BOpc, LhsCmp, RhsCmp);

  }


  return LhsCmp;

}


/// Fold icmp (or X, Y), C.


Instruction *InstCombinerImpl::foldICmpOrConstant(ICmpInst &Cmp,

                                                  BinaryOperator *Or,

                                                  const APInt &C) {

  ICmpInst::Predicate Pred = Cmp.getPredicate();

  if (C.isOne()) {

    // icmp slt signum(V) 1 --> icmp slt V, 1

    Value *V = nullptr;

    if (Pred == ICmpInst::ICMP_SLT && match(Or, m_Signum(m_Value(V))))

      return new ICmpInst(ICmpInst::ICMP_SLT, V,

                          ConstantInt::get(V->getType(), 1));

  }


  Value *OrOp0 = Or->getOperand(0), *OrOp1 = Or->getOperand(1);


  // (icmp eq/ne (or disjoint x, C0), C1)

  //    -> (icmp eq/ne x, C0^C1)

  if (Cmp.isEquality() && match(OrOp1, m_ImmConstant()) &&

      cast<PossiblyDisjointInst>(Or)->isDisjoint()) {

    Value *NewC =

        Builder.CreateXor(OrOp1, ConstantInt::get(OrOp1->getType(), C));

    return new ICmpInst(Pred, OrOp0, NewC);

  }


  const APInt *MaskC;

  if (match(OrOp1, m_APInt(MaskC)) && Cmp.isEquality()) {

    if (*MaskC == C && (C + 1).isPowerOf2()) {

      // X | C == C --> X <=u C

      // X | C != C --> X  >u C

      //   iff C+1 is a power of 2 (C is a bitmask of the low bits)

      Pred = (Pred == CmpInst::ICMP_EQ) ? CmpInst::ICMP_ULE : CmpInst::ICMP_UGT;

      return new ICmpInst(Pred, OrOp0, OrOp1);

    }


    // More general: canonicalize 'equality with set bits mask' to

    // 'equality with clear bits mask'.

    // (X | MaskC) == C --> (X & ~MaskC) == C ^ MaskC

    // (X | MaskC) != C --> (X & ~MaskC) != C ^ MaskC

    if (Or->hasOneUse()) {

      Value *And = Builder.CreateAnd(OrOp0, ~(*MaskC));

      Constant *NewC = ConstantInt::get(Or->getType(), C ^ (*MaskC));

      return new ICmpInst(Pred, And, NewC);

    }

  }


  // (X | (X-1)) s<  0 --> X s< 1

  // (X | (X-1)) s> -1 --> X s> 0

  Value *X;

  bool TrueIfSigned;

  if (isSignBitCheck(Pred, C, TrueIfSigned) &&

      match(Or, m_c_Or(m_Add(m_Value(X), m_AllOnes()), m_Deferred(X)))) {

    auto NewPred = TrueIfSigned ? ICmpInst::ICMP_SLT : ICmpInst::ICMP_SGT;

    Constant *NewC = ConstantInt::get(X->getType(), TrueIfSigned ? 1 : 0);

    return new ICmpInst(NewPred, X, NewC);

  }


  const APInt *OrC;

  // icmp(X | OrC, C) --> icmp(X, 0)

  if (C.isNonNegative() && match(Or, m_Or(m_Value(X), m_APInt(OrC)))) {

    switch (Pred) {

    // X | OrC s< C --> X s< 0 iff OrC s>= C s>= 0

    case ICmpInst::ICMP_SLT:

    // X | OrC s>= C --> X s>= 0 iff OrC s>= C s>= 0

    case ICmpInst::ICMP_SGE:

      if (OrC->sge(C))

        return new ICmpInst(Pred, X, ConstantInt::getNullValue(X->getType()));

      break;

    // X | OrC s<= C --> X s< 0 iff OrC s> C s>= 0

    case ICmpInst::ICMP_SLE:

    // X | OrC s> C --> X s>= 0 iff OrC s> C s>= 0

    case ICmpInst::ICMP_SGT:

      if (OrC->sgt(C))

        return new ICmpInst(ICmpInst::getFlippedStrictnessPredicate(Pred), X,

                            ConstantInt::getNullValue(X->getType()));

      break;

    default:

      break;

    }

  }


  if (!Cmp.isEquality() || !C.isZero() || !Or->hasOneUse())

    return nullptr;


  Value *P, *Q;

  if (match(Or, m_Or(m_PtrToInt(m_Value(P)), m_PtrToInt(m_Value(Q))))) {

    // Simplify icmp eq (or (ptrtoint P), (ptrtoint Q)), 0

    // -> and (icmp eq P, null), (icmp eq Q, null).

    Value *CmpP =

        Builder.CreateICmp(Pred, P, ConstantInt::getNullValue(P->getType()));

    Value *CmpQ =

        Builder.CreateICmp(Pred, Q, ConstantInt::getNullValue(Q->getType()));

    auto BOpc = Pred == CmpInst::ICMP_EQ ? Instruction::And : Instruction::Or;

    return BinaryOperator::Create(BOpc, CmpP, CmpQ);

  }


  if (Value *V = foldICmpOrXorSubChain(Cmp, Or, Builder))

    return replaceInstUsesWith(Cmp, V);


  return nullptr;

}


/// Fold icmp (mul X, Y), C.


Instruction *InstCombinerImpl::foldICmpMulConstant(ICmpInst &Cmp,

                                                   BinaryOperator *Mul,

                                                   const APInt &C) {

  ICmpInst::Predicate Pred = Cmp.getPredicate();

  Type *MulTy = Mul->getType();

  Value *X = Mul->getOperand(0);


  // If there's no overflow:

  // X * X == 0 --> X == 0

  // X * X != 0 --> X != 0

  if (Cmp.isEquality() && C.isZero() && X == Mul->getOperand(1) &&

      (Mul->hasNoUnsignedWrap() || Mul->hasNoSignedWrap()))

    return new ICmpInst(Pred, X, ConstantInt::getNullValue(MulTy));


  const APInt *MulC;

  if (!match(Mul->getOperand(1), m_APInt(MulC)))

    return nullptr;


  // If this is a test of the sign bit and the multiply is sign-preserving with

  // a constant operand, use the multiply LHS operand instead:

  // (X * +MulC) < 0 --> X < 0

  // (X * -MulC) < 0 --> X > 0

  if (isSignTest(Pred, C) && Mul->hasNoSignedWrap()) {

    if (MulC->isNegative())

      Pred = ICmpInst::getSwappedPredicate(Pred);

    return new ICmpInst(Pred, X, ConstantInt::getNullValue(MulTy));

  }


  if (MulC->isZero())

    return nullptr;


  // If the multiply does not wrap or the constant is odd, try to divide the

  // compare constant by the multiplication factor.

  if (Cmp.isEquality()) {

    // (mul nsw X, MulC) eq/ne C --> X eq/ne C /s MulC

    if (Mul->hasNoSignedWrap() && C.srem(*MulC).isZero()) {

      Constant *NewC = ConstantInt::get(MulTy, C.sdiv(*MulC));

      return new ICmpInst(Pred, X, NewC);

    }


    // C % MulC == 0 is weaker than we could use if MulC is odd because it

    // correct to transform if MulC * N == C including overflow. I.e with i8

    // (icmp eq (mul X, 5), 101) -> (icmp eq X, 225) but since 101 % 5 != 0, we

    // miss that case.

    if (C.urem(*MulC).isZero()) {

      // (mul nuw X, MulC) eq/ne C --> X eq/ne C /u MulC

      // (mul X, OddC) eq/ne N * C --> X eq/ne N

      if ((*MulC & 1).isOne() || Mul->hasNoUnsignedWrap()) {

        Constant *NewC = ConstantInt::get(MulTy, C.udiv(*MulC));

        return new ICmpInst(Pred, X, NewC);

      }

    }

  }


  // With a matching no-overflow guarantee, fold the constants:

  // (X * MulC) < C --> X < (C / MulC)

  // (X * MulC) > C --> X > (C / MulC)

  // TODO: Assert that Pred is not equal to SGE, SLE, UGE, ULE?

  Constant *NewC = nullptr;

  if (Mul->hasNoSignedWrap() && ICmpInst::isSigned(Pred)) {

    // MININT / -1 --> overflow.

    if (C.isMinSignedValue() && MulC->isAllOnes())

      return nullptr;

    if (MulC->isNegative())

      Pred = ICmpInst::getSwappedPredicate(Pred);


    if (Pred == ICmpInst::ICMP_SLT || Pred == ICmpInst::ICMP_SGE) {

      NewC = ConstantInt::get(

          MulTy, APIntOps::RoundingSDiv(C, *MulC, APInt::Rounding::UP));

    } else {

      assert((Pred == ICmpInst::ICMP_SLE || Pred == ICmpInst::ICMP_SGT) &&

             "Unexpected predicate");

      NewC = ConstantInt::get(

          MulTy, APIntOps::RoundingSDiv(C, *MulC, APInt::Rounding::DOWN));

    }

  } else if (Mul->hasNoUnsignedWrap() && ICmpInst::isUnsigned(Pred)) {

    if (Pred == ICmpInst::ICMP_ULT || Pred == ICmpInst::ICMP_UGE) {

      NewC = ConstantInt::get(

          MulTy, APIntOps::RoundingUDiv(C, *MulC, APInt::Rounding::UP));

    } else {

      assert((Pred == ICmpInst::ICMP_ULE || Pred == ICmpInst::ICMP_UGT) &&

             "Unexpected predicate");

      NewC = ConstantInt::get(

          MulTy, APIntOps::RoundingUDiv(C, *MulC, APInt::Rounding::DOWN));

    }

  }


  return NewC ? new ICmpInst(Pred, X, NewC) : nullptr;

}


/// Fold icmp (shl nuw C2, Y), C.


static Instruction *foldICmpShlLHSC(ICmpInst &Cmp, Instruction *Shl,

                                    const APInt &C) {

  Value *Y;

  const APInt *C2;

  if (!match(Shl, m_NUWShl(m_APInt(C2), m_Value(Y))))

    return nullptr;


  Type *ShiftType = Shl->getType();

  unsigned TypeBits = C.getBitWidth();

  ICmpInst::Predicate Pred = Cmp.getPredicate();

  if (Cmp.isUnsigned()) {

    if (C2->isZero() || C2->ugt(C))

      return nullptr;

    APInt Div, Rem;

    APInt::udivrem(C, *C2, Div, Rem);

    bool CIsPowerOf2 = Rem.isZero() && Div.isPowerOf2();


    // (1 << Y) pred C -> Y pred Log2(C)

    if (!CIsPowerOf2) {

      // (1 << Y) <  30 -> Y <= 4

      // (1 << Y) <= 30 -> Y <= 4

      // (1 << Y) >= 30 -> Y >  4

      // (1 << Y) >  30 -> Y >  4

      if (Pred == ICmpInst::ICMP_ULT)

        Pred = ICmpInst::ICMP_ULE;

      else if (Pred == ICmpInst::ICMP_UGE)

        Pred = ICmpInst::ICMP_UGT;

    }


    unsigned CLog2 = Div.logBase2();

    return new ICmpInst(Pred, Y, ConstantInt::get(ShiftType, CLog2));

  } else if (Cmp.isSigned() && C2->isOne()) {

    Constant *BitWidthMinusOne = ConstantInt::get(ShiftType, TypeBits - 1);

    // (1 << Y) >  0 -> Y != 31

    // (1 << Y) >  C -> Y != 31 if C is negative.

    if (Pred == ICmpInst::ICMP_SGT && C.sle(0))

      return new ICmpInst(ICmpInst::ICMP_NE, Y, BitWidthMinusOne);


    // (1 << Y) <  0 -> Y == 31

    // (1 << Y) <  1 -> Y == 31

    // (1 << Y) <  C -> Y == 31 if C is negative and not signed min.

    // Exclude signed min by subtracting 1 and lower the upper bound to 0.

    if (Pred == ICmpInst::ICMP_SLT && (C - 1).sle(0))

      return new ICmpInst(ICmpInst::ICMP_EQ, Y, BitWidthMinusOne);

  }


  return nullptr;

}


/// Fold icmp (shl X, Y), C.


Instruction *InstCombinerImpl::foldICmpShlConstant(ICmpInst &Cmp,

                                                   BinaryOperator *Shl,

                                                   const APInt &C) {

  const APInt *ShiftVal;

  if (Cmp.isEquality() && match(Shl->getOperand(0), m_APInt(ShiftVal)))

    return foldICmpShlConstConst(Cmp, Shl->getOperand(1), C, *ShiftVal);


  ICmpInst::Predicate Pred = Cmp.getPredicate();

  // (icmp pred (shl nuw&nsw X, Y), Csle0)

  //      -> (icmp pred X, Csle0)

  //

  // The idea is the nuw/nsw essentially freeze the sign bit for the shift op

  // so X's must be what is used.

  if (C.sle(0) && Shl->hasNoUnsignedWrap() && Shl->hasNoSignedWrap())

    return new ICmpInst(Pred, Shl->getOperand(0), Cmp.getOperand(1));


  // (icmp eq/ne (shl nuw|nsw X, Y), 0)

  //      -> (icmp eq/ne X, 0)

  if (ICmpInst::isEquality(Pred) && C.isZero() &&

      (Shl->hasNoUnsignedWrap() || Shl->hasNoSignedWrap()))

    return new ICmpInst(Pred, Shl->getOperand(0), Cmp.getOperand(1));


  // (icmp slt (shl nsw X, Y), 0/1)

  //      -> (icmp slt X, 0/1)

  // (icmp sgt (shl nsw X, Y), 0/-1)

  //      -> (icmp sgt X, 0/-1)

  //

  // NB: sge/sle with a constant will canonicalize to sgt/slt.

  if (Shl->hasNoSignedWrap() &&

      (Pred == ICmpInst::ICMP_SGT || Pred == ICmpInst::ICMP_SLT))

    if (C.isZero() || (Pred == ICmpInst::ICMP_SGT ? C.isAllOnes() : C.isOne()))

      return new ICmpInst(Pred, Shl->getOperand(0), Cmp.getOperand(1));


  const APInt *ShiftAmt;

  if (!match(Shl->getOperand(1), m_APInt(ShiftAmt)))

    return foldICmpShlLHSC(Cmp, Shl, C);


  // Check that the shift amount is in range. If not, don't perform undefined

  // shifts. When the shift is visited, it will be simplified.

  unsigned TypeBits = C.getBitWidth();

  if (ShiftAmt->uge(TypeBits))

    return nullptr;


  Value *X = Shl->getOperand(0);

  Type *ShType = Shl->getType();


  // NSW guarantees that we are only shifting out sign bits from the high bits,

  // so we can ASHR the compare constant without needing a mask and eliminate

  // the shift.

  if (Shl->hasNoSignedWrap()) {

    if (Pred == ICmpInst::ICMP_SGT) {

      // icmp Pred (shl nsw X, ShiftAmt), C --> icmp Pred X, (C >>s ShiftAmt)

      APInt ShiftedC = C.ashr(*ShiftAmt);

      return new ICmpInst(Pred, X, ConstantInt::get(ShType, ShiftedC));

    }

    if ((Pred == ICmpInst::ICMP_EQ || Pred == ICmpInst::ICMP_NE) &&

        C.ashr(*ShiftAmt).shl(*ShiftAmt) == C) {

      APInt ShiftedC = C.ashr(*ShiftAmt);

      return new ICmpInst(Pred, X, ConstantInt::get(ShType, ShiftedC));

    }

    if (Pred == ICmpInst::ICMP_SLT) {

      // SLE is the same as above, but SLE is canonicalized to SLT, so convert:

      // (X << S) <=s C is equiv to X <=s (C >> S) for all C

      // (X << S) <s (C + 1) is equiv to X <s (C >> S) + 1 if C <s SMAX

      // (X << S) <s C is equiv to X <s ((C - 1) >> S) + 1 if C >s SMIN

      assert(!C.isMinSignedValue() && "Unexpected icmp slt");

      APInt ShiftedC = (C - 1).ashr(*ShiftAmt) + 1;

      return new ICmpInst(Pred, X, ConstantInt::get(ShType, ShiftedC));

    }

  }


  // NUW guarantees that we are only shifting out zero bits from the high bits,

  // so we can LSHR the compare constant without needing a mask and eliminate

  // the shift.

  if (Shl->hasNoUnsignedWrap()) {

    if (Pred == ICmpInst::ICMP_UGT) {

      // icmp Pred (shl nuw X, ShiftAmt), C --> icmp Pred X, (C >>u ShiftAmt)

      APInt ShiftedC = C.lshr(*ShiftAmt);

      return new ICmpInst(Pred, X, ConstantInt::get(ShType, ShiftedC));

    }

    if ((Pred == ICmpInst::ICMP_EQ || Pred == ICmpInst::ICMP_NE) &&

        C.lshr(*ShiftAmt).shl(*ShiftAmt) == C) {

      APInt ShiftedC = C.lshr(*ShiftAmt);

      return new ICmpInst(Pred, X, ConstantInt::get(ShType, ShiftedC));

    }

    if (Pred == ICmpInst::ICMP_ULT) {

      // ULE is the same as above, but ULE is canonicalized to ULT, so convert:

      // (X << S) <=u C is equiv to X <=u (C >> S) for all C

      // (X << S) <u (C + 1) is equiv to X <u (C >> S) + 1 if C <u ~0u

      // (X << S) <u C is equiv to X <u ((C - 1) >> S) + 1 if C >u 0

      assert(C.ugt(0) && "ult 0 should have been eliminated");

      APInt ShiftedC = (C - 1).lshr(*ShiftAmt) + 1;

      return new ICmpInst(Pred, X, ConstantInt::get(ShType, ShiftedC));

    }

  }


  if (Cmp.isEquality() && Shl->hasOneUse()) {

    // Strength-reduce the shift into an 'and'.

    Constant *Mask = ConstantInt::get(

        ShType,

        APInt::getLowBitsSet(TypeBits, TypeBits - ShiftAmt->getZExtValue()));

    Value *And = Builder.CreateAnd(X, Mask, Shl->getName() + ".mask");

    Constant *LShrC = ConstantInt::get(ShType, C.lshr(*ShiftAmt));

    return new ICmpInst(Pred, And, LShrC);

  }


  // Otherwise, if this is a comparison of the sign bit, simplify to and/test.

  bool TrueIfSigned = false;

  if (Shl->hasOneUse() && isSignBitCheck(Pred, C, TrueIfSigned)) {

    // (X << 31) <s 0  --> (X & 1) != 0

    Constant *Mask = ConstantInt::get(

        ShType,

        APInt::getOneBitSet(TypeBits, TypeBits - ShiftAmt->getZExtValue() - 1));

    Value *And = Builder.CreateAnd(X, Mask, Shl->getName() + ".mask");

    return new ICmpInst(TrueIfSigned ? ICmpInst::ICMP_NE : ICmpInst::ICMP_EQ,

                        And, Constant::getNullValue(ShType));

  }


  // Simplify 'shl' inequality test into 'and' equality test.

  if (Cmp.isUnsigned() && Shl->hasOneUse()) {

    // (X l<< C2) u<=/u> C1 iff C1+1 is power of two -> X & (~C1 l>> C2) ==/!= 0

    if ((C + 1).isPowerOf2() &&

        (Pred == ICmpInst::ICMP_ULE || Pred == ICmpInst::ICMP_UGT)) {

      Value *And = Builder.CreateAnd(X, (~C).lshr(ShiftAmt->getZExtValue()));

      return new ICmpInst(Pred == ICmpInst::ICMP_ULE ? ICmpInst::ICMP_EQ

                                                     : ICmpInst::ICMP_NE,

                          And, Constant::getNullValue(ShType));

    }

    // (X l<< C2) u</u>= C1 iff C1 is power of two -> X & (-C1 l>> C2) ==/!= 0

    if (C.isPowerOf2() &&

        (Pred == ICmpInst::ICMP_ULT || Pred == ICmpInst::ICMP_UGE)) {

      Value *And =

          Builder.CreateAnd(X, (~(C - 1)).lshr(ShiftAmt->getZExtValue()));

      return new ICmpInst(Pred == ICmpInst::ICMP_ULT ? ICmpInst::ICMP_EQ

                                                     : ICmpInst::ICMP_NE,

                          And, Constant::getNullValue(ShType));

    }

  }


  // Transform (icmp pred iM (shl iM %v, N), C)

  // -> (icmp pred i(M-N) (trunc %v iM to i(M-N)), (trunc (C>>N))

  // Transform the shl to a trunc if (trunc (C>>N)) has no loss and M-N.

  // This enables us to get rid of the shift in favor of a trunc that may be

  // free on the target. It has the additional benefit of comparing to a

  // smaller constant that may be more target-friendly.

  unsigned Amt = ShiftAmt->getLimitedValue(TypeBits - 1);

  if (Shl->hasOneUse() && Amt != 0 &&

      shouldChangeType(ShType->getScalarSizeInBits(), TypeBits - Amt)) {

    ICmpInst::Predicate CmpPred = Pred;

    APInt RHSC = C;


    if (RHSC.countr_zero() < Amt && ICmpInst::isStrictPredicate(CmpPred)) {

      // Try the flipped strictness predicate.

      // e.g.:

      // icmp ult i64 (shl X, 32), 8589934593 ->

      // icmp ule i64 (shl X, 32), 8589934592 ->

      // icmp ule i32 (trunc X, i32), 2 ->

      // icmp ult i32 (trunc X, i32), 3

      if (auto FlippedStrictness = getFlippedStrictnessPredicateAndConstant(

              Pred, ConstantInt::get(ShType->getContext(), C))) {

        CmpPred = FlippedStrictness->first;

        RHSC = cast<ConstantInt>(FlippedStrictness->second)->getValue();

      }

    }


    if (RHSC.countr_zero() >= Amt) {

      Type *TruncTy = ShType->getWithNewBitWidth(TypeBits - Amt);

      Constant *NewC =

          ConstantInt::get(TruncTy, RHSC.ashr(*ShiftAmt).trunc(TypeBits - Amt));

      return new ICmpInst(CmpPred,

                          Builder.CreateTrunc(X, TruncTy, "", /*IsNUW=*/false,

                                              Shl->hasNoSignedWrap()),

                          NewC);

    }

  }


  return nullptr;

}


/// Fold icmp ({al}shr X, Y), C.


Instruction *InstCombinerImpl::foldICmpShrConstant(ICmpInst &Cmp,

                                                   BinaryOperator *Shr,

                                                   const APInt &C) {

  // An exact shr only shifts out zero bits, so:

  // icmp eq/ne (shr X, Y), 0 --> icmp eq/ne X, 0

  Value *X = Shr->getOperand(0);

  CmpInst::Predicate Pred = Cmp.getPredicate();

  if (Cmp.isEquality() && Shr->isExact() && C.isZero())

    return new ICmpInst(Pred, X, Cmp.getOperand(1));


  bool IsAShr = Shr->getOpcode() == Instruction::AShr;

  const APInt *ShiftValC;

  if (match(X, m_APInt(ShiftValC))) {

    if (Cmp.isEquality())

      return foldICmpShrConstConst(Cmp, Shr->getOperand(1), C, *ShiftValC);


    // (ShiftValC >> Y) >s -1 --> Y != 0 with ShiftValC < 0

    // (ShiftValC >> Y) <s  0 --> Y == 0 with ShiftValC < 0

    bool TrueIfSigned;

    if (!IsAShr && ShiftValC->isNegative() &&

        isSignBitCheck(Pred, C, TrueIfSigned))

      return new ICmpInst(TrueIfSigned ? CmpInst::ICMP_EQ : CmpInst::ICMP_NE,

                          Shr->getOperand(1),

                          ConstantInt::getNullValue(X->getType()));


    // If the shifted constant is a power-of-2, test the shift amount directly:

    // (ShiftValC >> Y) >u C --> X <u (LZ(C) - LZ(ShiftValC))

    // (ShiftValC >> Y) <u C --> X >=u (LZ(C-1) - LZ(ShiftValC))

    if (!IsAShr && ShiftValC->isPowerOf2() &&

        (Pred == CmpInst::ICMP_UGT || Pred == CmpInst::ICMP_ULT)) {

      bool IsUGT = Pred == CmpInst::ICMP_UGT;

      assert(ShiftValC->uge(C) && "Expected simplify of compare");

      assert((IsUGT || !C.isZero()) && "Expected X u< 0 to simplify");


      unsigned CmpLZ = IsUGT ? C.countl_zero() : (C - 1).countl_zero();

      unsigned ShiftLZ = ShiftValC->countl_zero();

      Constant *NewC = ConstantInt::get(Shr->getType(), CmpLZ - ShiftLZ);

      auto NewPred = IsUGT ? CmpInst::ICMP_ULT : CmpInst::ICMP_UGE;

      return new ICmpInst(NewPred, Shr->getOperand(1), NewC);

    }

  }


  const APInt *ShiftAmtC;

  if (!match(Shr->getOperand(1), m_APInt(ShiftAmtC)))

    return nullptr;


  // Check that the shift amount is in range. If not, don't perform undefined

  // shifts. When the shift is visited it will be simplified.

  unsigned TypeBits = C.getBitWidth();

  unsigned ShAmtVal = ShiftAmtC->getLimitedValue(TypeBits);

  if (ShAmtVal >= TypeBits || ShAmtVal == 0)

    return nullptr;


  bool IsExact = Shr->isExact();

  Type *ShrTy = Shr->getType();

  // TODO: If we could guarantee that InstSimplify would handle all of the

  // constant-value-based preconditions in the folds below, then we could assert

  // those conditions rather than checking them. This is difficult because of

  // undef/poison (PR34838).

  if (IsAShr && Shr->hasOneUse()) {

    if (IsExact && (Pred == CmpInst::ICMP_SLT || Pred == CmpInst::ICMP_ULT) &&

        (C - 1).isPowerOf2() && C.countLeadingZeros() > ShAmtVal) {

      // When C - 1 is a power of two and the transform can be legally

      // performed, prefer this form so the produced constant is close to a

      // power of two.

      // icmp slt/ult (ashr exact X, ShAmtC), C

      // --> icmp slt/ult X, (C - 1) << ShAmtC) + 1

      APInt ShiftedC = (C - 1).shl(ShAmtVal) + 1;

      return new ICmpInst(Pred, X, ConstantInt::get(ShrTy, ShiftedC));

    }

    if (IsExact || Pred == CmpInst::ICMP_SLT || Pred == CmpInst::ICMP_ULT) {

      // When ShAmtC can be shifted losslessly:

      // icmp PRED (ashr exact X, ShAmtC), C --> icmp PRED X, (C << ShAmtC)

      // icmp slt/ult (ashr X, ShAmtC), C --> icmp slt/ult X, (C << ShAmtC)

      APInt ShiftedC = C.shl(ShAmtVal);

      if (ShiftedC.ashr(ShAmtVal) == C)

        return new ICmpInst(Pred, X, ConstantInt::get(ShrTy, ShiftedC));

    }

    if (Pred == CmpInst::ICMP_SGT) {

      // icmp sgt (ashr X, ShAmtC), C --> icmp sgt X, ((C + 1) << ShAmtC) - 1

      APInt ShiftedC = (C + 1).shl(ShAmtVal) - 1;

      if (!C.isMaxSignedValue() && !(C + 1).shl(ShAmtVal).isMinSignedValue() &&

          (ShiftedC + 1).ashr(ShAmtVal) == (C + 1))

        return new ICmpInst(Pred, X, ConstantInt::get(ShrTy, ShiftedC));

    }

    if (Pred == CmpInst::ICMP_UGT) {

      // icmp ugt (ashr X, ShAmtC), C --> icmp ugt X, ((C + 1) << ShAmtC) - 1

      // 'C + 1 << ShAmtC' can overflow as a signed number, so the 2nd

      // clause accounts for that pattern.

      APInt ShiftedC = (C + 1).shl(ShAmtVal) - 1;

      if ((ShiftedC + 1).ashr(ShAmtVal) == (C + 1) ||

          (C + 1).shl(ShAmtVal).isMinSignedValue())

        return new ICmpInst(Pred, X, ConstantInt::get(ShrTy, ShiftedC));

    }


    // If the compare constant has significant bits above the lowest sign-bit,

    // then convert an unsigned cmp to a test of the sign-bit:

    // (ashr X, ShiftC) u> C --> X s< 0

    // (ashr X, ShiftC) u< C --> X s> -1

    if (C.getBitWidth() > 2 && C.getNumSignBits() <= ShAmtVal) {

      if (Pred == CmpInst::ICMP_UGT) {

        return new ICmpInst(CmpInst::ICMP_SLT, X,

                            ConstantInt::getNullValue(ShrTy));

      }

      if (Pred == CmpInst::ICMP_ULT) {

        return new ICmpInst(CmpInst::ICMP_SGT, X,

                            ConstantInt::getAllOnesValue(ShrTy));

      }

    }

  } else if (!IsAShr) {

    if (Pred == CmpInst::ICMP_ULT || (Pred == CmpInst::ICMP_UGT && IsExact)) {

      // icmp ult (lshr X, ShAmtC), C --> icmp ult X, (C << ShAmtC)

      // icmp ugt (lshr exact X, ShAmtC), C --> icmp ugt X, (C << ShAmtC)

      APInt ShiftedC = C.shl(ShAmtVal);

      if (ShiftedC.lshr(ShAmtVal) == C)

        return new ICmpInst(Pred, X, ConstantInt::get(ShrTy, ShiftedC));

    }

    if (Pred == CmpInst::ICMP_UGT) {

      // icmp ugt (lshr X, ShAmtC), C --> icmp ugt X, ((C + 1) << ShAmtC) - 1

      APInt ShiftedC = (C + 1).shl(ShAmtVal) - 1;

      if ((ShiftedC + 1).lshr(ShAmtVal) == (C + 1))

        return new ICmpInst(Pred, X, ConstantInt::get(ShrTy, ShiftedC));

    }

  }


  if (!Cmp.isEquality())

    return nullptr;


  // Handle equality comparisons of shift-by-constant.


  // If the comparison constant changes with the shift, the comparison cannot

  // succeed (bits of the comparison constant cannot match the shifted value).

  // This should be known by InstSimplify and already be folded to true/false.

  assert(((IsAShr && C.shl(ShAmtVal).ashr(ShAmtVal) == C) ||

          (!IsAShr && C.shl(ShAmtVal).lshr(ShAmtVal) == C)) &&

         "Expected icmp+shr simplify did not occur.");


  // If the bits shifted out are known zero, compare the unshifted value:

  //  (X & 4) >> 1 == 2  --> (X & 4) == 4.

  if (Shr->isExact())

    return new ICmpInst(Pred, X, ConstantInt::get(ShrTy, C << ShAmtVal));


  if (C.isZero()) {

    // == 0 is u< 1.

    if (Pred == CmpInst::ICMP_EQ)

      return new ICmpInst(CmpInst::ICMP_ULT, X,

                          ConstantInt::get(ShrTy, (C + 1).shl(ShAmtVal)));

    else

      return new ICmpInst(CmpInst::ICMP_UGT, X,

                          ConstantInt::get(ShrTy, (C + 1).shl(ShAmtVal) - 1));

  }


  if (Shr->hasOneUse()) {

    // Canonicalize the shift into an 'and':

    // icmp eq/ne (shr X, ShAmt), C --> icmp eq/ne (and X, HiMask), (C << ShAmt)

    APInt Val(APInt::getHighBitsSet(TypeBits, TypeBits - ShAmtVal));

    Constant *Mask = ConstantInt::get(ShrTy, Val);

    Value *And = Builder.CreateAnd(X, Mask, Shr->getName() + ".mask");

    return new ICmpInst(Pred, And, ConstantInt::get(ShrTy, C << ShAmtVal));

  }


  return nullptr;

}


Instruction *InstCombinerImpl::foldICmpSRemConstant(ICmpInst &Cmp,

                                                    BinaryOperator *SRem,

                                                    const APInt &C) {

  const ICmpInst::Predicate Pred = Cmp.getPredicate();

  if (Pred == ICmpInst::ICMP_UGT || Pred == ICmpInst::ICMP_ULT) {

    // Canonicalize unsigned predicates to signed:

    // (X s% DivisorC) u> C -> (X s% DivisorC) s< 0

    //   iff (C s< 0 ? ~C : C) u>= abs(DivisorC)-1

    // (X s% DivisorC) u< C+1 -> (X s% DivisorC) s> -1

    //   iff (C+1 s< 0 ? ~C : C) u>= abs(DivisorC)-1


    const APInt *DivisorC;

    if (!match(SRem->getOperand(1), m_APInt(DivisorC)))

      return nullptr;


    APInt NormalizedC = C;

    if (Pred == ICmpInst::ICMP_ULT) {

      assert(!NormalizedC.isZero() &&

             "ult X, 0 should have been simplified already.");

      --NormalizedC;

    }

    if (C.isNegative())

      NormalizedC.flipAllBits();

    assert(!DivisorC->isZero() &&

           "srem X, 0 should have been simplified already.");

    if (!NormalizedC.uge(DivisorC->abs() - 1))

      return nullptr;


    Type *Ty = SRem->getType();

    if (Pred == ICmpInst::ICMP_UGT)

      return new ICmpInst(ICmpInst::ICMP_SLT, SRem,

                          ConstantInt::getNullValue(Ty));

    return new ICmpInst(ICmpInst::ICMP_SGT, SRem,

                        ConstantInt::getAllOnesValue(Ty));

  }

  // Match an 'is positive' or 'is negative' comparison of remainder by a

  // constant power-of-2 value:

  // (X % pow2C) sgt/slt 0

  if (Pred != ICmpInst::ICMP_SGT && Pred != ICmpInst::ICMP_SLT &&

      Pred != ICmpInst::ICMP_EQ && Pred != ICmpInst::ICMP_NE)

    return nullptr;


  // TODO: The one-use check is standard because we do not typically want to

  //       create longer instruction sequences, but this might be a special-case

  //       because srem is not good for analysis or codegen.

  if (!SRem->hasOneUse())

    return nullptr;


  const APInt *DivisorC;

  if (!match(SRem->getOperand(1), m_Power2(DivisorC)))

    return nullptr;


  // For cmp_sgt/cmp_slt only zero valued C is handled.

  // For cmp_eq/cmp_ne only positive valued C is handled.

  if (((Pred == ICmpInst::ICMP_SGT || Pred == ICmpInst::ICMP_SLT) &&

       !C.isZero()) ||

      ((Pred == ICmpInst::ICMP_EQ || Pred == ICmpInst::ICMP_NE) &&

       !C.isStrictlyPositive()))

    return nullptr;


  // Mask off the sign bit and the modulo bits (low-bits).

  Type *Ty = SRem->getType();

  APInt SignMask = APInt::getSignMask(Ty->getScalarSizeInBits());

  Constant *MaskC = ConstantInt::get(Ty, SignMask | (*DivisorC - 1));

  Value *And = Builder.CreateAnd(SRem->getOperand(0), MaskC);


  if (Pred == ICmpInst::ICMP_EQ || Pred == ICmpInst::ICMP_NE)

    return new ICmpInst(Pred, And, ConstantInt::get(Ty, C));


  // For 'is positive?' check that the sign-bit is clear and at least 1 masked

  // bit is set. Example:

  // (i8 X % 32) s> 0 --> (X & 159) s> 0

  if (Pred == ICmpInst::ICMP_SGT)

    return new ICmpInst(ICmpInst::ICMP_SGT, And, ConstantInt::getNullValue(Ty));


  // For 'is negative?' check that the sign-bit is set and at least 1 masked

  // bit is set. Example:

  // (i16 X % 4) s< 0 --> (X & 32771) u> 32768

  return new ICmpInst(ICmpInst::ICMP_UGT, And, ConstantInt::get(Ty, SignMask));

}


/// Fold icmp (udiv X, Y), C.


Instruction *InstCombinerImpl::foldICmpUDivConstant(ICmpInst &Cmp,

                                                    BinaryOperator *UDiv,

                                                    const APInt &C) {

  ICmpInst::Predicate Pred = Cmp.getPredicate();

  Value *X = UDiv->getOperand(0);

  Value *Y = UDiv->getOperand(1);

  Type *Ty = UDiv->getType();


  const APInt *C2;

  if (!match(X, m_APInt(C2)))

    return nullptr;


  assert(*C2 != 0 && "udiv 0, X should have been simplified already.");


  // (icmp ugt (udiv C2, Y), C) -> (icmp ule Y, C2/(C+1))

  if (Pred == ICmpInst::ICMP_UGT) {

    assert(!C.isMaxValue() &&

           "icmp ugt X, UINT_MAX should have been simplified already.");

    return new ICmpInst(ICmpInst::ICMP_ULE, Y,

                        ConstantInt::get(Ty, C2->udiv(C + 1)));

  }


  // (icmp ult (udiv C2, Y), C) -> (icmp ugt Y, C2/C)

  if (Pred == ICmpInst::ICMP_ULT) {

    assert(C != 0 && "icmp ult X, 0 should have been simplified already.");

    return new ICmpInst(ICmpInst::ICMP_UGT, Y,

                        ConstantInt::get(Ty, C2->udiv(C)));

  }


  return nullptr;

}


/// Fold icmp ({su}div X, Y), C.


Instruction *InstCombinerImpl::foldICmpDivConstant(ICmpInst &Cmp,

                                                   BinaryOperator *Div,

                                                   const APInt &C) {

  ICmpInst::Predicate Pred = Cmp.getPredicate();

  Value *X = Div->getOperand(0);

  Value *Y = Div->getOperand(1);

  Type *Ty = Div->getType();

  bool DivIsSigned = Div->getOpcode() == Instruction::SDiv;


  // If unsigned division and the compare constant is bigger than

  // UMAX/2 (negative), there's only one pair of values that satisfies an

  // equality check, so eliminate the division:

  // (X u/ Y) == C --> (X == C) && (Y == 1)

  // (X u/ Y) != C --> (X != C) || (Y != 1)

  // Similarly, if signed division and the compare constant is exactly SMIN:

  // (X s/ Y) == SMIN --> (X == SMIN) && (Y == 1)

  // (X s/ Y) != SMIN --> (X != SMIN) || (Y != 1)

  if (Cmp.isEquality() && Div->hasOneUse() && C.isSignBitSet() &&

      (!DivIsSigned || C.isMinSignedValue())) {

    Value *XBig = Builder.CreateICmp(Pred, X, ConstantInt::get(Ty, C));

    Value *YOne = Builder.CreateICmp(Pred, Y, ConstantInt::get(Ty, 1));

    auto Logic = Pred == ICmpInst::ICMP_EQ ? Instruction::And : Instruction::Or;

    return BinaryOperator::Create(Logic, XBig, YOne);

  }


  // Fold: icmp pred ([us]div X, C2), C -> range test

  // Fold this div into the comparison, producing a range check.

  // Determine, based on the divide type, what the range is being

  // checked.  If there is an overflow on the low or high side, remember

  // it, otherwise compute the range [low, hi) bounding the new value.

  // See: InsertRangeTest above for the kinds of replacements possible.

  const APInt *C2;

  if (!match(Y, m_APInt(C2)))

    return nullptr;


  // FIXME: If the operand types don't match the type of the divide

  // then don't attempt this transform. The code below doesn't have the

  // logic to deal with a signed divide and an unsigned compare (and

  // vice versa). This is because (x /s C2) <s C  produces different

  // results than (x /s C2) <u C or (x /u C2) <s C or even

  // (x /u C2) <u C.  Simply casting the operands and result won't

  // work. :(  The if statement below tests that condition and bails

  // if it finds it.

  if (!Cmp.isEquality() && DivIsSigned != Cmp.isSigned())

    return nullptr;


  // The ProdOV computation fails on divide by 0 and divide by -1. Cases with

  // INT_MIN will also fail if the divisor is 1. Although folds of all these

  // division-by-constant cases should be present, we can not assert that they

  // have happened before we reach this icmp instruction.

  if (C2->isZero() || C2->isOne() || (DivIsSigned && C2->isAllOnes()))

    return nullptr;


  // Compute Prod = C * C2. We are essentially solving an equation of

  // form X / C2 = C. We solve for X by multiplying C2 and C.

  // By solving for X, we can turn this into a range check instead of computing

  // a divide.

  APInt Prod = C * *C2;


  // Determine if the product overflows by seeing if the product is not equal to

  // the divide. Make sure we do the same kind of divide as in the LHS

  // instruction that we're folding.

  bool ProdOV = (DivIsSigned ? Prod.sdiv(*C2) : Prod.udiv(*C2)) != C;


  // If the division is known to be exact, then there is no remainder from the

  // divide, so the covered range size is unit, otherwise it is the divisor.

  APInt RangeSize = Div->isExact() ? APInt(C2->getBitWidth(), 1) : *C2;


  // Figure out the interval that is being checked.  For example, a comparison

  // like "X /u 5 == 0" is really checking that X is in the interval [0, 5).

  // Compute this interval based on the constants involved and the signedness of

  // the compare/divide.  This computes a half-open interval, keeping track of

  // whether either value in the interval overflows.  After analysis each

  // overflow variable is set to 0 if it's corresponding bound variable is valid

  // -1 if overflowed off the bottom end, or +1 if overflowed off the top end.

  int LoOverflow = 0, HiOverflow = 0;

  APInt LoBound, HiBound;


  if (!DivIsSigned) { // udiv

    // e.g. X/5 op 3  --> [15, 20)

    LoBound = Prod;

    HiOverflow = LoOverflow = ProdOV;

    if (!HiOverflow) {

      // If this is not an exact divide, then many values in the range collapse

      // to the same result value.

      HiOverflow = addWithOverflow(HiBound, LoBound, RangeSize, false);

    }

  } else if (C2->isStrictlyPositive()) { // Divisor is > 0.

    if (C.isZero()) {                    // (X / pos) op 0

      // Can't overflow.  e.g.  X/2 op 0 --> [-1, 2)

      LoBound = -(RangeSize - 1);

      HiBound = RangeSize;

    } else if (C.isStrictlyPositive()) { // (X / pos) op pos

      LoBound = Prod;                    // e.g.   X/5 op 3 --> [15, 20)

      HiOverflow = LoOverflow = ProdOV;

      if (!HiOverflow)

        HiOverflow = addWithOverflow(HiBound, Prod, RangeSize, true);

    } else { // (X / pos) op neg

      // e.g. X/5 op -3  --> [-15-4, -15+1) --> [-19, -14)

      HiBound = Prod + 1;

      LoOverflow = HiOverflow = ProdOV ? -1 : 0;

      if (!LoOverflow) {

        APInt DivNeg = -RangeSize;

        LoOverflow = addWithOverflow(LoBound, HiBound, DivNeg, true) ? -1 : 0;

      }

    }

  } else if (C2->isNegative()) { // Divisor is < 0.

    if (Div->isExact())

      RangeSize.negate();

    if (C.isZero()) { // (X / neg) op 0

      // e.g. X/-5 op 0  --> [-4, 5)

      LoBound = RangeSize + 1;

      HiBound = -RangeSize;

      if (HiBound == *C2) { // -INTMIN = INTMIN

        HiOverflow = 1;     // [INTMIN+1, overflow)

        HiBound = APInt();  // e.g. X/INTMIN = 0 --> X > INTMIN

      }

    } else if (C.isStrictlyPositive()) { // (X / neg) op pos

      // e.g. X/-5 op 3  --> [-19, -14)

      HiBound = Prod + 1;

      HiOverflow = LoOverflow = ProdOV ? -1 : 0;

      if (!LoOverflow)

        LoOverflow =

            addWithOverflow(LoBound, HiBound, RangeSize, true) ? -1 : 0;

    } else {          // (X / neg) op neg

      LoBound = Prod; // e.g. X/-5 op -3  --> [15, 20)

      LoOverflow = HiOverflow = ProdOV;

      if (!HiOverflow)

        HiOverflow = subWithOverflow(HiBound, Prod, RangeSize, true);

    }


    // Dividing by a negative swaps the condition.  LT <-> GT

    Pred = ICmpInst::getSwappedPredicate(Pred);

  }


  switch (Pred) {

  default:

    llvm_unreachable("Unhandled icmp predicate!");

  case ICmpInst::ICMP_EQ:

    if (LoOverflow && HiOverflow)

      return replaceInstUsesWith(Cmp, Builder.getFalse());

    if (HiOverflow)

      return new ICmpInst(DivIsSigned ? ICmpInst::ICMP_SGE : ICmpInst::ICMP_UGE,

                          X, ConstantInt::get(Ty, LoBound));

    if (LoOverflow)

      return new ICmpInst(DivIsSigned ? ICmpInst::ICMP_SLT : ICmpInst::ICMP_ULT,

                          X, ConstantInt::get(Ty, HiBound));

    return replaceInstUsesWith(

        Cmp, insertRangeTest(X, LoBound, HiBound, DivIsSigned, true));

  case ICmpInst::ICMP_NE:

    if (LoOverflow && HiOverflow)

      return replaceInstUsesWith(Cmp, Builder.getTrue());

    if (HiOverflow)

      return new ICmpInst(DivIsSigned ? ICmpInst::ICMP_SLT : ICmpInst::ICMP_ULT,

                          X, ConstantInt::get(Ty, LoBound));

    if (LoOverflow)

      return new ICmpInst(DivIsSigned ? ICmpInst::ICMP_SGE : ICmpInst::ICMP_UGE,

                          X, ConstantInt::get(Ty, HiBound));

    return replaceInstUsesWith(

        Cmp, insertRangeTest(X, LoBound, HiBound, DivIsSigned, false));

  case ICmpInst::ICMP_ULT:

  case ICmpInst::ICMP_SLT:

    if (LoOverflow == +1) // Low bound is greater than input range.

      return replaceInstUsesWith(Cmp, Builder.getTrue());

    if (LoOverflow == -1) // Low bound is less than input range.

      return replaceInstUsesWith(Cmp, Builder.getFalse());

    return new ICmpInst(Pred, X, ConstantInt::get(Ty, LoBound));

  case ICmpInst::ICMP_UGT:

  case ICmpInst::ICMP_SGT:

    if (HiOverflow == +1) // High bound greater than input range.

      return replaceInstUsesWith(Cmp, Builder.getFalse());

    if (HiOverflow == -1) // High bound less than input range.

      return replaceInstUsesWith(Cmp, Builder.getTrue());

    if (Pred == ICmpInst::ICMP_UGT)

      return new ICmpInst(ICmpInst::ICMP_UGE, X, ConstantInt::get(Ty, HiBound));

    return new ICmpInst(ICmpInst::ICMP_SGE, X, ConstantInt::get(Ty, HiBound));

  }


  return nullptr;

}


/// Fold icmp (sub X, Y), C.


Instruction *InstCombinerImpl::foldICmpSubConstant(ICmpInst &Cmp,

                                                   BinaryOperator *Sub,

                                                   const APInt &C) {

  Value *X = Sub->getOperand(0), *Y = Sub->getOperand(1);

  ICmpInst::Predicate Pred = Cmp.getPredicate();

  Type *Ty = Sub->getType();


  // (SubC - Y) == C) --> Y == (SubC - C)

  // (SubC - Y) != C) --> Y != (SubC - C)

  Constant *SubC;

  if (Cmp.isEquality() && match(X, m_ImmConstant(SubC))) {

    return new ICmpInst(Pred, Y,

                        ConstantExpr::getSub(SubC, ConstantInt::get(Ty, C)));

  }


  // (icmp P (sub nuw|nsw C2, Y), C) -> (icmp swap(P) Y, C2-C)

  const APInt *C2;

  APInt SubResult;

  ICmpInst::Predicate SwappedPred = Cmp.getSwappedPredicate();

  bool HasNSW = Sub->hasNoSignedWrap();

  bool HasNUW = Sub->hasNoUnsignedWrap();

  if (match(X, m_APInt(C2)) &&

      ((Cmp.isUnsigned() && HasNUW) || (Cmp.isSigned() && HasNSW)) &&

      !subWithOverflow(SubResult, *C2, C, Cmp.isSigned()))

    return new ICmpInst(SwappedPred, Y, ConstantInt::get(Ty, SubResult));


  // X - Y == 0 --> X == Y.

  // X - Y != 0 --> X != Y.

  // TODO: We allow this with multiple uses as long as the other uses are not

  //       in phis. The phi use check is guarding against a codegen regression

  //       for a loop test. If the backend could undo this (and possibly

  //       subsequent transforms), we would not need this hack.

  if (Cmp.isEquality() && C.isZero() &&

      none_of((Sub->users()), [](const User *U) { return isa<PHINode>(U); }))

    return new ICmpInst(Pred, X, Y);


  // The following transforms are only worth it if the only user of the subtract

  // is the icmp.

  // TODO: This is an artificial restriction for all of the transforms below

  //       that only need a single replacement icmp. Can these use the phi test

  //       like the transform above here?

  if (!Sub->hasOneUse())

    return nullptr;


  if (Sub->hasNoSignedWrap()) {

    // (icmp sgt (sub nsw X, Y), -1) -> (icmp sge X, Y)

    if (Pred == ICmpInst::ICMP_SGT && C.isAllOnes())

      return new ICmpInst(ICmpInst::ICMP_SGE, X, Y);


    // (icmp sgt (sub nsw X, Y), 0) -> (icmp sgt X, Y)

    if (Pred == ICmpInst::ICMP_SGT && C.isZero())

      return new ICmpInst(ICmpInst::ICMP_SGT, X, Y);


    // (icmp slt (sub nsw X, Y), 0) -> (icmp slt X, Y)

    if (Pred == ICmpInst::ICMP_SLT && C.isZero())

      return new ICmpInst(ICmpInst::ICMP_SLT, X, Y);


    // (icmp slt (sub nsw X, Y), 1) -> (icmp sle X, Y)

    if (Pred == ICmpInst::ICMP_SLT && C.isOne())

      return new ICmpInst(ICmpInst::ICMP_SLE, X, Y);

  }


  if (!match(X, m_APInt(C2)))

    return nullptr;


  // C2 - Y <u C -> (Y | (C - 1)) == C2

  //   iff (C2 & (C - 1)) == C - 1 and C is a power of 2

  if (Pred == ICmpInst::ICMP_ULT && C.isPowerOf2() &&

      (*C2 & (C - 1)) == (C - 1))

    return new ICmpInst(ICmpInst::ICMP_EQ, Builder.CreateOr(Y, C - 1), X);


  // C2 - Y >u C -> (Y | C) != C2

  //   iff C2 & C == C and C + 1 is a power of 2

  if (Pred == ICmpInst::ICMP_UGT && (C + 1).isPowerOf2() && (*C2 & C) == C)

    return new ICmpInst(ICmpInst::ICMP_NE, Builder.CreateOr(Y, C), X);


  // We have handled special cases that reduce.

  // Canonicalize any remaining sub to add as:

  // (C2 - Y) > C --> (Y + ~C2) < ~C

  Value *Add = Builder.CreateAdd(Y, ConstantInt::get(Ty, ~(*C2)), "notsub",

                                 HasNUW, HasNSW);

  return new ICmpInst(SwappedPred, Add, ConstantInt::get(Ty, ~C));

}


static Value *createLogicFromTable(const std::bitset<4> &Table, Value *Op0,

                                   Value *Op1, IRBuilderBase &Builder,

                                   bool HasOneUse) {

  auto FoldConstant = [&](bool Val) {

    Constant *Res = Val ? Builder.getTrue() : Builder.getFalse();

    if (Op0->getType()->isVectorTy())

      Res = ConstantVector::getSplat(

          cast<VectorType>(Op0->getType())->getElementCount(), Res);

    return Res;

  };


  switch (Table.to_ulong()) {

  case 0: // 0 0 0 0

    return FoldConstant(false);

  case 1: // 0 0 0 1

    return HasOneUse ? Builder.CreateNot(Builder.CreateOr(Op0, Op1)) : nullptr;

  case 2: // 0 0 1 0

    return HasOneUse ? Builder.CreateAnd(Builder.CreateNot(Op0), Op1) : nullptr;

  case 3: // 0 0 1 1

    return Builder.CreateNot(Op0);

  case 4: // 0 1 0 0

    return HasOneUse ? Builder.CreateAnd(Op0, Builder.CreateNot(Op1)) : nullptr;

  case 5: // 0 1 0 1

    return Builder.CreateNot(Op1);

  case 6: // 0 1 1 0

    return Builder.CreateXor(Op0, Op1);

  case 7: // 0 1 1 1

    return HasOneUse ? Builder.CreateNot(Builder.CreateAnd(Op0, Op1)) : nullptr;

  case 8: // 1 0 0 0

    return Builder.CreateAnd(Op0, Op1);

  case 9: // 1 0 0 1

    return HasOneUse ? Builder.CreateNot(Builder.CreateXor(Op0, Op1)) : nullptr;

  case 10: // 1 0 1 0

    return Op1;

  case 11: // 1 0 1 1

    return HasOneUse ? Builder.CreateOr(Builder.CreateNot(Op0), Op1) : nullptr;

  case 12: // 1 1 0 0

    return Op0;

  case 13: // 1 1 0 1

    return HasOneUse ? Builder.CreateOr(Op0, Builder.CreateNot(Op1)) : nullptr;

  case 14: // 1 1 1 0

    return Builder.CreateOr(Op0, Op1);

  case 15: // 1 1 1 1

    return FoldConstant(true);

  default:

    llvm_unreachable("Invalid Operation");

  }

  return nullptr;

}


Instruction *InstCombinerImpl::foldICmpBinOpWithConstantViaTruthTable(

    ICmpInst &Cmp, BinaryOperator *BO, const APInt &C) {

  Value *A, *B;

  Constant *C1, *C2, *C3, *C4;

  if (!(match(BO->getOperand(0),

              m_Select(m_Value(A), m_Constant(C1), m_Constant(C2)))) ||

      !match(BO->getOperand(1),

             m_Select(m_Value(B), m_Constant(C3), m_Constant(C4))) ||

      Cmp.getType() != A->getType())

    return nullptr;


  std::bitset<4> Table;

  auto ComputeTable = [&](bool First, bool Second) -> std::optional<bool> {

    Constant *L = First ? C1 : C2;

    Constant *R = Second ? C3 : C4;

    if (auto *Res = ConstantFoldBinaryOpOperands(BO->getOpcode(), L, R, DL)) {

      auto *Val = Res->getType()->isVectorTy() ? Res->getSplatValue() : Res;

      if (auto *CI = dyn_cast_or_null<ConstantInt>(Val))

        return ICmpInst::compare(CI->getValue(), C, Cmp.getPredicate());

    }

    return std::nullopt;

  };


  for (unsigned I = 0; I < 4; ++I) {

    bool First = (I >> 1) & 1;

    bool Second = I & 1;

    if (auto Res = ComputeTable(First, Second))

      Table[I] = *Res;

    else

      return nullptr;

  }


  // Synthesize optimal logic.

  if (auto *Cond = createLogicFromTable(Table, A, B, Builder, BO->hasOneUse()))

    return replaceInstUsesWith(Cmp, Cond);

  return nullptr;

}


/// Fold icmp (add X, Y), C.


Instruction *InstCombinerImpl::foldICmpAddConstant(ICmpInst &Cmp,

                                                   BinaryOperator *Add,

                                                   const APInt &C) {

  Value *Y = Add->getOperand(1);

  Value *X = Add->getOperand(0);


  Value *Op0, *Op1;

  Instruction *Ext0, *Ext1;

  const CmpInst::Predicate Pred = Cmp.getPredicate();

  if (match(Add,

            m_Add(m_CombineAnd(m_Instruction(Ext0), m_ZExtOrSExt(m_Value(Op0))),

                  m_CombineAnd(m_Instruction(Ext1),

                               m_ZExtOrSExt(m_Value(Op1))))) &&

      Op0->getType()->isIntOrIntVectorTy(1) &&

      Op1->getType()->isIntOrIntVectorTy(1)) {

    unsigned BW = C.getBitWidth();

    std::bitset<4> Table;

    auto ComputeTable = [&](bool Op0Val, bool Op1Val) {

      APInt Res(BW, 0);

      if (Op0Val)

        Res += APInt(BW, isa<ZExtInst>(Ext0) ? 1 : -1, /*isSigned=*/true);

      if (Op1Val)

        Res += APInt(BW, isa<ZExtInst>(Ext1) ? 1 : -1, /*isSigned=*/true);

      return ICmpInst::compare(Res, C, Pred);

    };


    Table[0] = ComputeTable(false, false);

    Table[1] = ComputeTable(false, true);

    Table[2] = ComputeTable(true, false);

    Table[3] = ComputeTable(true, true);

    if (auto *Cond =

            createLogicFromTable(Table, Op0, Op1, Builder, Add->hasOneUse()))

      return replaceInstUsesWith(Cmp, Cond);

  }

  const APInt *C2;

  if (Cmp.isEquality() || !match(Y, m_APInt(C2)))

    return nullptr;


  // Fold icmp pred (add X, C2), C.

  Type *Ty = Add->getType();


  // If the add does not wrap, we can always adjust the compare by subtracting

  // the constants. Equality comparisons are handled elsewhere. SGE/SLE/UGE/ULE

  // are canonicalized to SGT/SLT/UGT/ULT.

  if ((Add->hasNoSignedWrap() &&

       (Pred == ICmpInst::ICMP_SGT || Pred == ICmpInst::ICMP_SLT)) ||

      (Add->hasNoUnsignedWrap() &&

       (Pred == ICmpInst::ICMP_UGT || Pred == ICmpInst::ICMP_ULT))) {

    bool Overflow;

    APInt NewC =

        Cmp.isSigned() ? C.ssub_ov(*C2, Overflow) : C.usub_ov(*C2, Overflow);

    // If there is overflow, the result must be true or false.

    // TODO: Can we assert there is no overflow because InstSimplify always

    // handles those cases?

    if (!Overflow)

      // icmp Pred (add nsw X, C2), C --> icmp Pred X, (C - C2)

      return new ICmpInst(Pred, X, ConstantInt::get(Ty, NewC));

  }


  if (ICmpInst::isUnsigned(Pred) && Add->hasNoSignedWrap() &&

      C.isNonNegative() && (C - *C2).isNonNegative() &&

      computeConstantRange(X, /*ForSigned=*/true).add(*C2).isAllNonNegative())

    return new ICmpInst(ICmpInst::getSignedPredicate(Pred), X,

                        ConstantInt::get(Ty, C - *C2));


  auto CR = ConstantRange::makeExactICmpRegion(Pred, C).subtract(*C2);

  const APInt &Upper = CR.getUpper();

  const APInt &Lower = CR.getLower();

  if (Cmp.isSigned()) {

    if (Lower.isSignMask())

      return new ICmpInst(ICmpInst::ICMP_SLT, X, ConstantInt::get(Ty, Upper));

    if (Upper.isSignMask())

      return new ICmpInst(ICmpInst::ICMP_SGE, X, ConstantInt::get(Ty, Lower));

  } else {

    if (Lower.isMinValue())

      return new ICmpInst(ICmpInst::ICMP_ULT, X, ConstantInt::get(Ty, Upper));

    if (Upper.isMinValue())

      return new ICmpInst(ICmpInst::ICMP_UGE, X, ConstantInt::get(Ty, Lower));

  }


  // This set of folds is intentionally placed after folds that use no-wrapping

  // flags because those folds are likely better for later analysis/codegen.

  const APInt SMax = APInt::getSignedMaxValue(Ty->getScalarSizeInBits());

  const APInt SMin = APInt::getSignedMinValue(Ty->getScalarSizeInBits());


  // Fold compare with offset to opposite sign compare if it eliminates offset:

  // (X + C2) >u C --> X <s -C2 (if C == C2 + SMAX)

  if (Pred == CmpInst::ICMP_UGT && C == *C2 + SMax)

    return new ICmpInst(ICmpInst::ICMP_SLT, X, ConstantInt::get(Ty, -(*C2)));


  // (X + C2) <u C --> X >s ~C2 (if C == C2 + SMIN)

  if (Pred == CmpInst::ICMP_ULT && C == *C2 + SMin)

    return new ICmpInst(ICmpInst::ICMP_SGT, X, ConstantInt::get(Ty, ~(*C2)));


  // (X + C2) >s C --> X <u (SMAX - C) (if C == C2 - 1)

  if (Pred == CmpInst::ICMP_SGT && C == *C2 - 1)

    return new ICmpInst(ICmpInst::ICMP_ULT, X, ConstantInt::get(Ty, SMax - C));


  // (X + C2) <s C --> X >u (C ^ SMAX) (if C == C2)

  if (Pred == CmpInst::ICMP_SLT && C == *C2)

    return new ICmpInst(ICmpInst::ICMP_UGT, X, ConstantInt::get(Ty, C ^ SMax));


  // (X + -1) <u C --> X <=u C (if X is never null)

  if (Pred == CmpInst::ICMP_ULT && C2->isAllOnes()) {

    const SimplifyQuery Q = SQ.getWithInstruction(&Cmp);

    if (llvm::isKnownNonZero(X, Q))

      return new ICmpInst(ICmpInst::ICMP_ULE, X, ConstantInt::get(Ty, C));

  }


  if (!Add->hasOneUse())

    return nullptr;


  // X+C <u C2 -> (X & -C2) == C

  //   iff C & (C2-1) == 0

  //       C2 is a power of 2

  if (Pred == ICmpInst::ICMP_ULT && C.isPowerOf2() && (*C2 & (C - 1)) == 0)

    return new ICmpInst(ICmpInst::ICMP_EQ, Builder.CreateAnd(X, -C),

                        ConstantExpr::getNeg(cast<Constant>(Y)));


  // X+C2 <u C -> (X & C) == 2C

  //   iff C == -(C2)

  //       C2 is a power of 2

  if (Pred == ICmpInst::ICMP_ULT && C2->isPowerOf2() && C == -*C2)

    return new ICmpInst(ICmpInst::ICMP_NE, Builder.CreateAnd(X, C),

                        ConstantInt::get(Ty, C * 2));


  // X+C >u C2 -> (X & ~C2) != C

  //   iff C & C2 == 0

  //       C2+1 is a power of 2

  if (Pred == ICmpInst::ICMP_UGT && (C + 1).isPowerOf2() && (*C2 & C) == 0)

    return new ICmpInst(ICmpInst::ICMP_NE, Builder.CreateAnd(X, ~C),

                        ConstantExpr::getNeg(cast<Constant>(Y)));


  // The range test idiom can use either ult or ugt. Arbitrarily canonicalize

  // to the ult form.

  // X+C2 >u C -> X+(C2-C-1) <u ~C

  if (Pred == ICmpInst::ICMP_UGT)

    return new ICmpInst(ICmpInst::ICMP_ULT,

                        Builder.CreateAdd(X, ConstantInt::get(Ty, *C2 - C - 1)),

                        ConstantInt::get(Ty, ~C));


  // zext(V) + C2 pred C -> V + C3 pred' C4

  Value *V;

  if (match(X, m_ZExt(m_Value(V)))) {

    Type *NewCmpTy = V->getType();

    unsigned NewCmpBW = NewCmpTy->getScalarSizeInBits();

    if (shouldChangeType(Ty, NewCmpTy)) {

      ConstantRange SrcCR = CR.truncate(NewCmpBW, TruncInst::NoUnsignedWrap);

      CmpInst::Predicate EquivPred;

      APInt EquivInt;

      APInt EquivOffset;


      SrcCR.getEquivalentICmp(EquivPred, EquivInt, EquivOffset);

      return new ICmpInst(

          EquivPred,

          EquivOffset.isZero()

              ? V

              : Builder.CreateAdd(V, ConstantInt::get(NewCmpTy, EquivOffset)),

          ConstantInt::get(NewCmpTy, EquivInt));

    }

  }


  return nullptr;

}


bool InstCombinerImpl::matchThreeWayIntCompare(SelectInst *SI, Value *&LHS,

                                               Value *&RHS, ConstantInt *&Less,

                                               ConstantInt *&Equal,

                                               ConstantInt *&Greater) {

  // TODO: Generalize this to work with other comparison idioms or ensure

  // they get canonicalized into this form.


  // select i1 (a == b),

  //        i32 Equal,

  //        i32 (select i1 (a < b), i32 Less, i32 Greater)

  // where Equal, Less and Greater are placeholders for any three constants.

  CmpPredicate PredA;

  if (!match(SI->getCondition(), m_ICmp(PredA, m_Value(LHS), m_Value(RHS))) ||

      !ICmpInst::isEquality(PredA))

    return false;

  Value *EqualVal = SI->getTrueValue();

  Value *UnequalVal = SI->getFalseValue();

  // We still can get non-canonical predicate here, so canonicalize.

  if (PredA == ICmpInst::ICMP_NE)

    std::swap(EqualVal, UnequalVal);

  if (!match(EqualVal, m_ConstantInt(Equal)))

    return false;

  CmpPredicate PredB;

  Value *LHS2, *RHS2;

  if (!match(UnequalVal, m_Select(m_ICmp(PredB, m_Value(LHS2), m_Value(RHS2)),

                                  m_ConstantInt(Less), m_ConstantInt(Greater))))

    return false;

  // We can get predicate mismatch here, so canonicalize if possible:

  // First, ensure that 'LHS' match.

  if (LHS2 != LHS) {

    // x sgt y <--> y slt x

    std::swap(LHS2, RHS2);

    PredB = ICmpInst::getSwappedPredicate(PredB);

  }

  if (LHS2 != LHS)

    return false;

  // We also need to canonicalize 'RHS'.

  if (PredB == ICmpInst::ICMP_SGT && isa<Constant>(RHS2)) {

    // x sgt C-1  <-->  x sge C  <-->  not(x slt C)

    auto FlippedStrictness =

        getFlippedStrictnessPredicateAndConstant(PredB, cast<Constant>(RHS2));

    if (!FlippedStrictness)

      return false;

    assert(FlippedStrictness->first == ICmpInst::ICMP_SGE &&

           "basic correctness failure");

    RHS2 = FlippedStrictness->second;

    // And kind-of perform the result swap.

    std::swap(Less, Greater);

    PredB = ICmpInst::ICMP_SLT;

  }

  return PredB == ICmpInst::ICMP_SLT && RHS == RHS2;

}


Instruction *InstCombinerImpl::foldICmpSelectConstant(ICmpInst &Cmp,

                                                      SelectInst *Select,

                                                      ConstantInt *C) {


  assert(C && "Cmp RHS should be a constant int!");

  // If we're testing a constant value against the result of a three way

  // comparison, the result can be expressed directly in terms of the

  // original values being compared.  Note: We could possibly be more

  // aggressive here and remove the hasOneUse test. The original select is

  // really likely to simplify or sink when we remove a test of the result.

  Value *OrigLHS, *OrigRHS;

  ConstantInt *C1LessThan, *C2Equal, *C3GreaterThan;

  if (Cmp.hasOneUse() &&

      matchThreeWayIntCompare(Select, OrigLHS, OrigRHS, C1LessThan, C2Equal,

                              C3GreaterThan)) {

    assert(C1LessThan && C2Equal && C3GreaterThan);


    bool TrueWhenLessThan = ICmpInst::compare(

        C1LessThan->getValue(), C->getValue(), Cmp.getPredicate());

    bool TrueWhenEqual = ICmpInst::compare(C2Equal->getValue(), C->getValue(),

                                           Cmp.getPredicate());

    bool TrueWhenGreaterThan = ICmpInst::compare(

        C3GreaterThan->getValue(), C->getValue(), Cmp.getPredicate());


    // This generates the new instruction that will replace the original Cmp

    // Instruction. Instead of enumerating the various combinations when

    // TrueWhenLessThan, TrueWhenEqual and TrueWhenGreaterThan are true versus

    // false, we rely on chaining of ORs and future passes of InstCombine to

    // simplify the OR further (i.e. a s< b || a == b becomes a s<= b).


    // When none of the three constants satisfy the predicate for the RHS (C),

    // the entire original Cmp can be simplified to a false.

    Value *Cond = Builder.getFalse();

    if (TrueWhenLessThan)

      Cond = Builder.CreateOr(

          Cond, Builder.CreateICmp(ICmpInst::ICMP_SLT, OrigLHS, OrigRHS));

    if (TrueWhenEqual)

      Cond = Builder.CreateOr(

          Cond, Builder.CreateICmp(ICmpInst::ICMP_EQ, OrigLHS, OrigRHS));

    if (TrueWhenGreaterThan)

      Cond = Builder.CreateOr(

          Cond, Builder.CreateICmp(ICmpInst::ICMP_SGT, OrigLHS, OrigRHS));


    return replaceInstUsesWith(Cmp, Cond);

  }

  return nullptr;

}


Instruction *InstCombinerImpl::foldICmpBitCast(ICmpInst &Cmp) {

  auto *Bitcast = dyn_cast<BitCastInst>(Cmp.getOperand(0));

  if (!Bitcast)

    return nullptr;


  ICmpInst::Predicate Pred = Cmp.getPredicate();

  Value *Op1 = Cmp.getOperand(1);

  Value *BCSrcOp = Bitcast->getOperand(0);

  Type *SrcType = Bitcast->getSrcTy();

  Type *DstType = Bitcast->getType();


  // Make sure the bitcast doesn't change between scalar and vector and

  // doesn't change the number of vector elements.

  if (SrcType->isVectorTy() == DstType->isVectorTy() &&

      SrcType->getScalarSizeInBits() == DstType->getScalarSizeInBits()) {

    // Zero-equality and sign-bit checks are preserved through sitofp + bitcast.

    Value *X;

    if (match(BCSrcOp, m_SIToFP(m_Value(X)))) {

      // icmp  eq (bitcast (sitofp X)), 0 --> icmp  eq X, 0

      // icmp  ne (bitcast (sitofp X)), 0 --> icmp  ne X, 0

      // icmp slt (bitcast (sitofp X)), 0 --> icmp slt X, 0

      // icmp sgt (bitcast (sitofp X)), 0 --> icmp sgt X, 0

      if ((Pred == ICmpInst::ICMP_EQ || Pred == ICmpInst::ICMP_SLT ||

           Pred == ICmpInst::ICMP_NE || Pred == ICmpInst::ICMP_SGT) &&

          match(Op1, m_Zero()))

        return new ICmpInst(Pred, X, ConstantInt::getNullValue(X->getType()));


      // icmp slt (bitcast (sitofp X)), 1 --> icmp slt X, 1

      if (Pred == ICmpInst::ICMP_SLT && match(Op1, m_One()))

        return new ICmpInst(Pred, X, ConstantInt::get(X->getType(), 1));


      // icmp sgt (bitcast (sitofp X)), -1 --> icmp sgt X, -1

      if (Pred == ICmpInst::ICMP_SGT && match(Op1, m_AllOnes()))

        return new ICmpInst(Pred, X,

                            ConstantInt::getAllOnesValue(X->getType()));

    }


    // Zero-equality checks are preserved through unsigned floating-point casts:

    // icmp eq (bitcast (uitofp X)), 0 --> icmp eq X, 0

    // icmp ne (bitcast (uitofp X)), 0 --> icmp ne X, 0

    if (match(BCSrcOp, m_UIToFP(m_Value(X))))

      if (Cmp.isEquality() && match(Op1, m_Zero()))

        return new ICmpInst(Pred, X, ConstantInt::getNullValue(X->getType()));


    const APInt *C;

    bool TrueIfSigned;

    if (match(Op1, m_APInt(C)) && Bitcast->hasOneUse()) {

      // If this is a sign-bit test of a bitcast of a casted FP value, eliminate

      // the FP extend/truncate because that cast does not change the sign-bit.

      // This is true for all standard IEEE-754 types and the X86 80-bit type.

      // The sign-bit is always the most significant bit in those types.

      if (isSignBitCheck(Pred, *C, TrueIfSigned) &&

          (match(BCSrcOp, m_FPExt(m_Value(X))) ||

           match(BCSrcOp, m_FPTrunc(m_Value(X))))) {

        // (bitcast (fpext/fptrunc X)) to iX) < 0 --> (bitcast X to iY) < 0

        // (bitcast (fpext/fptrunc X)) to iX) > -1 --> (bitcast X to iY) > -1

        Type *XType = X->getType();


        // We can't currently handle Power style floating point operations here.

        if (!(XType->isPPC_FP128Ty() || SrcType->isPPC_FP128Ty())) {

          Type *NewType = Builder.getIntNTy(XType->getScalarSizeInBits());

          if (auto *XVTy = dyn_cast<VectorType>(XType))

            NewType = VectorType::get(NewType, XVTy->getElementCount());

          Value *NewBitcast = Builder.CreateBitCast(X, NewType);

          if (TrueIfSigned)

            return new ICmpInst(ICmpInst::ICMP_SLT, NewBitcast,

                                ConstantInt::getNullValue(NewType));

          else

            return new ICmpInst(ICmpInst::ICMP_SGT, NewBitcast,

                                ConstantInt::getAllOnesValue(NewType));

        }

      }


      // icmp eq/ne (bitcast X to int), special fp -> llvm.is.fpclass(X, class)

      Type *FPType = SrcType->getScalarType();

      if (!Cmp.getParent()->getParent()->hasFnAttribute(

              Attribute::NoImplicitFloat) &&

          Cmp.isEquality() && FPType->isIEEELikeFPTy()) {

        FPClassTest Mask = APFloat(FPType->getFltSemantics(), *C).classify();

        if (Mask & (fcInf | fcZero)) {

          if (Pred == ICmpInst::ICMP_NE)

            Mask = ~Mask;

          return replaceInstUsesWith(Cmp,

                                     Builder.createIsFPClass(BCSrcOp, Mask));

        }

      }

    }

  }


  const APInt *C;

  if (!match(Cmp.getOperand(1), m_APInt(C)) || !DstType->isIntegerTy() ||

      !SrcType->isIntOrIntVectorTy())

    return nullptr;


  // If this is checking if all elements of a vector compare are set or not,

  // invert the casted vector equality compare and test if all compare

  // elements are clear or not. Compare against zero is generally easier for

  // analysis and codegen.

  // icmp eq/ne (bitcast (not X) to iN), -1 --> icmp eq/ne (bitcast X to iN), 0

  // Example: are all elements equal? --> are zero elements not equal?

  // TODO: Try harder to reduce compare of 2 freely invertible operands?

  if (Cmp.isEquality() && C->isAllOnes() && Bitcast->hasOneUse()) {

    if (Value *NotBCSrcOp =

            getFreelyInverted(BCSrcOp, BCSrcOp->hasOneUse(), &Builder)) {

      Value *Cast = Builder.CreateBitCast(NotBCSrcOp, DstType);

      return new ICmpInst(Pred, Cast, ConstantInt::getNullValue(DstType));

    }

  }


  // If this is checking if all elements of an extended vector are clear or not,

  // compare in a narrow type to eliminate the extend:

  // icmp eq/ne (bitcast (ext X) to iN), 0 --> icmp eq/ne (bitcast X to iM), 0

  Value *X;

  if (Cmp.isEquality() && C->isZero() && Bitcast->hasOneUse() &&

      match(BCSrcOp, m_ZExtOrSExt(m_Value(X)))) {

    if (auto *VecTy = dyn_cast<FixedVectorType>(X->getType())) {

      Type *NewType = Builder.getIntNTy(VecTy->getPrimitiveSizeInBits());

      Value *NewCast = Builder.CreateBitCast(X, NewType);

      return new ICmpInst(Pred, NewCast, ConstantInt::getNullValue(NewType));

    }

  }


  // Folding: icmp <pred> iN X, C

  //  where X = bitcast <M x iK> (shufflevector <M x iK> %vec, undef, SC)) to iN

  //    and C is a splat of a K-bit pattern

  //    and SC is a constant vector = <C', C', C', ..., C'>

  // Into:

  //   %E = extractelement <M x iK> %vec, i32 C'

  //   icmp <pred> iK %E, trunc(C)

  Value *Vec;

  ArrayRef<int> Mask;

  if (match(BCSrcOp, m_Shuffle(m_Value(Vec), m_Undef(), m_Mask(Mask)))) {

    // Check whether every element of Mask is the same constant

    if (all_equal(Mask)) {

      auto *VecTy = cast<VectorType>(SrcType);

      auto *EltTy = cast<IntegerType>(VecTy->getElementType());

      if (C->isSplat(EltTy->getBitWidth())) {

        // Fold the icmp based on the value of C

        // If C is M copies of an iK sized bit pattern,

        // then:

        //   =>  %E = extractelement <N x iK> %vec, i32 Elem

        //       icmp <pred> iK %SplatVal, <pattern>

        Value *Elem = Builder.getInt32(Mask[0]);

        Value *Extract = Builder.CreateExtractElement(Vec, Elem);

        Value *NewC = ConstantInt::get(EltTy, C->trunc(EltTy->getBitWidth()));

        return new ICmpInst(Pred, Extract, NewC);

      }

    }

  }

  return nullptr;

}


/// Try to fold integer comparisons with a constant operand: icmp Pred X, C

/// where X is some kind of instruction.


Instruction *InstCombinerImpl::foldICmpInstWithConstant(ICmpInst &Cmp) {

  const APInt *C;


  if (match(Cmp.getOperand(1), m_APInt(C))) {

    if (auto *BO = dyn_cast<BinaryOperator>(Cmp.getOperand(0)))

      if (Instruction *I = foldICmpBinOpWithConstant(Cmp, BO, *C))

        return I;


    if (auto *SI = dyn_cast<SelectInst>(Cmp.getOperand(0)))

      // For now, we only support constant integers while folding the

      // ICMP(SELECT)) pattern. We can extend this to support vector of integers

      // similar to the cases handled by binary ops above.

      if (auto *ConstRHS = dyn_cast<ConstantInt>(Cmp.getOperand(1)))

        if (Instruction *I = foldICmpSelectConstant(Cmp, SI, ConstRHS))

          return I;


    if (auto *TI = dyn_cast<TruncInst>(Cmp.getOperand(0)))

      if (Instruction *I = foldICmpTruncConstant(Cmp, TI, *C))

        return I;


    if (auto *II = dyn_cast<IntrinsicInst>(Cmp.getOperand(0)))

      if (Instruction *I = foldICmpIntrinsicWithConstant(Cmp, II, *C))

        return I;


    // (extractval ([s/u]subo X, Y), 0) == 0 --> X == Y

    // (extractval ([s/u]subo X, Y), 0) != 0 --> X != Y

    // TODO: This checks one-use, but that is not strictly necessary.

    Value *Cmp0 = Cmp.getOperand(0);

    Value *X, *Y;

    if (C->isZero() && Cmp.isEquality() && Cmp0->hasOneUse() &&

        (match(Cmp0,

               m_ExtractValue<0>(m_Intrinsic<Intrinsic::ssub_with_overflow>(

                   m_Value(X), m_Value(Y)))) ||

         match(Cmp0,

               m_ExtractValue<0>(m_Intrinsic<Intrinsic::usub_with_overflow>(

                   m_Value(X), m_Value(Y))))))

      return new ICmpInst(Cmp.getPredicate(), X, Y);

  }


  if (match(Cmp.getOperand(1), m_APIntAllowPoison(C)))

    return foldICmpInstWithConstantAllowPoison(Cmp, *C);


  return nullptr;

}


/// Fold an icmp equality instruction with binary operator LHS and constant RHS:

/// icmp eq/ne BO, C.


Instruction *InstCombinerImpl::foldICmpBinOpEqualityWithConstant(

    ICmpInst &Cmp, BinaryOperator *BO, const APInt &C) {

  // TODO: Some of these folds could work with arbitrary constants, but this

  // function is limited to scalar and vector splat constants.

  if (!Cmp.isEquality())

    return nullptr;


  ICmpInst::Predicate Pred = Cmp.getPredicate();

  bool isICMP_NE = Pred == ICmpInst::ICMP_NE;

  Constant *RHS = cast<Constant>(Cmp.getOperand(1));

  Value *BOp0 = BO->getOperand(0), *BOp1 = BO->getOperand(1);


  switch (BO->getOpcode()) {

  case Instruction::SRem:

    // If we have a signed (X % (2^c)) == 0, turn it into an unsigned one.

    if (C.isZero() && BO->hasOneUse()) {

      const APInt *BOC;

      if (match(BOp1, m_APInt(BOC)) && BOC->sgt(1) && BOC->isPowerOf2()) {

        Value *NewRem = Builder.CreateURem(BOp0, BOp1, BO->getName());

        return new ICmpInst(Pred, NewRem,

                            Constant::getNullValue(BO->getType()));

      }

    }

    break;

  case Instruction::Add: {

    // (A + C2) == C --> A == (C - C2)

    // (A + C2) != C --> A != (C - C2)

    // TODO: Remove the one-use limitation? See discussion in D58633.

    if (Constant *C2 = dyn_cast<Constant>(BOp1)) {

      if (BO->hasOneUse())

        return new ICmpInst(Pred, BOp0, ConstantExpr::getSub(RHS, C2));

    } else if (C.isZero()) {

      // Replace ((add A, B) != 0) with (A != -B) if A or B is

      // efficiently invertible, or if the add has just this one use.

      if (Value *NegVal = dyn_castNegVal(BOp1))

        return new ICmpInst(Pred, BOp0, NegVal);

      if (Value *NegVal = dyn_castNegVal(BOp0))

        return new ICmpInst(Pred, NegVal, BOp1);

      if (BO->hasOneUse()) {

        // (add nuw A, B) != 0 -> (or A, B) != 0

        if (match(BO, m_NUWAdd(m_Value(), m_Value()))) {

          Value *Or = Builder.CreateOr(BOp0, BOp1);

          return new ICmpInst(Pred, Or, Constant::getNullValue(BO->getType()));

        }

        Value *Neg = Builder.CreateNeg(BOp1);

        Neg->takeName(BO);

        return new ICmpInst(Pred, BOp0, Neg);

      }

    }

    break;

  }

  case Instruction::Xor:

    if (Constant *BOC = dyn_cast<Constant>(BOp1)) {

      // For the xor case, we can xor two constants together, eliminating

      // the explicit xor.

      return new ICmpInst(Pred, BOp0, ConstantExpr::getXor(RHS, BOC));

    } else if (C.isZero()) {

      // Replace ((xor A, B) != 0) with (A != B)

      return new ICmpInst(Pred, BOp0, BOp1);

    }

    break;

  case Instruction::Or: {

    const APInt *BOC;

    if (match(BOp1, m_APInt(BOC)) && BO->hasOneUse() && RHS->isAllOnesValue()) {

      // Comparing if all bits outside of a constant mask are set?

      // Replace (X | C) == -1 with (X & ~C) == ~C.

      // This removes the -1 constant.

      Constant *NotBOC = ConstantExpr::getNot(cast<Constant>(BOp1));

      Value *And = Builder.CreateAnd(BOp0, NotBOC);

      return new ICmpInst(Pred, And, NotBOC);

    }

    // (icmp eq (or (select cond, 0, NonZero), Other), 0)

    //  -> (and cond, (icmp eq Other, 0))

    // (icmp ne (or (select cond, NonZero, 0), Other), 0)

    //  -> (or cond, (icmp ne Other, 0))

    Value *Cond, *TV, *FV, *Other, *Sel;

    if (C.isZero() &&

        match(BO,

              m_OneUse(m_c_Or(m_CombineAnd(m_Value(Sel),

                                           m_Select(m_Value(Cond), m_Value(TV),

                                                    m_Value(FV))),

                              m_Value(Other)))) &&

        Cond->getType() == Cmp.getType()) {

      const SimplifyQuery Q = SQ.getWithInstruction(&Cmp);

      // Easy case is if eq/ne matches whether 0 is trueval/falseval.

      if (Pred == ICmpInst::ICMP_EQ

              ? (match(TV, m_Zero()) && isKnownNonZero(FV, Q))

              : (match(FV, m_Zero()) && isKnownNonZero(TV, Q))) {

        Value *Cmp = Builder.CreateICmp(

            Pred, Other, Constant::getNullValue(Other->getType()));

        return BinaryOperator::Create(

            Pred == ICmpInst::ICMP_EQ ? Instruction::And : Instruction::Or, Cmp,

            Cond);

      }

      // Harder case is if eq/ne matches whether 0 is falseval/trueval. In this

      // case we need to invert the select condition so we need to be careful to

      // avoid creating extra instructions.

      // (icmp ne (or (select cond, 0, NonZero), Other), 0)

      //  -> (or (not cond), (icmp ne Other, 0))

      // (icmp eq (or (select cond, NonZero, 0), Other), 0)

      //  -> (and (not cond), (icmp eq Other, 0))

      //

      // Only do this if the inner select has one use, in which case we are

      // replacing `select` with `(not cond)`. Otherwise, we will create more

      // uses. NB: Trying to freely invert cond doesn't make sense here, as if

      // cond was freely invertable, the select arms would have been inverted.

      if (Sel->hasOneUse() &&

          (Pred == ICmpInst::ICMP_EQ

               ? (match(FV, m_Zero()) && isKnownNonZero(TV, Q))

               : (match(TV, m_Zero()) && isKnownNonZero(FV, Q)))) {

        Value *NotCond = Builder.CreateNot(Cond);

        Value *Cmp = Builder.CreateICmp(

            Pred, Other, Constant::getNullValue(Other->getType()));

        return BinaryOperator::Create(

            Pred == ICmpInst::ICMP_EQ ? Instruction::And : Instruction::Or, Cmp,

            NotCond);

      }

    }

    break;

  }

  case Instruction::UDiv:

  case Instruction::SDiv:

    if (BO->isExact()) {

      // div exact X, Y eq/ne 0 -> X eq/ne 0

      // div exact X, Y eq/ne 1 -> X eq/ne Y

      // div exact X, Y eq/ne C ->

      //    if Y * C never-overflow && OneUse:

      //      -> Y * C eq/ne X

      if (C.isZero())

        return new ICmpInst(Pred, BOp0, Constant::getNullValue(BO->getType()));

      else if (C.isOne())

        return new ICmpInst(Pred, BOp0, BOp1);

      else if (BO->hasOneUse()) {

        OverflowResult OR = computeOverflow(

            Instruction::Mul, BO->getOpcode() == Instruction::SDiv, BOp1,

            Cmp.getOperand(1), BO);

        if (OR == OverflowResult::NeverOverflows) {

          Value *YC =

              Builder.CreateMul(BOp1, ConstantInt::get(BO->getType(), C));

          return new ICmpInst(Pred, YC, BOp0);

        }

      }

    }

    if (BO->getOpcode() == Instruction::UDiv && C.isZero()) {

      // (icmp eq/ne (udiv A, B), 0) -> (icmp ugt/ule i32 B, A)

      auto NewPred = isICMP_NE ? ICmpInst::ICMP_ULE : ICmpInst::ICMP_UGT;

      return new ICmpInst(NewPred, BOp1, BOp0);

    }

    break;

  default:

    break;

  }

  return nullptr;

}


static Instruction *foldCtpopPow2Test(ICmpInst &I, IntrinsicInst *CtpopLhs,

                                      const APInt &CRhs,

                                      InstCombiner::BuilderTy &Builder,

                                      const SimplifyQuery &Q) {

  assert(CtpopLhs->getIntrinsicID() == Intrinsic::ctpop &&

         "Non-ctpop intrin in ctpop fold");

  if (!CtpopLhs->hasOneUse())

    return nullptr;


  // Power of 2 test:

  //    isPow2OrZero : ctpop(X) u< 2

  //    isPow2       : ctpop(X) == 1

  //    NotPow2OrZero: ctpop(X) u> 1

  //    NotPow2      : ctpop(X) != 1

  // If we know any bit of X can be folded to:

  //    IsPow2       : X & (~Bit) == 0

  //    NotPow2      : X & (~Bit) != 0

  const ICmpInst::Predicate Pred = I.getPredicate();

  if (((I.isEquality() || Pred == ICmpInst::ICMP_UGT) && CRhs == 1) ||

      (Pred == ICmpInst::ICMP_ULT && CRhs == 2)) {

    Value *Op = CtpopLhs->getArgOperand(0);

    KnownBits OpKnown = computeKnownBits(Op, Q.DL, Q.AC, Q.CxtI, Q.DT);

    // No need to check for count > 1, that should be already constant folded.

    if (OpKnown.countMinPopulation() == 1) {

      Value *And = Builder.CreateAnd(

          Op, Constant::getIntegerValue(Op->getType(), ~(OpKnown.One)));

      return new ICmpInst(

          (Pred == ICmpInst::ICMP_EQ || Pred == ICmpInst::ICMP_ULT)

              ? ICmpInst::ICMP_EQ

              : ICmpInst::ICMP_NE,

          And, Constant::getNullValue(Op->getType()));

    }

  }


  return nullptr;

}


/// Fold an equality icmp with LLVM intrinsic and constant operand.


Instruction *InstCombinerImpl::foldICmpEqIntrinsicWithConstant(

    ICmpInst &Cmp, IntrinsicInst *II, const APInt &C) {

  Type *Ty = II->getType();

  unsigned BitWidth = C.getBitWidth();

  const ICmpInst::Predicate Pred = Cmp.getPredicate();


  switch (II->getIntrinsicID()) {

  case Intrinsic::abs:

    // abs(A) == 0  ->  A == 0

    // abs(A) == INT_MIN  ->  A == INT_MIN

    if (C.isZero() || C.isMinSignedValue())

      return new ICmpInst(Pred, II->getArgOperand(0), ConstantInt::get(Ty, C));

    break;


  case Intrinsic::bswap:

    // bswap(A) == C  ->  A == bswap(C)

    return new ICmpInst(Pred, II->getArgOperand(0),

                        ConstantInt::get(Ty, C.byteSwap()));


  case Intrinsic::bitreverse:

    // bitreverse(A) == C  ->  A == bitreverse(C)

    return new ICmpInst(Pred, II->getArgOperand(0),

                        ConstantInt::get(Ty, C.reverseBits()));


  case Intrinsic::ctlz:

  case Intrinsic::cttz: {

    // ctz(A) == bitwidth(A)  ->  A == 0 and likewise for !=

    if (C == BitWidth)

      return new ICmpInst(Pred, II->getArgOperand(0),

                          ConstantInt::getNullValue(Ty));


    // ctz(A) == C -> A & Mask1 == Mask2, where Mask2 only has bit C set

    // and Mask1 has bits 0..C+1 set. Similar for ctl, but for high bits.

    // Limit to one use to ensure we don't increase instruction count.

    unsigned Num = C.getLimitedValue(BitWidth);

    if (Num != BitWidth && II->hasOneUse()) {

      bool IsTrailing = II->getIntrinsicID() == Intrinsic::cttz;

      APInt Mask1 = IsTrailing ? APInt::getLowBitsSet(BitWidth, Num + 1)

                               : APInt::getHighBitsSet(BitWidth, Num + 1);

      APInt Mask2 = IsTrailing

                        ? APInt::getOneBitSet(BitWidth, Num)

                        : APInt::getOneBitSet(BitWidth, BitWidth - Num - 1);

      return new ICmpInst(Pred, Builder.CreateAnd(II->getArgOperand(0), Mask1),

                          ConstantInt::get(Ty, Mask2));

    }

    break;

  }


  case Intrinsic::ctpop: {

    // popcount(A) == 0  ->  A == 0 and likewise for !=

    // popcount(A) == bitwidth(A)  ->  A == -1 and likewise for !=

    bool IsZero = C.isZero();

    if (IsZero || C == BitWidth)

      return new ICmpInst(Pred, II->getArgOperand(0),

                          IsZero ? Constant::getNullValue(Ty)

                                 : Constant::getAllOnesValue(Ty));


    break;

  }


  case Intrinsic::fshl:

  case Intrinsic::fshr:

    if (II->getArgOperand(0) == II->getArgOperand(1)) {

      const APInt *RotAmtC;

      // ror(X, RotAmtC) == C --> X == rol(C, RotAmtC)

      // rol(X, RotAmtC) == C --> X == ror(C, RotAmtC)

      if (match(II->getArgOperand(2), m_APInt(RotAmtC)))

        return new ICmpInst(Pred, II->getArgOperand(0),

                            II->getIntrinsicID() == Intrinsic::fshl

                                ? ConstantInt::get(Ty, C.rotr(*RotAmtC))

                                : ConstantInt::get(Ty, C.rotl(*RotAmtC)));

    }

    break;


  case Intrinsic::umax:

  case Intrinsic::uadd_sat: {

    // uadd.sat(a, b) == 0  ->  (a | b) == 0

    // umax(a, b) == 0  ->  (a | b) == 0

    if (C.isZero() && II->hasOneUse()) {

      Value *Or = Builder.CreateOr(II->getArgOperand(0), II->getArgOperand(1));

      return new ICmpInst(Pred, Or, Constant::getNullValue(Ty));

    }

    break;

  }


  case Intrinsic::ssub_sat:

    // ssub.sat(a, b) == 0 -> a == b

    if (C.isZero())

      return new ICmpInst(Pred, II->getArgOperand(0), II->getArgOperand(1));

    break;

  case Intrinsic::usub_sat: {

    // usub.sat(a, b) == 0  ->  a <= b

    if (C.isZero()) {

      ICmpInst::Predicate NewPred =

          Pred == ICmpInst::ICMP_EQ ? ICmpInst::ICMP_ULE : ICmpInst::ICMP_UGT;

      return new ICmpInst(NewPred, II->getArgOperand(0), II->getArgOperand(1));

    }

    break;

  }

  default:

    break;

  }


  return nullptr;

}


/// Fold an icmp with LLVM intrinsics

static Instruction *


foldICmpIntrinsicWithIntrinsic(ICmpInst &Cmp,

                               InstCombiner::BuilderTy &Builder) {

  assert(Cmp.isEquality());


  ICmpInst::Predicate Pred = Cmp.getPredicate();

  Value *Op0 = Cmp.getOperand(0);

  Value *Op1 = Cmp.getOperand(1);

  const auto *IIOp0 = dyn_cast<IntrinsicInst>(Op0);

  const auto *IIOp1 = dyn_cast<IntrinsicInst>(Op1);

  if (!IIOp0 || !IIOp1 || IIOp0->getIntrinsicID() != IIOp1->getIntrinsicID())

    return nullptr;


  switch (IIOp0->getIntrinsicID()) {

  case Intrinsic::bswap:

  case Intrinsic::bitreverse:

    // If both operands are byte-swapped or bit-reversed, just compare the

    // original values.

    return new ICmpInst(Pred, IIOp0->getOperand(0), IIOp1->getOperand(0));

  case Intrinsic::fshl:

  case Intrinsic::fshr: {

    // If both operands are rotated by same amount, just compare the

    // original values.

    if (IIOp0->getOperand(0) != IIOp0->getOperand(1))

      break;

    if (IIOp1->getOperand(0) != IIOp1->getOperand(1))

      break;

    if (IIOp0->getOperand(2) == IIOp1->getOperand(2))

      return new ICmpInst(Pred, IIOp0->getOperand(0), IIOp1->getOperand(0));


    // rotate(X, AmtX) == rotate(Y, AmtY)

    //  -> rotate(X, AmtX - AmtY) == Y

    // Do this if either both rotates have one use or if only one has one use

    // and AmtX/AmtY are constants.

    unsigned OneUses = IIOp0->hasOneUse() + IIOp1->hasOneUse();

    if (OneUses == 2 ||

        (OneUses == 1 && match(IIOp0->getOperand(2), m_ImmConstant()) &&

         match(IIOp1->getOperand(2), m_ImmConstant()))) {

      Value *SubAmt =

          Builder.CreateSub(IIOp0->getOperand(2), IIOp1->getOperand(2));

      Value *CombinedRotate = Builder.CreateIntrinsic(

          Op0->getType(), IIOp0->getIntrinsicID(),

          {IIOp0->getOperand(0), IIOp0->getOperand(0), SubAmt});

      return new ICmpInst(Pred, IIOp1->getOperand(0), CombinedRotate);

    }

  } break;

  default:

    break;

  }


  return nullptr;

}


/// Try to fold integer comparisons with a constant operand: icmp Pred X, C

/// where X is some kind of instruction and C is AllowPoison.

/// TODO: Move more folds which allow poison to this function.

Instruction *


InstCombinerImpl::foldICmpInstWithConstantAllowPoison(ICmpInst &Cmp,

                                                      const APInt &C) {

  const ICmpInst::Predicate Pred = Cmp.getPredicate();

  if (auto *II = dyn_cast<IntrinsicInst>(Cmp.getOperand(0))) {

    switch (II->getIntrinsicID()) {

    default:

      break;

    case Intrinsic::fshl:

    case Intrinsic::fshr:

      if (Cmp.isEquality() && II->getArgOperand(0) == II->getArgOperand(1)) {

        // (rot X, ?) == 0/-1 --> X == 0/-1

        if (C.isZero() || C.isAllOnes())

          return new ICmpInst(Pred, II->getArgOperand(0), Cmp.getOperand(1));

      }

      break;

    }

  }


  return nullptr;

}


/// Fold an icmp with BinaryOp and constant operand: icmp Pred BO, C.


Instruction *InstCombinerImpl::foldICmpBinOpWithConstant(ICmpInst &Cmp,

                                                         BinaryOperator *BO,

                                                         const APInt &C) {

  switch (BO->getOpcode()) {

  case Instruction::Xor:

    if (Instruction *I = foldICmpXorConstant(Cmp, BO, C))

      return I;

    break;

  case Instruction::And:

    if (Instruction *I = foldICmpAndConstant(Cmp, BO, C))

      return I;

    break;

  case Instruction::Or:

    if (Instruction *I = foldICmpOrConstant(Cmp, BO, C))

      return I;

    break;

  case Instruction::Mul:

    if (Instruction *I = foldICmpMulConstant(Cmp, BO, C))

      return I;

    break;

  case Instruction::Shl:

    if (Instruction *I = foldICmpShlConstant(Cmp, BO, C))

      return I;

    break;

  case Instruction::LShr:

  case Instruction::AShr:

    if (Instruction *I = foldICmpShrConstant(Cmp, BO, C))

      return I;

    break;

  case Instruction::SRem:

    if (Instruction *I = foldICmpSRemConstant(Cmp, BO, C))

      return I;

    break;

  case Instruction::UDiv:

    if (Instruction *I = foldICmpUDivConstant(Cmp, BO, C))

      return I;

    [[fallthrough]];

  case Instruction::SDiv:

    if (Instruction *I = foldICmpDivConstant(Cmp, BO, C))

      return I;

    break;

  case Instruction::Sub:

    if (Instruction *I = foldICmpSubConstant(Cmp, BO, C))

      return I;

    break;

  case Instruction::Add:

    if (Instruction *I = foldICmpAddConstant(Cmp, BO, C))

      return I;

    break;

  default:

    break;

  }


  // TODO: These folds could be refactored to be part of the above calls.

  if (Instruction *I = foldICmpBinOpEqualityWithConstant(Cmp, BO, C))

    return I;


  // Fall back to handling `icmp pred (select A ? C1 : C2) binop (select B ? C3

  // : C4), C5` pattern, by computing a truth table of the four constant

  // variants.

  return foldICmpBinOpWithConstantViaTruthTable(Cmp, BO, C);

}


static Instruction *


foldICmpUSubSatOrUAddSatWithConstant(CmpPredicate Pred, SaturatingInst *II,

                                     const APInt &C,

                                     InstCombiner::BuilderTy &Builder) {

  // This transform may end up producing more than one instruction for the

  // intrinsic, so limit it to one user of the intrinsic.

  if (!II->hasOneUse())

    return nullptr;


  // Let Y        = [add/sub]_sat(X, C) pred C2

  //     SatVal   = The saturating value for the operation

  //     WillWrap = Whether or not the operation will underflow / overflow

  // => Y = (WillWrap ? SatVal : (X binop C)) pred C2

  // => Y = WillWrap ? (SatVal pred C2) : ((X binop C) pred C2)

  //

  // When (SatVal pred C2) is true, then

  //    Y = WillWrap ? true : ((X binop C) pred C2)

  // => Y = WillWrap || ((X binop C) pred C2)

  // else

  //    Y =  WillWrap ? false : ((X binop C) pred C2)

  // => Y = !WillWrap ?  ((X binop C) pred C2) : false

  // => Y = !WillWrap && ((X binop C) pred C2)

  Value *Op0 = II->getOperand(0);

  Value *Op1 = II->getOperand(1);


  const APInt *COp1;

  // This transform only works when the intrinsic has an integral constant or

  // splat vector as the second operand.

  if (!match(Op1, m_APInt(COp1)))

    return nullptr;


  APInt SatVal;

  switch (II->getIntrinsicID()) {

  default:

    llvm_unreachable(

        "This function only works with usub_sat and uadd_sat for now!");

  case Intrinsic::uadd_sat:

    SatVal = APInt::getAllOnes(C.getBitWidth());

    break;

  case Intrinsic::usub_sat:

    SatVal = APInt::getZero(C.getBitWidth());

    break;

  }


  // Check (SatVal pred C2)

  bool SatValCheck = ICmpInst::compare(SatVal, C, Pred);


  // !WillWrap.

  ConstantRange C1 = ConstantRange::makeExactNoWrapRegion(

      II->getBinaryOp(), *COp1, II->getNoWrapKind());


  // WillWrap.

  if (SatValCheck)

    C1 = C1.inverse();


  ConstantRange C2 = ConstantRange::makeExactICmpRegion(Pred, C);

  if (II->getBinaryOp() == Instruction::Add)

    C2 = C2.sub(*COp1);

  else

    C2 = C2.add(*COp1);


  Instruction::BinaryOps CombiningOp =

      SatValCheck ? Instruction::BinaryOps::Or : Instruction::BinaryOps::And;


  std::optional<ConstantRange> Combination;

  if (CombiningOp == Instruction::BinaryOps::Or)

    Combination = C1.exactUnionWith(C2);

  else /* CombiningOp == Instruction::BinaryOps::And */

    Combination = C1.exactIntersectWith(C2);


  if (!Combination)

    return nullptr;


  CmpInst::Predicate EquivPred;

  APInt EquivInt;

  APInt EquivOffset;


  Combination->getEquivalentICmp(EquivPred, EquivInt, EquivOffset);


  return new ICmpInst(

      EquivPred,

      Builder.CreateAdd(Op0, ConstantInt::get(Op1->getType(), EquivOffset)),

      ConstantInt::get(Op1->getType(), EquivInt));

}


static Instruction *


foldICmpOfCmpIntrinsicWithConstant(CmpPredicate Pred, IntrinsicInst *I,

                                   const APInt &C,

                                   InstCombiner::BuilderTy &Builder) {

  std::optional<ICmpInst::Predicate> NewPredicate = std::nullopt;

  switch (Pred) {

  case ICmpInst::ICMP_EQ:

  case ICmpInst::ICMP_NE:

    if (C.isZero())

      NewPredicate = Pred;

    else if (C.isOne())

      NewPredicate =

          Pred == ICmpInst::ICMP_EQ ? ICmpInst::ICMP_UGT : ICmpInst::ICMP_ULE;

    else if (C.isAllOnes())

      NewPredicate =

          Pred == ICmpInst::ICMP_EQ ? ICmpInst::ICMP_ULT : ICmpInst::ICMP_UGE;

    break;


  case ICmpInst::ICMP_SGT:

    if (C.isAllOnes())

      NewPredicate = ICmpInst::ICMP_UGE;

    else if (C.isZero())

      NewPredicate = ICmpInst::ICMP_UGT;

    break;


  case ICmpInst::ICMP_SLT:

    if (C.isZero())

      NewPredicate = ICmpInst::ICMP_ULT;

    else if (C.isOne())

      NewPredicate = ICmpInst::ICMP_ULE;

    break;


  case ICmpInst::ICMP_ULT:

    if (C.ugt(1))

      NewPredicate = ICmpInst::ICMP_UGE;

    break;


  case ICmpInst::ICMP_UGT:

    if (!C.isZero() && !C.isAllOnes())

      NewPredicate = ICmpInst::ICMP_ULT;

    break;


  default:

    break;

  }


  if (!NewPredicate)

    return nullptr;


  if (I->getIntrinsicID() == Intrinsic::scmp)

    NewPredicate = ICmpInst::getSignedPredicate(*NewPredicate);

  Value *LHS = I->getOperand(0);

  Value *RHS = I->getOperand(1);

  return new ICmpInst(*NewPredicate, LHS, RHS);

}


/// Fold an icmp with LLVM intrinsic and constant operand: icmp Pred II, C.


Instruction *InstCombinerImpl::foldICmpIntrinsicWithConstant(ICmpInst &Cmp,

                                                             IntrinsicInst *II,

                                                             const APInt &C) {

  ICmpInst::Predicate Pred = Cmp.getPredicate();


  // Handle folds that apply for any kind of icmp.

  switch (II->getIntrinsicID()) {

  default:

    break;

  case Intrinsic::uadd_sat:

  case Intrinsic::usub_sat:

    if (auto *Folded = foldICmpUSubSatOrUAddSatWithConstant(

            Pred, cast<SaturatingInst>(II), C, Builder))

      return Folded;

    break;

  case Intrinsic::ctpop: {

    const SimplifyQuery Q = SQ.getWithInstruction(&Cmp);

    if (Instruction *R = foldCtpopPow2Test(Cmp, II, C, Builder, Q))

      return R;

  } break;

  case Intrinsic::scmp:

  case Intrinsic::ucmp:

    if (auto *Folded = foldICmpOfCmpIntrinsicWithConstant(Pred, II, C, Builder))

      return Folded;

    break;

  }


  if (Cmp.isEquality())

    return foldICmpEqIntrinsicWithConstant(Cmp, II, C);


  Type *Ty = II->getType();

  unsigned BitWidth = C.getBitWidth();

  switch (II->getIntrinsicID()) {

  case Intrinsic::ctpop: {

    // (ctpop X > BitWidth - 1) --> X == -1

    Value *X = II->getArgOperand(0);

    if (C == BitWidth - 1 && Pred == ICmpInst::ICMP_UGT)

      return CmpInst::Create(Instruction::ICmp, ICmpInst::ICMP_EQ, X,

                             ConstantInt::getAllOnesValue(Ty));

    // (ctpop X < BitWidth) --> X != -1

    if (C == BitWidth && Pred == ICmpInst::ICMP_ULT)

      return CmpInst::Create(Instruction::ICmp, ICmpInst::ICMP_NE, X,

                             ConstantInt::getAllOnesValue(Ty));

    break;

  }

  case Intrinsic::ctlz: {

    // ctlz(0bXXXXXXXX) > 3 -> 0bXXXXXXXX < 0b00010000

    if (Pred == ICmpInst::ICMP_UGT && C.ult(BitWidth)) {

      unsigned Num = C.getLimitedValue();

      APInt Limit = APInt::getOneBitSet(BitWidth, BitWidth - Num - 1);

      return CmpInst::Create(Instruction::ICmp, ICmpInst::ICMP_ULT,

                             II->getArgOperand(0), ConstantInt::get(Ty, Limit));

    }


    // ctlz(0bXXXXXXXX) < 3 -> 0bXXXXXXXX > 0b00011111

    if (Pred == ICmpInst::ICMP_ULT && C.uge(1) && C.ule(BitWidth)) {

      unsigned Num = C.getLimitedValue();

      APInt Limit = APInt::getLowBitsSet(BitWidth, BitWidth - Num);

      return CmpInst::Create(Instruction::ICmp, ICmpInst::ICMP_UGT,

                             II->getArgOperand(0), ConstantInt::get(Ty, Limit));

    }

    break;

  }

  case Intrinsic::cttz: {

    // Limit to one use to ensure we don't increase instruction count.

    if (!II->hasOneUse())

      return nullptr;


    // cttz(0bXXXXXXXX) > 3 -> 0bXXXXXXXX & 0b00001111 == 0

    if (Pred == ICmpInst::ICMP_UGT && C.ult(BitWidth)) {

      APInt Mask = APInt::getLowBitsSet(BitWidth, C.getLimitedValue() + 1);

      return CmpInst::Create(Instruction::ICmp, ICmpInst::ICMP_EQ,

                             Builder.CreateAnd(II->getArgOperand(0), Mask),

                             ConstantInt::getNullValue(Ty));

    }


    // cttz(0bXXXXXXXX) < 3 -> 0bXXXXXXXX & 0b00000111 != 0

    if (Pred == ICmpInst::ICMP_ULT && C.uge(1) && C.ule(BitWidth)) {

      APInt Mask = APInt::getLowBitsSet(BitWidth, C.getLimitedValue());

      return CmpInst::Create(Instruction::ICmp, ICmpInst::ICMP_NE,

                             Builder.CreateAnd(II->getArgOperand(0), Mask),

                             ConstantInt::getNullValue(Ty));

    }

    break;

  }

  case Intrinsic::ssub_sat:

    // ssub.sat(a, b) spred 0 -> a spred b

    if (ICmpInst::isSigned(Pred)) {

      if (C.isZero())

        return new ICmpInst(Pred, II->getArgOperand(0), II->getArgOperand(1));

      // X s<= 0 is cannonicalized to X s< 1

      if (Pred == ICmpInst::ICMP_SLT && C.isOne())

        return new ICmpInst(ICmpInst::ICMP_SLE, II->getArgOperand(0),

                            II->getArgOperand(1));

      // X s>= 0 is cannonicalized to X s> -1

      if (Pred == ICmpInst::ICMP_SGT && C.isAllOnes())

        return new ICmpInst(ICmpInst::ICMP_SGE, II->getArgOperand(0),

                            II->getArgOperand(1));

    }

    break;

  default:

    break;

  }


  return nullptr;

}


/// Handle icmp with constant (but not simple integer constant) RHS.


Instruction *InstCombinerImpl::foldICmpInstWithConstantNotInt(ICmpInst &I) {

  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);

  Constant *RHSC = dyn_cast<Constant>(Op1);

  Instruction *LHSI = dyn_cast<Instruction>(Op0);

  if (!RHSC || !LHSI)

    return nullptr;


  switch (LHSI->getOpcode()) {

  case Instruction::IntToPtr:

    // icmp pred inttoptr(X), null -> icmp pred X, 0

    if (RHSC->isNullValue() &&

        DL.getIntPtrType(RHSC->getType()) == LHSI->getOperand(0)->getType())

      return new ICmpInst(

          I.getPredicate(), LHSI->getOperand(0),

          Constant::getNullValue(LHSI->getOperand(0)->getType()));

    break;


  case Instruction::Load:

    // Try to optimize things like "A[i] > 4" to index computations.

    if (GetElementPtrInst *GEP =

            dyn_cast<GetElementPtrInst>(LHSI->getOperand(0)))

      if (Instruction *Res =

              foldCmpLoadFromIndexedGlobal(cast<LoadInst>(LHSI), GEP, I))

        return Res;

    break;

  }


  return nullptr;

}


Instruction *InstCombinerImpl::foldSelectICmp(CmpPredicate Pred, SelectInst *SI,

                                              Value *RHS, const ICmpInst &I) {

  // Try to fold the comparison into the select arms, which will cause the

  // select to be converted into a logical and/or.

  auto SimplifyOp = [&](Value *Op, bool SelectCondIsTrue) -> Value * {

    if (Value *Res = simplifyICmpInst(Pred, Op, RHS, SQ))

      return Res;

    if (std::optional<bool> Impl = isImpliedCondition(

            SI->getCondition(), Pred, Op, RHS, DL, SelectCondIsTrue))

      return ConstantInt::get(I.getType(), *Impl);

    return nullptr;

  };


  ConstantInt *CI = nullptr;

  Value *Op1 = SimplifyOp(SI->getOperand(1), true);

  if (Op1)

    CI = dyn_cast<ConstantInt>(Op1);


  Value *Op2 = SimplifyOp(SI->getOperand(2), false);

  if (Op2)

    CI = dyn_cast<ConstantInt>(Op2);


  auto Simplifies = [&](Value *Op, unsigned Idx) {

    // A comparison of ucmp/scmp with a constant will fold into an icmp.

    const APInt *Dummy;

    return Op ||

           (isa<CmpIntrinsic>(SI->getOperand(Idx)) &&

            SI->getOperand(Idx)->hasOneUse() && match(RHS, m_APInt(Dummy)));

  };


  // We only want to perform this transformation if it will not lead to

  // additional code. This is true if either both sides of the select

  // fold to a constant (in which case the icmp is replaced with a select

  // which will usually simplify) or this is the only user of the

  // select (in which case we are trading a select+icmp for a simpler

  // select+icmp) or all uses of the select can be replaced based on

  // dominance information ("Global cases").

  bool Transform = false;

  if (Op1 && Op2)

    Transform = true;

  else if (Simplifies(Op1, 1) || Simplifies(Op2, 2)) {

    // Local case

    if (SI->hasOneUse())

      Transform = true;

    // Global cases

    else if (CI && !CI->isZero())

      // When Op1 is constant try replacing select with second operand.

      // Otherwise Op2 is constant and try replacing select with first

      // operand.

      Transform = replacedSelectWithOperand(SI, &I, Op1 ? 2 : 1);

  }

  if (Transform) {

    if (!Op1)

      Op1 = Builder.CreateICmp(Pred, SI->getOperand(1), RHS, I.getName());

    if (!Op2)

      Op2 = Builder.CreateICmp(Pred, SI->getOperand(2), RHS, I.getName());

    return SelectInst::Create(SI->getOperand(0), Op1, Op2);

  }


  return nullptr;

}


// Returns whether V is a Mask ((X + 1) & X == 0) or ~Mask (-Pow2OrZero)


static bool isMaskOrZero(const Value *V, bool Not, const SimplifyQuery &Q,

                         unsigned Depth = 0) {

  if (Not ? match(V, m_NegatedPower2OrZero()) : match(V, m_LowBitMaskOrZero()))

    return true;

  if (V->getType()->getScalarSizeInBits() == 1)

    return true;

  if (Depth++ >= MaxAnalysisRecursionDepth)

    return false;

  Value *X;

  const Instruction *I = dyn_cast<Instruction>(V);

  if (!I)

    return false;

  switch (I->getOpcode()) {

  case Instruction::ZExt:

    // ZExt(Mask) is a Mask.

    return !Not && isMaskOrZero(I->getOperand(0), Not, Q, Depth);

  case Instruction::SExt:

    // SExt(Mask) is a Mask.

    // SExt(~Mask) is a ~Mask.

    return isMaskOrZero(I->getOperand(0), Not, Q, Depth);

  case Instruction::And:

  case Instruction::Or:

    // Mask0 | Mask1 is a Mask.

    // Mask0 & Mask1 is a Mask.

    // ~Mask0 | ~Mask1 is a ~Mask.

    // ~Mask0 & ~Mask1 is a ~Mask.

    return isMaskOrZero(I->getOperand(1), Not, Q, Depth) &&

           isMaskOrZero(I->getOperand(0), Not, Q, Depth);

  case Instruction::Xor:

    if (match(V, m_Not(m_Value(X))))

      return isMaskOrZero(X, !Not, Q, Depth);


    // (X ^ -X) is a ~Mask

    if (Not)

      return match(V, m_c_Xor(m_Value(X), m_Neg(m_Deferred(X))));

    // (X ^ (X - 1)) is a Mask

    else

      return match(V, m_c_Xor(m_Value(X), m_Add(m_Deferred(X), m_AllOnes())));

  case Instruction::Select:

    // c ? Mask0 : Mask1 is a Mask.

    return isMaskOrZero(I->getOperand(1), Not, Q, Depth) &&

           isMaskOrZero(I->getOperand(2), Not, Q, Depth);

  case Instruction::Shl:

    // (~Mask) << X is a ~Mask.

    return Not && isMaskOrZero(I->getOperand(0), Not, Q, Depth);

  case Instruction::LShr:

    // Mask >> X is a Mask.

    return !Not && isMaskOrZero(I->getOperand(0), Not, Q, Depth);

  case Instruction::AShr:

    // Mask s>> X is a Mask.

    // ~Mask s>> X is a ~Mask.

    return isMaskOrZero(I->getOperand(0), Not, Q, Depth);

  case Instruction::Add:

    // Pow2 - 1 is a Mask.

    if (!Not && match(I->getOperand(1), m_AllOnes()))

      return isKnownToBeAPowerOfTwo(I->getOperand(0), Q.DL, /*OrZero*/ true,

                                    Q.AC, Q.CxtI, Q.DT, Depth);

    break;

  case Instruction::Sub:

    // -Pow2 is a ~Mask.

    if (Not && match(I->getOperand(0), m_Zero()))

      return isKnownToBeAPowerOfTwo(I->getOperand(1), Q.DL, /*OrZero*/ true,

                                    Q.AC, Q.CxtI, Q.DT, Depth);

    break;

  case Instruction::Call: {

    if (auto *II = dyn_cast<IntrinsicInst>(I)) {

      switch (II->getIntrinsicID()) {

        // min/max(Mask0, Mask1) is a Mask.

        // min/max(~Mask0, ~Mask1) is a ~Mask.

      case Intrinsic::umax:

      case Intrinsic::smax:

      case Intrinsic::umin:

      case Intrinsic::smin:

        return isMaskOrZero(II->getArgOperand(1), Not, Q, Depth) &&

               isMaskOrZero(II->getArgOperand(0), Not, Q, Depth);


        // In the context of masks, bitreverse(Mask) == ~Mask

      case Intrinsic::bitreverse:

        return isMaskOrZero(II->getArgOperand(0), !Not, Q, Depth);

      default:

        break;

      }

    }

    break;

  }

  default:

    break;

  }

  return false;

}


/// Some comparisons can be simplified.

/// In this case, we are looking for comparisons that look like

/// a check for a lossy truncation.

/// Folds:

///   icmp SrcPred (x & Mask), x    to    icmp DstPred x, Mask

///   icmp SrcPred (x & ~Mask), ~Mask    to    icmp DstPred x, ~Mask

///   icmp eq/ne (x & ~Mask), 0     to    icmp DstPred x, Mask

///   icmp eq/ne (~x | Mask), -1     to    icmp DstPred x, Mask

/// Where Mask is some pattern that produces all-ones in low bits:

///    (-1 >> y)

///    ((-1 << y) >> y)     <- non-canonical, has extra uses

///   ~(-1 << y)

///    ((1 << y) + (-1))    <- non-canonical, has extra uses

/// The Mask can be a constant, too.

/// For some predicates, the operands are commutative.

/// For others, x can only be on a specific side.


static Value *foldICmpWithLowBitMaskedVal(CmpPredicate Pred, Value *Op0,

                                          Value *Op1, const SimplifyQuery &Q,

                                          InstCombiner &IC) {


  ICmpInst::Predicate DstPred;

  switch (Pred) {

  case ICmpInst::Predicate::ICMP_EQ:

    //  x & Mask == x

    //  x & ~Mask == 0

    //  ~x | Mask == -1

    //    ->    x u<= Mask

    //  x & ~Mask == ~Mask

    //    ->    ~Mask u<= x

    DstPred = ICmpInst::Predicate::ICMP_ULE;

    break;

  case ICmpInst::Predicate::ICMP_NE:

    //  x & Mask != x

    //  x & ~Mask != 0

    //  ~x | Mask != -1

    //    ->    x u> Mask

    //  x & ~Mask != ~Mask

    //    ->    ~Mask u> x

    DstPred = ICmpInst::Predicate::ICMP_UGT;

    break;

  case ICmpInst::Predicate::ICMP_ULT:

    //  x & Mask u< x

    //    -> x u> Mask

    //  x & ~Mask u< ~Mask

    //    -> ~Mask u> x

    DstPred = ICmpInst::Predicate::ICMP_UGT;

    break;

  case ICmpInst::Predicate::ICMP_UGE:

    //  x & Mask u>= x

    //    -> x u<= Mask

    //  x & ~Mask u>= ~Mask

    //    -> ~Mask u<= x

    DstPred = ICmpInst::Predicate::ICMP_ULE;

    break;

  case ICmpInst::Predicate::ICMP_SLT:

    //  x & Mask s< x [iff Mask s>= 0]

    //    -> x s> Mask

    //  x & ~Mask s< ~Mask [iff ~Mask != 0]

    //    -> ~Mask s> x

    DstPred = ICmpInst::Predicate::ICMP_SGT;

    break;

  case ICmpInst::Predicate::ICMP_SGE:

    //  x & Mask s>= x [iff Mask s>= 0]

    //    -> x s<= Mask

    //  x & ~Mask s>= ~Mask [iff ~Mask != 0]

    //    -> ~Mask s<= x

    DstPred = ICmpInst::Predicate::ICMP_SLE;

    break;

  default:

    // We don't support sgt,sle

    // ult/ugt are simplified to true/false respectively.

    return nullptr;

  }


  Value *X, *M;

  // Put search code in lambda for early positive returns.

  auto IsLowBitMask = [&]() {

    if (match(Op0, m_c_And(m_Specific(Op1), m_Value(M)))) {

      X = Op1;

      // Look for: x & Mask pred x

      if (isMaskOrZero(M, /*Not=*/false, Q)) {

        return !ICmpInst::isSigned(Pred) ||

               (match(M, m_NonNegative()) || isKnownNonNegative(M, Q));

      }


      // Look for: x & ~Mask pred ~Mask

      if (isMaskOrZero(X, /*Not=*/true, Q)) {

        return !ICmpInst::isSigned(Pred) || isKnownNonZero(X, Q);

      }

      return false;

    }

    if (ICmpInst::isEquality(Pred) && match(Op1, m_AllOnes()) &&

        match(Op0, m_OneUse(m_Or(m_Value(X), m_Value(M))))) {


      auto Check = [&]() {

        // Look for: ~x | Mask == -1

        if (isMaskOrZero(M, /*Not=*/false, Q)) {

          if (Value *NotX =

                  IC.getFreelyInverted(X, X->hasOneUse(), &IC.Builder)) {

            X = NotX;

            return true;

          }

        }

        return false;

      };

      if (Check())

        return true;

      std::swap(X, M);

      return Check();

    }

    if (ICmpInst::isEquality(Pred) && match(Op1, m_Zero()) &&

        match(Op0, m_OneUse(m_And(m_Value(X), m_Value(M))))) {

      auto Check = [&]() {

        // Look for: x & ~Mask == 0

        if (isMaskOrZero(M, /*Not=*/true, Q)) {

          if (Value *NotM =

                  IC.getFreelyInverted(M, M->hasOneUse(), &IC.Builder)) {

            M = NotM;

            return true;

          }

        }

        return false;

      };

      if (Check())

        return true;

      std::swap(X, M);

      return Check();

    }

    return false;

  };


  if (!IsLowBitMask())

    return nullptr;


  return IC.Builder.CreateICmp(DstPred, X, M);

}


/// Some comparisons can be simplified.

/// In this case, we are looking for comparisons that look like

/// a check for a lossy signed truncation.

/// Folds:   (MaskedBits is a constant.)

///   ((%x << MaskedBits) a>> MaskedBits) SrcPred %x

/// Into:

///   (add %x, (1 << (KeptBits-1))) DstPred (1 << KeptBits)

/// Where  KeptBits = bitwidth(%x) - MaskedBits

static Value *


foldICmpWithTruncSignExtendedVal(ICmpInst &I,

                                 InstCombiner::BuilderTy &Builder) {

  CmpPredicate SrcPred;

  Value *X;

  const APInt *C0, *C1; // FIXME: non-splats, potentially with undef.

  // We are ok with 'shl' having multiple uses, but 'ashr' must be one-use.

  if (!match(&I, m_c_ICmp(SrcPred,

                          m_OneUse(m_AShr(m_Shl(m_Value(X), m_APInt(C0)),

                                          m_APInt(C1))),

                          m_Deferred(X))))

    return nullptr;


  // Potential handling of non-splats: for each element:

  //  * if both are undef, replace with constant 0.

  //    Because (1<<0) is OK and is 1, and ((1<<0)>>1) is also OK and is 0.

  //  * if both are not undef, and are different, bailout.

  //  * else, only one is undef, then pick the non-undef one.


  // The shift amount must be equal.

  if (*C0 != *C1)

    return nullptr;

  const APInt &MaskedBits = *C0;

  assert(MaskedBits != 0 && "shift by zero should be folded away already.");


  ICmpInst::Predicate DstPred;

  switch (SrcPred) {

  case ICmpInst::Predicate::ICMP_EQ:

    // ((%x << MaskedBits) a>> MaskedBits) == %x

    //   =>

    // (add %x, (1 << (KeptBits-1))) u< (1 << KeptBits)

    DstPred = ICmpInst::Predicate::ICMP_ULT;

    break;

  case ICmpInst::Predicate::ICMP_NE:

    // ((%x << MaskedBits) a>> MaskedBits) != %x

    //   =>

    // (add %x, (1 << (KeptBits-1))) u>= (1 << KeptBits)

    DstPred = ICmpInst::Predicate::ICMP_UGE;

    break;

  // FIXME: are more folds possible?

  default:

    return nullptr;

  }


  auto *XType = X->getType();

  const unsigned XBitWidth = XType->getScalarSizeInBits();

  const APInt BitWidth = APInt(XBitWidth, XBitWidth);

  assert(BitWidth.ugt(MaskedBits) && "shifts should leave some bits untouched");


  // KeptBits = bitwidth(%x) - MaskedBits

  const APInt KeptBits = BitWidth - MaskedBits;

  assert(KeptBits.ugt(0) && KeptBits.ult(BitWidth) && "unreachable");

  // ICmpCst = (1 << KeptBits)

  const APInt ICmpCst = APInt(XBitWidth, 1).shl(KeptBits);

  assert(ICmpCst.isPowerOf2());

  // AddCst = (1 << (KeptBits-1))

  const APInt AddCst = ICmpCst.lshr(1);

  assert(AddCst.ult(ICmpCst) && AddCst.isPowerOf2());


  // T0 = add %x, AddCst

  Value *T0 = Builder.CreateAdd(X, ConstantInt::get(XType, AddCst));

  // T1 = T0 DstPred ICmpCst

  Value *T1 = Builder.CreateICmp(DstPred, T0, ConstantInt::get(XType, ICmpCst));


  return T1;

}


// Given pattern:

//   icmp eq/ne (and ((x shift Q), (y oppositeshift K))), 0

// we should move shifts to the same hand of 'and', i.e. rewrite as

//   icmp eq/ne (and (x shift (Q+K)), y), 0  iff (Q+K) u< bitwidth(x)

// We are only interested in opposite logical shifts here.

// One of the shifts can be truncated.

// If we can, we want to end up creating 'lshr' shift.

static Value *


foldShiftIntoShiftInAnotherHandOfAndInICmp(ICmpInst &I, const SimplifyQuery SQ,

                                           InstCombiner::BuilderTy &Builder) {

  if (!I.isEquality() || !match(I.getOperand(1), m_Zero()) ||

      !I.getOperand(0)->hasOneUse())

    return nullptr;


  auto m_AnyLogicalShift = m_LogicalShift(m_Value(), m_Value());


  // Look for an 'and' of two logical shifts, one of which may be truncated.

  // We use m_TruncOrSelf() on the RHS to correctly handle commutative case.

  Instruction *XShift, *MaybeTruncation, *YShift;

  if (!match(

          I.getOperand(0),

          m_c_And(m_CombineAnd(m_AnyLogicalShift, m_Instruction(XShift)),

                  m_CombineAnd(m_TruncOrSelf(m_CombineAnd(

                                   m_AnyLogicalShift, m_Instruction(YShift))),

                               m_Instruction(MaybeTruncation)))))

    return nullptr;


  // We potentially looked past 'trunc', but only when matching YShift,

  // therefore YShift must have the widest type.

  Instruction *WidestShift = YShift;

  // Therefore XShift must have the shallowest type.

  // Or they both have identical types if there was no truncation.

  Instruction *NarrowestShift = XShift;


  Type *WidestTy = WidestShift->getType();

  Type *NarrowestTy = NarrowestShift->getType();

  assert(NarrowestTy == I.getOperand(0)->getType() &&

         "We did not look past any shifts while matching XShift though.");

  bool HadTrunc = WidestTy != I.getOperand(0)->getType();


  // If YShift is a 'lshr', swap the shifts around.

  if (match(YShift, m_LShr(m_Value(), m_Value())))

    std::swap(XShift, YShift);


  // The shifts must be in opposite directions.

  auto XShiftOpcode = XShift->getOpcode();

  if (XShiftOpcode == YShift->getOpcode())

    return nullptr; // Do not care about same-direction shifts here.


  Value *X, *XShAmt, *Y, *YShAmt;

  match(XShift, m_BinOp(m_Value(X), m_ZExtOrSelf(m_Value(XShAmt))));

  match(YShift, m_BinOp(m_Value(Y), m_ZExtOrSelf(m_Value(YShAmt))));


  // If one of the values being shifted is a constant, then we will end with

  // and+icmp, and [zext+]shift instrs will be constant-folded. If they are not,

  // however, we will need to ensure that we won't increase instruction count.

  if (!isa<Constant>(X) && !isa<Constant>(Y)) {

    // At least one of the hands of the 'and' should be one-use shift.

    if (!match(I.getOperand(0),

               m_c_And(m_OneUse(m_AnyLogicalShift), m_Value())))

      return nullptr;

    if (HadTrunc) {

      // Due to the 'trunc', we will need to widen X. For that either the old

      // 'trunc' or the shift amt in the non-truncated shift should be one-use.

      if (!MaybeTruncation->hasOneUse() &&

          !NarrowestShift->getOperand(1)->hasOneUse())

        return nullptr;

    }

  }


  // We have two shift amounts from two different shifts. The types of those

  // shift amounts may not match. If that's the case let's bailout now.

  if (XShAmt->getType() != YShAmt->getType())

    return nullptr;


  // As input, we have the following pattern:

  //   icmp eq/ne (and ((x shift Q), (y oppositeshift K))), 0

  // We want to rewrite that as:

  //   icmp eq/ne (and (x shift (Q+K)), y), 0  iff (Q+K) u< bitwidth(x)

  // While we know that originally (Q+K) would not overflow

  // (because  2 * (N-1) u<= iN -1), we have looked past extensions of

  // shift amounts. so it may now overflow in smaller bitwidth.

  // To ensure that does not happen, we need to ensure that the total maximal

  // shift amount is still representable in that smaller bit width.

  unsigned MaximalPossibleTotalShiftAmount =

      (WidestTy->getScalarSizeInBits() - 1) +

      (NarrowestTy->getScalarSizeInBits() - 1);

  APInt MaximalRepresentableShiftAmount =

      APInt::getAllOnes(XShAmt->getType()->getScalarSizeInBits());

  if (MaximalRepresentableShiftAmount.ult(MaximalPossibleTotalShiftAmount))

    return nullptr;


  // Can we fold (XShAmt+YShAmt) ?

  auto *NewShAmt = dyn_cast_or_null<Constant>(

      simplifyAddInst(XShAmt, YShAmt, /*isNSW=*/false,

                      /*isNUW=*/false, SQ.getWithInstruction(&I)));

  if (!NewShAmt)

    return nullptr;

  if (NewShAmt->getType() != WidestTy) {

    NewShAmt =

        ConstantFoldCastOperand(Instruction::ZExt, NewShAmt, WidestTy, SQ.DL);

    if (!NewShAmt)

      return nullptr;

  }

  unsigned WidestBitWidth = WidestTy->getScalarSizeInBits();


  // Is the new shift amount smaller than the bit width?

  // FIXME: could also rely on ConstantRange.

  if (!match(NewShAmt,

             m_SpecificInt_ICMP(ICmpInst::Predicate::ICMP_ULT,

                                APInt(WidestBitWidth, WidestBitWidth))))

    return nullptr;


  // An extra legality check is needed if we had trunc-of-lshr.

  if (HadTrunc && match(WidestShift, m_LShr(m_Value(), m_Value()))) {

    auto CanFold = [NewShAmt, WidestBitWidth, NarrowestShift, SQ,

                    WidestShift]() {

      // It isn't obvious whether it's worth it to analyze non-constants here.

      // Also, let's basically give up on non-splat cases, pessimizing vectors.

      // If *any* of these preconditions matches we can perform the fold.

      Constant *NewShAmtSplat = NewShAmt->getType()->isVectorTy()

                                    ? NewShAmt->getSplatValue()

                                    : NewShAmt;

      // If it's edge-case shift (by 0 or by WidestBitWidth-1) we can fold.

      if (NewShAmtSplat &&

          (NewShAmtSplat->isNullValue() ||

           NewShAmtSplat->getUniqueInteger() == WidestBitWidth - 1))

        return true;

      // We consider *min* leading zeros so a single outlier

      // blocks the transform as opposed to allowing it.

      if (auto *C = dyn_cast<Constant>(NarrowestShift->getOperand(0))) {

        KnownBits Known = computeKnownBits(C, SQ.DL);

        unsigned MinLeadZero = Known.countMinLeadingZeros();

        // If the value being shifted has at most lowest bit set we can fold.

        unsigned MaxActiveBits = Known.getBitWidth() - MinLeadZero;

        if (MaxActiveBits <= 1)

          return true;

        // Precondition:  NewShAmt u<= countLeadingZeros(C)

        if (NewShAmtSplat && NewShAmtSplat->getUniqueInteger().ule(MinLeadZero))

          return true;

      }

      if (auto *C = dyn_cast<Constant>(WidestShift->getOperand(0))) {

        KnownBits Known = computeKnownBits(C, SQ.DL);

        unsigned MinLeadZero = Known.countMinLeadingZeros();

        // If the value being shifted has at most lowest bit set we can fold.

        unsigned MaxActiveBits = Known.getBitWidth() - MinLeadZero;

        if (MaxActiveBits <= 1)

          return true;

        // Precondition:  ((WidestBitWidth-1)-NewShAmt) u<= countLeadingZeros(C)

        if (NewShAmtSplat) {

          APInt AdjNewShAmt =

              (WidestBitWidth - 1) - NewShAmtSplat->getUniqueInteger();

          if (AdjNewShAmt.ule(MinLeadZero))

            return true;

        }

      }

      return false; // Can't tell if it's ok.

    };

    if (!CanFold())

      return nullptr;

  }


  // All good, we can do this fold.

  X = Builder.CreateZExt(X, WidestTy);

  Y = Builder.CreateZExt(Y, WidestTy);

  // The shift is the same that was for X.

  Value *T0 = XShiftOpcode == Instruction::BinaryOps::LShr

                  ? Builder.CreateLShr(X, NewShAmt)

                  : Builder.CreateShl(X, NewShAmt);

  Value *T1 = Builder.CreateAnd(T0, Y);

  return Builder.CreateICmp(I.getPredicate(), T1,

                            Constant::getNullValue(WidestTy));

}


/// Fold

///   (-1 u/ x) u< y

///   ((x * y) ?/ x) != y

/// to

///   @llvm.?mul.with.overflow(x, y) plus extraction of overflow bit

/// Note that the comparison is commutative, while inverted (u>=, ==) predicate

/// will mean that we are looking for the opposite answer.


Value *InstCombinerImpl::foldMultiplicationOverflowCheck(ICmpInst &I) {

  CmpPredicate Pred;

  Value *X, *Y;

  Instruction *Mul;

  Instruction *Div;

  bool NeedNegation;

  // Look for: (-1 u/ x) u</u>= y

  if (!I.isEquality() &&

      match(&I, m_c_ICmp(Pred,

                         m_CombineAnd(m_OneUse(m_UDiv(m_AllOnes(), m_Value(X))),

                                      m_Instruction(Div)),

                         m_Value(Y)))) {

    Mul = nullptr;


    // Are we checking that overflow does not happen, or does happen?

    switch (Pred) {

    case ICmpInst::Predicate::ICMP_ULT:

      NeedNegation = false;

      break; // OK

    case ICmpInst::Predicate::ICMP_UGE:

      NeedNegation = true;

      break; // OK

    default:

      return nullptr; // Wrong predicate.

    }

  } else // Look for: ((x * y) / x) !=/== y

    if (I.isEquality() &&

        match(&I, m_c_ICmp(Pred, m_Value(Y),

                           m_CombineAnd(m_OneUse(m_IDiv(

                                            m_CombineAnd(m_c_Mul(m_Deferred(Y),

                                                                 m_Value(X)),

                                                         m_Instruction(Mul)),

                                            m_Deferred(X))),

                                        m_Instruction(Div))))) {

      NeedNegation = Pred == ICmpInst::Predicate::ICMP_EQ;

    } else

      return nullptr;


  BuilderTy::InsertPointGuard Guard(Builder);

  // If the pattern included (x * y), we'll want to insert new instructions

  // right before that original multiplication so that we can replace it.

  bool MulHadOtherUses = Mul && !Mul->hasOneUse();

  if (MulHadOtherUses)

    Builder.SetInsertPoint(Mul);


  CallInst *Call = Builder.CreateIntrinsic(

      Div->getOpcode() == Instruction::UDiv ? Intrinsic::umul_with_overflow

                                            : Intrinsic::smul_with_overflow,

      X->getType(), {X, Y}, /*FMFSource=*/nullptr, "mul");


  // If the multiplication was used elsewhere, to ensure that we don't leave

  // "duplicate" instructions, replace uses of that original multiplication

  // with the multiplication result from the with.overflow intrinsic.

  if (MulHadOtherUses)

    replaceInstUsesWith(*Mul, Builder.CreateExtractValue(Call, 0, "mul.val"));


  Value *Res = Builder.CreateExtractValue(Call, 1, "mul.ov");

  if (NeedNegation) // This technically increases instruction count.

    Res = Builder.CreateNot(Res, "mul.not.ov");


  // If we replaced the mul, erase it. Do this after all uses of Builder,

  // as the mul is used as insertion point.

  if (MulHadOtherUses)

    eraseInstFromFunction(*Mul);


  return Res;

}


static Instruction *foldICmpXNegX(ICmpInst &I,

                                  InstCombiner::BuilderTy &Builder) {

  CmpPredicate Pred;

  Value *X;

  if (match(&I, m_c_ICmp(Pred, m_NSWNeg(m_Value(X)), m_Deferred(X)))) {


    if (ICmpInst::isSigned(Pred))

      Pred = ICmpInst::getSwappedPredicate(Pred);

    else if (ICmpInst::isUnsigned(Pred))

      Pred = ICmpInst::getSignedPredicate(Pred);

    // else for equality-comparisons just keep the predicate.


    return ICmpInst::Create(Instruction::ICmp, Pred, X,

                            Constant::getNullValue(X->getType()), I.getName());

  }


  // A value is not equal to its negation unless that value is 0 or

  // MinSignedValue, ie: a != -a --> (a & MaxSignedVal) != 0

  if (match(&I, m_c_ICmp(Pred, m_OneUse(m_Neg(m_Value(X))), m_Deferred(X))) &&

      ICmpInst::isEquality(Pred)) {

    Type *Ty = X->getType();

    uint32_t BitWidth = Ty->getScalarSizeInBits();

    Constant *MaxSignedVal =

        ConstantInt::get(Ty, APInt::getSignedMaxValue(BitWidth));

    Value *And = Builder.CreateAnd(X, MaxSignedVal);

    Constant *Zero = Constant::getNullValue(Ty);

    return CmpInst::Create(Instruction::ICmp, Pred, And, Zero);

  }


  return nullptr;

}


static Instruction *foldICmpAndXX(ICmpInst &I, const SimplifyQuery &Q,

                                  InstCombinerImpl &IC) {

  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1), *A;

  // Normalize and operand as operand 0.

  CmpInst::Predicate Pred = I.getPredicate();

  if (match(Op1, m_c_And(m_Specific(Op0), m_Value()))) {

    std::swap(Op0, Op1);

    Pred = ICmpInst::getSwappedPredicate(Pred);

  }


  if (!match(Op0, m_c_And(m_Specific(Op1), m_Value(A))))

    return nullptr;


  // (icmp (X & Y) u< X --> (X & Y) != X

  if (Pred == ICmpInst::ICMP_ULT)

    return new ICmpInst(ICmpInst::ICMP_NE, Op0, Op1);


  // (icmp (X & Y) u>= X --> (X & Y) == X

  if (Pred == ICmpInst::ICMP_UGE)

    return new ICmpInst(ICmpInst::ICMP_EQ, Op0, Op1);


  if (ICmpInst::isEquality(Pred) && Op0->hasOneUse()) {

    // icmp (X & Y) eq/ne Y --> (X | ~Y) eq/ne -1 if Y is freely invertible and

    // Y is non-constant. If Y is constant the `X & C == C` form is preferable

    // so don't do this fold.

    if (!match(Op1, m_ImmConstant()))

      if (auto *NotOp1 =

              IC.getFreelyInverted(Op1, !Op1->hasNUsesOrMore(3), &IC.Builder))

        return new ICmpInst(Pred, IC.Builder.CreateOr(A, NotOp1),

                            Constant::getAllOnesValue(Op1->getType()));

    // icmp (X & Y) eq/ne Y --> (~X & Y) eq/ne 0 if X  is freely invertible.

    if (auto *NotA = IC.getFreelyInverted(A, A->hasOneUse(), &IC.Builder))

      return new ICmpInst(Pred, IC.Builder.CreateAnd(Op1, NotA),

                          Constant::getNullValue(Op1->getType()));

  }


  if (!ICmpInst::isSigned(Pred))

    return nullptr;


  KnownBits KnownY = IC.computeKnownBits(A, &I);

  // (X & NegY) spred X --> (X & NegY) upred X

  if (KnownY.isNegative())

    return new ICmpInst(ICmpInst::getUnsignedPredicate(Pred), Op0, Op1);


  if (Pred != ICmpInst::ICMP_SLE && Pred != ICmpInst::ICMP_SGT)

    return nullptr;


  if (KnownY.isNonNegative())

    // (X & PosY) s<= X --> X s>= 0

    // (X & PosY) s> X --> X s< 0

    return new ICmpInst(ICmpInst::getSwappedPredicate(Pred), Op1,

                        Constant::getNullValue(Op1->getType()));


  if (isKnownNegative(Op1, IC.getSimplifyQuery().getWithInstruction(&I)))

    // (NegX & Y) s<= NegX --> Y s< 0

    // (NegX & Y) s> NegX --> Y s>= 0

    return new ICmpInst(ICmpInst::getFlippedStrictnessPredicate(Pred), A,

                        Constant::getNullValue(A->getType()));


  return nullptr;

}


static Instruction *foldICmpOrXX(ICmpInst &I, const SimplifyQuery &Q,

                                 InstCombinerImpl &IC) {

  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1), *A;


  // Normalize or operand as operand 0.

  CmpInst::Predicate Pred = I.getPredicate();

  if (match(Op1, m_c_Or(m_Specific(Op0), m_Value(A)))) {

    std::swap(Op0, Op1);

    Pred = ICmpInst::getSwappedPredicate(Pred);

  } else if (!match(Op0, m_c_Or(m_Specific(Op1), m_Value(A)))) {

    return nullptr;

  }


  // icmp (X | Y) u<= X --> (X | Y) == X

  if (Pred == ICmpInst::ICMP_ULE)

    return new ICmpInst(ICmpInst::ICMP_EQ, Op0, Op1);


  // icmp (X | Y) u> X --> (X | Y) != X

  if (Pred == ICmpInst::ICMP_UGT)

    return new ICmpInst(ICmpInst::ICMP_NE, Op0, Op1);


  if (ICmpInst::isEquality(Pred) && Op0->hasOneUse()) {

    // icmp (X | Y) eq/ne Y --> (X & ~Y) eq/ne 0 if Y is freely invertible

    if (Value *NotOp1 = IC.getFreelyInverted(

            Op1, !isa<Constant>(Op1) && !Op1->hasNUsesOrMore(3), &IC.Builder))

      return new ICmpInst(Pred, IC.Builder.CreateAnd(A, NotOp1),

                          Constant::getNullValue(Op1->getType()));

    // icmp (X | Y) eq/ne Y --> (~X | Y) eq/ne -1 if X  is freely invertible.

    if (Value *NotA = IC.getFreelyInverted(A, A->hasOneUse(), &IC.Builder))

      return new ICmpInst(Pred, IC.Builder.CreateOr(Op1, NotA),

                          Constant::getAllOnesValue(Op1->getType()));

  }

  return nullptr;

}


static Instruction *foldICmpXorXX(ICmpInst &I, const SimplifyQuery &Q,

                                  InstCombinerImpl &IC) {

  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1), *A;

  // Normalize xor operand as operand 0.

  CmpInst::Predicate Pred = I.getPredicate();

  if (match(Op1, m_c_Xor(m_Specific(Op0), m_Value()))) {

    std::swap(Op0, Op1);

    Pred = ICmpInst::getSwappedPredicate(Pred);

  }

  if (!match(Op0, m_c_Xor(m_Specific(Op1), m_Value(A))))

    return nullptr;


  // icmp (X ^ Y_NonZero) u>= X --> icmp (X ^ Y_NonZero) u> X

  // icmp (X ^ Y_NonZero) u<= X --> icmp (X ^ Y_NonZero) u< X

  // icmp (X ^ Y_NonZero) s>= X --> icmp (X ^ Y_NonZero) s> X

  // icmp (X ^ Y_NonZero) s<= X --> icmp (X ^ Y_NonZero) s< X

  CmpInst::Predicate PredOut = CmpInst::getStrictPredicate(Pred);

  if (PredOut != Pred && isKnownNonZero(A, Q))

    return new ICmpInst(PredOut, Op0, Op1);


  // These transform work when A is negative.

  // X s< X^A, X s<= X^A, X u> X^A, X u>= X^A  --> X s< 0

  // X s> X^A, X s>= X^A, X u< X^A, X u<= X^A  --> X s>= 0

  if (match(A, m_Negative())) {

    CmpInst::Predicate NewPred;

    switch (ICmpInst::getStrictPredicate(Pred)) {

    default:

      return nullptr;

    case ICmpInst::ICMP_SLT:

    case ICmpInst::ICMP_UGT:

      NewPred = ICmpInst::ICMP_SLT;

      break;

    case ICmpInst::ICMP_SGT:

    case ICmpInst::ICMP_ULT:

      NewPred = ICmpInst::ICMP_SGE;

      break;

    }

    Constant *Const = Constant::getNullValue(Op0->getType());

    return new ICmpInst(NewPred, Op0, Const);

  }


  return nullptr;

}


/// Return true if X is a multiple of C.

/// TODO: Handle non-power-of-2 factors.


static bool isMultipleOf(Value *X, const APInt &C, const SimplifyQuery &Q) {

  if (C.isOne())

    return true;


  if (!C.isPowerOf2())

    return false;


  return MaskedValueIsZero(X, C - 1, Q);

}


/// Try to fold icmp (binop), X or icmp X, (binop).

/// TODO: A large part of this logic is duplicated in InstSimplify's

/// simplifyICmpWithBinOp(). We should be able to share that and avoid the code

/// duplication.


Instruction *InstCombinerImpl::foldICmpBinOp(ICmpInst &I,

                                             const SimplifyQuery &SQ) {

  const SimplifyQuery Q = SQ.getWithInstruction(&I);

  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);


  // Special logic for binary operators.

  BinaryOperator *BO0 = dyn_cast<BinaryOperator>(Op0);

  BinaryOperator *BO1 = dyn_cast<BinaryOperator>(Op1);

  if (!BO0 && !BO1)

    return nullptr;


  if (Instruction *NewICmp = foldICmpXNegX(I, Builder))

    return NewICmp;


  const CmpInst::Predicate Pred = I.getPredicate();

  Value *X;


  // Convert add-with-unsigned-overflow comparisons into a 'not' with compare.

  // (Op1 + X) u</u>= Op1 --> ~Op1 u</u>= X

  if (match(Op0, m_OneUse(m_c_Add(m_Specific(Op1), m_Value(X)))) &&

      (Pred == ICmpInst::ICMP_ULT || Pred == ICmpInst::ICMP_UGE))

    return new ICmpInst(Pred, Builder.CreateNot(Op1), X);

  // Op0 u>/u<= (Op0 + X) --> X u>/u<= ~Op0

  if (match(Op1, m_OneUse(m_c_Add(m_Specific(Op0), m_Value(X)))) &&

      (Pred == ICmpInst::ICMP_UGT || Pred == ICmpInst::ICMP_ULE))

    return new ICmpInst(Pred, X, Builder.CreateNot(Op0));


  {

    // (Op1 + X) + C u</u>= Op1 --> ~C - X u</u>= Op1

    Constant *C;

    if (match(Op0, m_OneUse(m_Add(m_c_Add(m_Specific(Op1), m_Value(X)),

                                  m_ImmConstant(C)))) &&

        (Pred == ICmpInst::ICMP_ULT || Pred == ICmpInst::ICMP_UGE)) {

      Constant *C2 = ConstantExpr::getNot(C);

      return new ICmpInst(Pred, Builder.CreateSub(C2, X), Op1);

    }

    // Op0 u>/u<= (Op0 + X) + C --> Op0 u>/u<= ~C - X

    if (match(Op1, m_OneUse(m_Add(m_c_Add(m_Specific(Op0), m_Value(X)),

                                  m_ImmConstant(C)))) &&

        (Pred == ICmpInst::ICMP_UGT || Pred == ICmpInst::ICMP_ULE)) {

      Constant *C2 = ConstantExpr::getNot(C);

      return new ICmpInst(Pred, Op0, Builder.CreateSub(C2, X));

    }

  }


  // (icmp eq/ne (X, -P2), INT_MIN)

  //  -> (icmp slt/sge X, INT_MIN + P2)

  if (ICmpInst::isEquality(Pred) && BO0 &&

      match(I.getOperand(1), m_SignMask()) &&

      match(BO0, m_And(m_Value(), m_NegatedPower2OrZero()))) {

    // Will Constant fold.

    Value *NewC = Builder.CreateSub(I.getOperand(1), BO0->getOperand(1));

    return new ICmpInst(Pred == ICmpInst::ICMP_EQ ? ICmpInst::ICMP_SLT

                                                  : ICmpInst::ICMP_SGE,

                        BO0->getOperand(0), NewC);

  }


  {

    // Similar to above: an unsigned overflow comparison may use offset + mask:

    // ((Op1 + C) & C) u<  Op1 --> Op1 != 0

    // ((Op1 + C) & C) u>= Op1 --> Op1 == 0

    // Op0 u>  ((Op0 + C) & C) --> Op0 != 0

    // Op0 u<= ((Op0 + C) & C) --> Op0 == 0

    BinaryOperator *BO;

    const APInt *C;

    if ((Pred == ICmpInst::ICMP_ULT || Pred == ICmpInst::ICMP_UGE) &&

        match(Op0, m_And(m_BinOp(BO), m_LowBitMask(C))) &&

        match(BO, m_Add(m_Specific(Op1), m_SpecificIntAllowPoison(*C)))) {

      CmpInst::Predicate NewPred =

          Pred == ICmpInst::ICMP_ULT ? ICmpInst::ICMP_NE : ICmpInst::ICMP_EQ;

      Constant *Zero = ConstantInt::getNullValue(Op1->getType());

      return new ICmpInst(NewPred, Op1, Zero);

    }


    if ((Pred == ICmpInst::ICMP_UGT || Pred == ICmpInst::ICMP_ULE) &&

        match(Op1, m_And(m_BinOp(BO), m_LowBitMask(C))) &&

        match(BO, m_Add(m_Specific(Op0), m_SpecificIntAllowPoison(*C)))) {

      CmpInst::Predicate NewPred =

          Pred == ICmpInst::ICMP_UGT ? ICmpInst::ICMP_NE : ICmpInst::ICMP_EQ;

      Constant *Zero = ConstantInt::getNullValue(Op1->getType());

      return new ICmpInst(NewPred, Op0, Zero);

    }

  }


  bool NoOp0WrapProblem = false, NoOp1WrapProblem = false;

  bool Op0HasNUW = false, Op1HasNUW = false;

  bool Op0HasNSW = false, Op1HasNSW = false;

  // Analyze the case when either Op0 or Op1 is an add instruction.

  // Op0 = A + B (or A and B are null); Op1 = C + D (or C and D are null).

  auto hasNoWrapProblem = [](const BinaryOperator &BO, CmpInst::Predicate Pred,

                             bool &HasNSW, bool &HasNUW) -> bool {

    if (isa<OverflowingBinaryOperator>(BO)) {

      HasNUW = BO.hasNoUnsignedWrap();

      HasNSW = BO.hasNoSignedWrap();

      return ICmpInst::isEquality(Pred) ||

             (CmpInst::isUnsigned(Pred) && HasNUW) ||

             (CmpInst::isSigned(Pred) && HasNSW);

    } else if (BO.getOpcode() == Instruction::Or) {

      HasNUW = true;

      HasNSW = true;

      return true;

    } else {

      return false;

    }

  };

  Value *A = nullptr, *B = nullptr, *C = nullptr, *D = nullptr;


  if (BO0) {

    match(BO0, m_AddLike(m_Value(A), m_Value(B)));

    NoOp0WrapProblem = hasNoWrapProblem(*BO0, Pred, Op0HasNSW, Op0HasNUW);

  }

  if (BO1) {

    match(BO1, m_AddLike(m_Value(C), m_Value(D)));

    NoOp1WrapProblem = hasNoWrapProblem(*BO1, Pred, Op1HasNSW, Op1HasNUW);

  }


  // icmp (A+B), A -> icmp B, 0 for equalities or if there is no overflow.

  // icmp (A+B), B -> icmp A, 0 for equalities or if there is no overflow.

  if ((A == Op1 || B == Op1) && NoOp0WrapProblem)

    return new ICmpInst(Pred, A == Op1 ? B : A,

                        Constant::getNullValue(Op1->getType()));


  // icmp C, (C+D) -> icmp 0, D for equalities or if there is no overflow.

  // icmp D, (C+D) -> icmp 0, C for equalities or if there is no overflow.

  if ((C == Op0 || D == Op0) && NoOp1WrapProblem)

    return new ICmpInst(Pred, Constant::getNullValue(Op0->getType()),

                        C == Op0 ? D : C);


  // icmp (A+B), (A+D) -> icmp B, D for equalities or if there is no overflow.

  if (A && C && (A == C || A == D || B == C || B == D) && NoOp0WrapProblem &&

      NoOp1WrapProblem) {

    // Determine Y and Z in the form icmp (X+Y), (X+Z).

    Value *Y, *Z;

    if (A == C) {

      // C + B == C + D  ->  B == D

      Y = B;

      Z = D;

    } else if (A == D) {

      // D + B == C + D  ->  B == C

      Y = B;

      Z = C;

    } else if (B == C) {

      // A + C == C + D  ->  A == D

      Y = A;

      Z = D;

    } else {

      assert(B == D);

      // A + D == C + D  ->  A == C

      Y = A;

      Z = C;

    }

    return new ICmpInst(Pred, Y, Z);

  }


  if (ICmpInst::isRelational(Pred)) {

    // Return if both X and Y is divisible by Z/-Z.

    // TODO: Generalize to check if (X - Y) is divisible by Z/-Z.

    auto ShareCommonDivisor = [&Q](Value *X, Value *Y, Value *Z,

                                   bool IsNegative) -> bool {

      const APInt *OffsetC;

      if (!match(Z, m_APInt(OffsetC)))

        return false;


      // Fast path for Z == 1/-1.

      if (IsNegative ? OffsetC->isAllOnes() : OffsetC->isOne())

        return true;


      APInt C = *OffsetC;

      if (IsNegative)

        C.negate();

      // Note: -INT_MIN is also negative.

      if (!C.isStrictlyPositive())

        return false;


      return isMultipleOf(X, C, Q) && isMultipleOf(Y, C, Q);

    };


    // TODO: The subtraction-related identities shown below also hold, but

    // canonicalization from (X -nuw 1) to (X + -1) means that the combinations

    // wouldn't happen even if they were implemented.

    //

    // icmp ult (A - 1), Op1 -> icmp ule A, Op1

    // icmp uge (A - 1), Op1 -> icmp ugt A, Op1

    // icmp ugt Op0, (C - 1) -> icmp uge Op0, C

    // icmp ule Op0, (C - 1) -> icmp ult Op0, C


    // icmp slt (A + -1), Op1 -> icmp sle A, Op1

    // icmp sge (A + -1), Op1 -> icmp sgt A, Op1

    // icmp sle (A + 1), Op1 -> icmp slt A, Op1

    // icmp sgt (A + 1), Op1 -> icmp sge A, Op1

    // icmp ule (A + 1), Op0 -> icmp ult A, Op1

    // icmp ugt (A + 1), Op0 -> icmp uge A, Op1

    if (A && NoOp0WrapProblem &&

        ShareCommonDivisor(A, Op1, B,

                           ICmpInst::isLT(Pred) || ICmpInst::isGE(Pred)))

      return new ICmpInst(ICmpInst::getFlippedStrictnessPredicate(Pred), A,

                          Op1);


    // icmp sgt Op0, (C + -1) -> icmp sge Op0, C

    // icmp sle Op0, (C + -1) -> icmp slt Op0, C

    // icmp sge Op0, (C + 1) -> icmp sgt Op0, C

    // icmp slt Op0, (C + 1) -> icmp sle Op0, C

    // icmp uge Op0, (C + 1) -> icmp ugt Op0, C

    // icmp ult Op0, (C + 1) -> icmp ule Op0, C

    if (C && NoOp1WrapProblem &&

        ShareCommonDivisor(Op0, C, D,

                           ICmpInst::isGT(Pred) || ICmpInst::isLE(Pred)))

      return new ICmpInst(ICmpInst::getFlippedStrictnessPredicate(Pred), Op0,

                          C);

  }


  // if C1 has greater magnitude than C2:

  //  icmp (A + C1), (C + C2) -> icmp (A + C3), C

  //  s.t. C3 = C1 - C2

  //

  // if C2 has greater magnitude than C1:

  //  icmp (A + C1), (C + C2) -> icmp A, (C + C3)

  //  s.t. C3 = C2 - C1

  if (A && C && NoOp0WrapProblem && NoOp1WrapProblem &&

      (BO0->hasOneUse() || BO1->hasOneUse()) && !I.isUnsigned()) {

    const APInt *AP1, *AP2;

    // TODO: Support non-uniform vectors.

    // TODO: Allow poison passthrough if B or D's element is poison.

    if (match(B, m_APIntAllowPoison(AP1)) &&

        match(D, m_APIntAllowPoison(AP2)) &&

        AP1->isNegative() == AP2->isNegative()) {

      APInt AP1Abs = AP1->abs();

      APInt AP2Abs = AP2->abs();

      if (AP1Abs.uge(AP2Abs)) {

        APInt Diff = *AP1 - *AP2;

        Constant *C3 = Constant::getIntegerValue(BO0->getType(), Diff);

        Value *NewAdd = Builder.CreateAdd(

            A, C3, "", Op0HasNUW && Diff.ule(*AP1), Op0HasNSW);

        return new ICmpInst(Pred, NewAdd, C);

      } else {

        APInt Diff = *AP2 - *AP1;

        Constant *C3 = Constant::getIntegerValue(BO0->getType(), Diff);

        Value *NewAdd = Builder.CreateAdd(

            C, C3, "", Op1HasNUW && Diff.ule(*AP2), Op1HasNSW);

        return new ICmpInst(Pred, A, NewAdd);

      }

    }

    Constant *Cst1, *Cst2;

    if (match(B, m_ImmConstant(Cst1)) && match(D, m_ImmConstant(Cst2)) &&

        ICmpInst::isEquality(Pred)) {

      Constant *Diff = ConstantExpr::getSub(Cst2, Cst1);

      Value *NewAdd = Builder.CreateAdd(C, Diff);

      return new ICmpInst(Pred, A, NewAdd);

    }

  }


  // Analyze the case when either Op0 or Op1 is a sub instruction.

  // Op0 = A - B (or A and B are null); Op1 = C - D (or C and D are null).

  A = nullptr;

  B = nullptr;

  C = nullptr;

  D = nullptr;

  if (BO0 && BO0->getOpcode() == Instruction::Sub) {

    A = BO0->getOperand(0);

    B = BO0->getOperand(1);

  }

  if (BO1 && BO1->getOpcode() == Instruction::Sub) {

    C = BO1->getOperand(0);

    D = BO1->getOperand(1);

  }


  // icmp (A-B), A -> icmp 0, B for equalities or if there is no overflow.

  if (A == Op1 && NoOp0WrapProblem)

    return new ICmpInst(Pred, Constant::getNullValue(Op1->getType()), B);

  // icmp C, (C-D) -> icmp D, 0 for equalities or if there is no overflow.

  if (C == Op0 && NoOp1WrapProblem)

    return new ICmpInst(Pred, D, Constant::getNullValue(Op0->getType()));


  // Convert sub-with-unsigned-overflow comparisons into a comparison of args.

  // (A - B) u>/u<= A --> B u>/u<= A

  if (A == Op1 && (Pred == ICmpInst::ICMP_UGT || Pred == ICmpInst::ICMP_ULE))

    return new ICmpInst(Pred, B, A);

  // C u</u>= (C - D) --> C u</u>= D

  if (C == Op0 && (Pred == ICmpInst::ICMP_ULT || Pred == ICmpInst::ICMP_UGE))

    return new ICmpInst(Pred, C, D);

  // (A - B) u>=/u< A --> B u>/u<= A  iff B != 0

  if (A == Op1 && (Pred == ICmpInst::ICMP_UGE || Pred == ICmpInst::ICMP_ULT) &&

      isKnownNonZero(B, Q))

    return new ICmpInst(CmpInst::getFlippedStrictnessPredicate(Pred), B, A);

  // C u<=/u> (C - D) --> C u</u>= D  iff B != 0

  if (C == Op0 && (Pred == ICmpInst::ICMP_ULE || Pred == ICmpInst::ICMP_UGT) &&

      isKnownNonZero(D, Q))

    return new ICmpInst(CmpInst::getFlippedStrictnessPredicate(Pred), C, D);


  // icmp (A-B), (C-B) -> icmp A, C for equalities or if there is no overflow.

  if (B && D && B == D && NoOp0WrapProblem && NoOp1WrapProblem)

    return new ICmpInst(Pred, A, C);


  // icmp (A-B), (A-D) -> icmp D, B for equalities or if there is no overflow.

  if (A && C && A == C && NoOp0WrapProblem && NoOp1WrapProblem)

    return new ICmpInst(Pred, D, B);


  // icmp (0-X) < cst --> x > -cst

  if (NoOp0WrapProblem && ICmpInst::isSigned(Pred)) {

    Value *X;

    if (match(BO0, m_Neg(m_Value(X))))

      if (Constant *RHSC = dyn_cast<Constant>(Op1))

        if (RHSC->isNotMinSignedValue())

          return new ICmpInst(I.getSwappedPredicate(), X,

                              ConstantExpr::getNeg(RHSC));

  }


  if (Instruction *R = foldICmpXorXX(I, Q, *this))

    return R;

  if (Instruction *R = foldICmpOrXX(I, Q, *this))

    return R;


  {

    // Try to remove shared multiplier from comparison:

    // X * Z pred Y * Z

    Value *X, *Y, *Z;

    if ((match(Op0, m_Mul(m_Value(X), m_Value(Z))) &&

         match(Op1, m_c_Mul(m_Specific(Z), m_Value(Y)))) ||

        (match(Op0, m_Mul(m_Value(Z), m_Value(X))) &&

         match(Op1, m_c_Mul(m_Specific(Z), m_Value(Y))))) {

      if (ICmpInst::isSigned(Pred)) {

        if (Op0HasNSW && Op1HasNSW) {

          KnownBits ZKnown = computeKnownBits(Z, &I);

          if (ZKnown.isStrictlyPositive())

            return new ICmpInst(Pred, X, Y);

          if (ZKnown.isNegative())

            return new ICmpInst(ICmpInst::getSwappedPredicate(Pred), X, Y);

          Value *LessThan = simplifyICmpInst(ICmpInst::ICMP_SLT, X, Y,

                                             SQ.getWithInstruction(&I));

          if (LessThan && match(LessThan, m_One()))

            return new ICmpInst(ICmpInst::getSwappedPredicate(Pred), Z,

                                Constant::getNullValue(Z->getType()));

          Value *GreaterThan = simplifyICmpInst(ICmpInst::ICMP_SGT, X, Y,

                                                SQ.getWithInstruction(&I));

          if (GreaterThan && match(GreaterThan, m_One()))

            return new ICmpInst(Pred, Z, Constant::getNullValue(Z->getType()));

        }

      } else {

        bool NonZero;

        if (ICmpInst::isEquality(Pred)) {

          // If X != Y, fold (X *nw Z) eq/ne (Y *nw Z) -> Z eq/ne 0

          if (((Op0HasNSW && Op1HasNSW) || (Op0HasNUW && Op1HasNUW)) &&

              isKnownNonEqual(X, Y, SQ))

            return new ICmpInst(Pred, Z, Constant::getNullValue(Z->getType()));


          KnownBits ZKnown = computeKnownBits(Z, &I);

          // if Z % 2 != 0

          //    X * Z eq/ne Y * Z -> X eq/ne Y

          if (ZKnown.countMaxTrailingZeros() == 0)

            return new ICmpInst(Pred, X, Y);

          NonZero = !ZKnown.One.isZero() || isKnownNonZero(Z, Q);

          // if Z != 0 and nsw(X * Z) and nsw(Y * Z)

          //    X * Z eq/ne Y * Z -> X eq/ne Y

          if (NonZero && BO0 && BO1 && Op0HasNSW && Op1HasNSW)

            return new ICmpInst(Pred, X, Y);

        } else

          NonZero = isKnownNonZero(Z, Q);


        // If Z != 0 and nuw(X * Z) and nuw(Y * Z)

        //    X * Z u{lt/le/gt/ge}/eq/ne Y * Z -> X u{lt/le/gt/ge}/eq/ne Y

        if (NonZero && BO0 && BO1 && Op0HasNUW && Op1HasNUW)

          return new ICmpInst(Pred, X, Y);

      }

    }

  }


  BinaryOperator *SRem = nullptr;

  // icmp (srem X, Y), Y

  if (BO0 && BO0->getOpcode() == Instruction::SRem && Op1 == BO0->getOperand(1))

    SRem = BO0;

  // icmp Y, (srem X, Y)

  else if (BO1 && BO1->getOpcode() == Instruction::SRem &&

           Op0 == BO1->getOperand(1))

    SRem = BO1;

  if (SRem) {

    // We don't check hasOneUse to avoid increasing register pressure because

    // the value we use is the same value this instruction was already using.

    switch (SRem == BO0 ? ICmpInst::getSwappedPredicate(Pred) : Pred) {

    default:

      break;

    case ICmpInst::ICMP_EQ:

      return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));

    case ICmpInst::ICMP_NE:

      return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));

    case ICmpInst::ICMP_SGT:

    case ICmpInst::ICMP_SGE:

      return new ICmpInst(ICmpInst::ICMP_SGT, SRem->getOperand(1),

                          Constant::getAllOnesValue(SRem->getType()));

    case ICmpInst::ICMP_SLT:

    case ICmpInst::ICMP_SLE:

      return new ICmpInst(ICmpInst::ICMP_SLT, SRem->getOperand(1),

                          Constant::getNullValue(SRem->getType()));

    }

  }


  if (BO0 && BO1 && BO0->getOpcode() == BO1->getOpcode() &&

      (BO0->hasOneUse() || BO1->hasOneUse()) &&

      BO0->getOperand(1) == BO1->getOperand(1)) {

    switch (BO0->getOpcode()) {

    default:

      break;

    case Instruction::Add:

    case Instruction::Sub:

    case Instruction::Xor: {

      if (I.isEquality()) // a+x icmp eq/ne b+x --> a icmp b

        return new ICmpInst(Pred, BO0->getOperand(0), BO1->getOperand(0));


      const APInt *C;

      if (match(BO0->getOperand(1), m_APInt(C))) {

        // icmp u/s (a ^ signmask), (b ^ signmask) --> icmp s/u a, b

        if (C->isSignMask()) {

          ICmpInst::Predicate NewPred = I.getFlippedSignednessPredicate();

          return new ICmpInst(NewPred, BO0->getOperand(0), BO1->getOperand(0));

        }


        // icmp u/s (a ^ maxsignval), (b ^ maxsignval) --> icmp s/u' a, b

        if (BO0->getOpcode() == Instruction::Xor && C->isMaxSignedValue()) {

          ICmpInst::Predicate NewPred = I.getFlippedSignednessPredicate();

          NewPred = I.getSwappedPredicate(NewPred);

          return new ICmpInst(NewPred, BO0->getOperand(0), BO1->getOperand(0));

        }

      }

      break;

    }

    case Instruction::Mul: {

      if (!I.isEquality())

        break;


      const APInt *C;

      if (match(BO0->getOperand(1), m_APInt(C)) && !C->isZero() &&

          !C->isOne()) {

        // icmp eq/ne (X * C), (Y * C) --> icmp (X & Mask), (Y & Mask)

        // Mask = -1 >> count-trailing-zeros(C).

        if (unsigned TZs = C->countr_zero()) {

          Constant *Mask = ConstantInt::get(

              BO0->getType(),

              APInt::getLowBitsSet(C->getBitWidth(), C->getBitWidth() - TZs));

          Value *And1 = Builder.CreateAnd(BO0->getOperand(0), Mask);

          Value *And2 = Builder.CreateAnd(BO1->getOperand(0), Mask);

          return new ICmpInst(Pred, And1, And2);

        }

      }

      break;

    }

    case Instruction::UDiv:

    case Instruction::LShr:

      if (I.isSigned() || !BO0->isExact() || !BO1->isExact())

        break;

      return new ICmpInst(Pred, BO0->getOperand(0), BO1->getOperand(0));


    case Instruction::SDiv:

      if (!(I.isEquality() || match(BO0->getOperand(1), m_NonNegative())) ||

          !BO0->isExact() || !BO1->isExact())

        break;

      return new ICmpInst(Pred, BO0->getOperand(0), BO1->getOperand(0));


    case Instruction::AShr:

      if (!BO0->isExact() || !BO1->isExact())

        break;

      return new ICmpInst(Pred, BO0->getOperand(0), BO1->getOperand(0));


    case Instruction::Shl: {

      bool NUW = Op0HasNUW && Op1HasNUW;

      bool NSW = Op0HasNSW && Op1HasNSW;

      if (!NUW && !NSW)

        break;

      if (!NSW && I.isSigned())

        break;

      return new ICmpInst(Pred, BO0->getOperand(0), BO1->getOperand(0));

    }

    }

  }


  if (BO0) {

    // Transform  A & (L - 1) `ult` L --> L != 0

    auto LSubOne = m_Add(m_Specific(Op1), m_AllOnes());

    auto BitwiseAnd = m_c_And(m_Value(), LSubOne);


    if (match(BO0, BitwiseAnd) && Pred == ICmpInst::ICMP_ULT) {

      auto *Zero = Constant::getNullValue(BO0->getType());

      return new ICmpInst(ICmpInst::ICMP_NE, Op1, Zero);

    }

  }


  // For unsigned predicates / eq / ne:

  // icmp pred (x << 1), x --> icmp getSignedPredicate(pred) x, 0

  // icmp pred x, (x << 1) --> icmp getSignedPredicate(pred) 0, x

  if (!ICmpInst::isSigned(Pred)) {

    if (match(Op0, m_Shl(m_Specific(Op1), m_One())))

      return new ICmpInst(ICmpInst::getSignedPredicate(Pred), Op1,

                          Constant::getNullValue(Op1->getType()));

    else if (match(Op1, m_Shl(m_Specific(Op0), m_One())))

      return new ICmpInst(ICmpInst::getSignedPredicate(Pred),

                          Constant::getNullValue(Op0->getType()), Op0);

  }


  if (Value *V = foldMultiplicationOverflowCheck(I))

    return replaceInstUsesWith(I, V);


  if (Instruction *R = foldICmpAndXX(I, Q, *this))

    return R;


  if (Value *V = foldICmpWithTruncSignExtendedVal(I, Builder))

    return replaceInstUsesWith(I, V);


  if (Value *V = foldShiftIntoShiftInAnotherHandOfAndInICmp(I, SQ, Builder))

    return replaceInstUsesWith(I, V);


  return nullptr;

}


/// Fold icmp Pred min|max(X, Y), Z.


Instruction *InstCombinerImpl::foldICmpWithMinMax(Instruction &I,

                                                  MinMaxIntrinsic *MinMax,

                                                  Value *Z, CmpPredicate Pred) {

  Value *X = MinMax->getLHS();

  Value *Y = MinMax->getRHS();

  if (ICmpInst::isSigned(Pred) && !MinMax->isSigned())

    return nullptr;

  if (ICmpInst::isUnsigned(Pred) && MinMax->isSigned()) {

    // Revert the transform signed pred -> unsigned pred

    // TODO: We can flip the signedness of predicate if both operands of icmp

    // are negative.

    if (isKnownNonNegative(Z, SQ.getWithInstruction(&I)) &&

        isKnownNonNegative(MinMax, SQ.getWithInstruction(&I))) {

      Pred = ICmpInst::getFlippedSignednessPredicate(Pred);

    } else

      return nullptr;

  }

  SimplifyQuery Q = SQ.getWithInstruction(&I);

  auto IsCondKnownTrue = [](Value *Val) -> std::optional<bool> {

    if (!Val)

      return std::nullopt;

    if (match(Val, m_One()))

      return true;

    if (match(Val, m_Zero()))

      return false;

    return std::nullopt;

  };

  // Remove samesign here since it is illegal to keep it when we speculatively

  // execute comparisons. For example, `icmp samesign ult umax(X, -46), -32`

  // cannot be decomposed into `(icmp samesign ult X, -46) or (icmp samesign ult

  // -46, -32)`. `X` is allowed to be non-negative here.

  Pred = Pred.dropSameSign();

  auto CmpXZ = IsCondKnownTrue(simplifyICmpInst(Pred, X, Z, Q));

  auto CmpYZ = IsCondKnownTrue(simplifyICmpInst(Pred, Y, Z, Q));

  if (!CmpXZ.has_value() && !CmpYZ.has_value())

    return nullptr;

  if (!CmpXZ.has_value()) {

    std::swap(X, Y);

    std::swap(CmpXZ, CmpYZ);

  }


  auto FoldIntoCmpYZ = [&]() -> Instruction * {

    if (CmpYZ.has_value())

      return replaceInstUsesWith(I, ConstantInt::getBool(I.getType(), *CmpYZ));

    return ICmpInst::Create(Instruction::ICmp, Pred, Y, Z);

  };


  switch (Pred) {

  case ICmpInst::ICMP_EQ:

  case ICmpInst::ICMP_NE: {

    // If X == Z:

    //     Expr       Result

    // min(X, Y) == Z X <= Y

    // max(X, Y) == Z X >= Y

    // min(X, Y) != Z X > Y

    // max(X, Y) != Z X < Y

    if ((Pred == ICmpInst::ICMP_EQ) == *CmpXZ) {

      ICmpInst::Predicate NewPred =

          ICmpInst::getNonStrictPredicate(MinMax->getPredicate());

      if (Pred == ICmpInst::ICMP_NE)

        NewPred = ICmpInst::getInversePredicate(NewPred);

      return ICmpInst::Create(Instruction::ICmp, NewPred, X, Y);

    }

    // Otherwise (X != Z):

    ICmpInst::Predicate NewPred = MinMax->getPredicate();

    auto MinMaxCmpXZ = IsCondKnownTrue(simplifyICmpInst(NewPred, X, Z, Q));

    if (!MinMaxCmpXZ.has_value()) {

      std::swap(X, Y);

      std::swap(CmpXZ, CmpYZ);

      // Re-check pre-condition X != Z

      if (!CmpXZ.has_value() || (Pred == ICmpInst::ICMP_EQ) == *CmpXZ)

        break;

      MinMaxCmpXZ = IsCondKnownTrue(simplifyICmpInst(NewPred, X, Z, Q));

    }

    if (!MinMaxCmpXZ.has_value())

      break;

    if (*MinMaxCmpXZ) {

      //    Expr         Fact    Result

      // min(X, Y) == Z  X < Z   false

      // max(X, Y) == Z  X > Z   false

      // min(X, Y) != Z  X < Z    true

      // max(X, Y) != Z  X > Z    true

      return replaceInstUsesWith(

          I, ConstantInt::getBool(I.getType(), Pred == ICmpInst::ICMP_NE));

    } else {

      //    Expr         Fact    Result

      // min(X, Y) == Z  X > Z   Y == Z

      // max(X, Y) == Z  X < Z   Y == Z

      // min(X, Y) != Z  X > Z   Y != Z

      // max(X, Y) != Z  X < Z   Y != Z

      return FoldIntoCmpYZ();

    }

    break;

  }

  case ICmpInst::ICMP_SLT:

  case ICmpInst::ICMP_ULT:

  case ICmpInst::ICMP_SLE:

  case ICmpInst::ICMP_ULE:

  case ICmpInst::ICMP_SGT:

  case ICmpInst::ICMP_UGT:

  case ICmpInst::ICMP_SGE:

  case ICmpInst::ICMP_UGE: {

    bool IsSame = MinMax->getPredicate() == ICmpInst::getStrictPredicate(Pred);

    if (*CmpXZ) {

      if (IsSame) {

        //      Expr        Fact    Result

        // min(X, Y) < Z    X < Z   true

        // min(X, Y) <= Z   X <= Z  true

        // max(X, Y) > Z    X > Z   true

        // max(X, Y) >= Z   X >= Z  true

        return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));

      } else {

        //      Expr        Fact    Result

        // max(X, Y) < Z    X < Z   Y < Z

        // max(X, Y) <= Z   X <= Z  Y <= Z

        // min(X, Y) > Z    X > Z   Y > Z

        // min(X, Y) >= Z   X >= Z  Y >= Z

        return FoldIntoCmpYZ();

      }

    } else {

      if (IsSame) {

        //      Expr        Fact    Result

        // min(X, Y) < Z    X >= Z  Y < Z

        // min(X, Y) <= Z   X > Z   Y <= Z

        // max(X, Y) > Z    X <= Z  Y > Z

        // max(X, Y) >= Z   X < Z   Y >= Z

        return FoldIntoCmpYZ();

      } else {

        //      Expr        Fact    Result

        // max(X, Y) < Z    X >= Z  false

        // max(X, Y) <= Z   X > Z   false

        // min(X, Y) > Z    X <= Z  false

        // min(X, Y) >= Z   X < Z   false

        return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));

      }

    }

    break;

  }

  default:

    break;

  }


  return nullptr;

}


// Canonicalize checking for a power-of-2-or-zero value:


static Instruction *foldICmpPow2Test(ICmpInst &I,

                                     InstCombiner::BuilderTy &Builder) {

  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);

  const CmpInst::Predicate Pred = I.getPredicate();

  Value *A = nullptr;

  bool CheckIs;

  if (I.isEquality()) {

    // (A & (A-1)) == 0 --> ctpop(A) < 2 (two commuted variants)

    // ((A-1) & A) != 0 --> ctpop(A) > 1 (two commuted variants)

    if (!match(Op0, m_OneUse(m_c_And(m_Add(m_Value(A), m_AllOnes()),

                                     m_Deferred(A)))) ||

        !match(Op1, m_ZeroInt()))

      A = nullptr;


    // (A & -A) == A --> ctpop(A) < 2 (four commuted variants)

    // (-A & A) != A --> ctpop(A) > 1 (four commuted variants)

    if (match(Op0, m_OneUse(m_c_And(m_Neg(m_Specific(Op1)), m_Specific(Op1)))))

      A = Op1;

    else if (match(Op1,

                   m_OneUse(m_c_And(m_Neg(m_Specific(Op0)), m_Specific(Op0)))))

      A = Op0;


    CheckIs = Pred == ICmpInst::ICMP_EQ;

  } else if (ICmpInst::isUnsigned(Pred)) {

    // (A ^ (A-1)) u>= A --> ctpop(A) < 2 (two commuted variants)

    // ((A-1) ^ A) u< A --> ctpop(A) > 1 (two commuted variants)


    if ((Pred == ICmpInst::ICMP_UGE || Pred == ICmpInst::ICMP_ULT) &&

        match(Op0, m_OneUse(m_c_Xor(m_Add(m_Specific(Op1), m_AllOnes()),

                                    m_Specific(Op1))))) {

      A = Op1;

      CheckIs = Pred == ICmpInst::ICMP_UGE;

    } else if ((Pred == ICmpInst::ICMP_UGT || Pred == ICmpInst::ICMP_ULE) &&

               match(Op1, m_OneUse(m_c_Xor(m_Add(m_Specific(Op0), m_AllOnes()),

                                           m_Specific(Op0))))) {

      A = Op0;

      CheckIs = Pred == ICmpInst::ICMP_ULE;

    }

  }


  if (A) {

    Type *Ty = A->getType();

    CallInst *CtPop = Builder.CreateUnaryIntrinsic(Intrinsic::ctpop, A);

    return CheckIs ? new ICmpInst(ICmpInst::ICMP_ULT, CtPop,

                                  ConstantInt::get(Ty, 2))

                   : new ICmpInst(ICmpInst::ICMP_UGT, CtPop,

                                  ConstantInt::get(Ty, 1));

  }


  return nullptr;

}


/// Find all possible pairs (BinOp, RHS) that BinOp V, RHS can be simplified.

using OffsetOp = std::pair<Instruction::BinaryOps, Value *>;


static void collectOffsetOp(Value *V, SmallVectorImpl<OffsetOp> &Offsets,

                            bool AllowRecursion) {

  Instruction *Inst = dyn_cast<Instruction>(V);

  if (!Inst || !Inst->hasOneUse())

    return;


  switch (Inst->getOpcode()) {

  case Instruction::Add:

    Offsets.emplace_back(Instruction::Sub, Inst->getOperand(1));

    Offsets.emplace_back(Instruction::Sub, Inst->getOperand(0));

    break;

  case Instruction::Sub:

    Offsets.emplace_back(Instruction::Add, Inst->getOperand(1));

    break;

  case Instruction::Xor:

    Offsets.emplace_back(Instruction::Xor, Inst->getOperand(1));

    Offsets.emplace_back(Instruction::Xor, Inst->getOperand(0));

    break;

  case Instruction::Select:

    if (AllowRecursion) {

      collectOffsetOp(Inst->getOperand(1), Offsets, /*AllowRecursion=*/false);

      collectOffsetOp(Inst->getOperand(2), Offsets, /*AllowRecursion=*/false);

    }

    break;

  default:

    break;

  }

}


enum class OffsetKind { Invalid, Value, Select };


struct OffsetResult {

  OffsetKind Kind;

  Value *V0, *V1, *V2;


  static OffsetResult invalid() {

    return {OffsetKind::Invalid, nullptr, nullptr, nullptr};

  }


  static OffsetResult value(Value *V) {

    return {OffsetKind::Value, V, nullptr, nullptr};

  }


  static OffsetResult select(Value *Cond, Value *TrueV, Value *FalseV) {

    return {OffsetKind::Select, Cond, TrueV, FalseV};

  }


  bool isValid() const { return Kind != OffsetKind::Invalid; }


  Value *materialize(InstCombiner::BuilderTy &Builder) const {

    switch (Kind) {

    case OffsetKind::Invalid:

      llvm_unreachable("Invalid offset result");

    case OffsetKind::Value:

      return V0;

    case OffsetKind::Select:

      return Builder.CreateSelect(V0, V1, V2);

    }

    llvm_unreachable("Unknown OffsetKind enum");

  }


};


/// Offset both sides of an equality icmp to see if we can save some

/// instructions: icmp eq/ne X, Y -> icmp eq/ne X op Z, Y op Z.

/// Note: This operation should not introduce poison.


static Instruction *foldICmpEqualityWithOffset(ICmpInst &I,

                                               InstCombiner::BuilderTy &Builder,

                                               const SimplifyQuery &SQ) {

  assert(I.isEquality() && "Expected an equality icmp");

  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);

  if (!Op0->getType()->isIntOrIntVectorTy())

    return nullptr;


  SmallVector<OffsetOp, 4> OffsetOps;

  collectOffsetOp(Op0, OffsetOps, /*AllowRecursion=*/true);

  collectOffsetOp(Op1, OffsetOps, /*AllowRecursion=*/true);


  auto ApplyOffsetImpl = [&](Value *V, unsigned BinOpc, Value *RHS) -> Value * {

    Value *Simplified = simplifyBinOp(BinOpc, V, RHS, SQ);

    // Avoid infinite loops by checking if RHS is an identity for the BinOp.

    if (!Simplified || Simplified == V)

      return nullptr;

    // Reject constant expressions as they don't simplify things.

    if (isa<Constant>(Simplified) && !match(Simplified, m_ImmConstant()))

      return nullptr;

    // Check if the transformation introduces poison.

    return impliesPoison(RHS, V) ? Simplified : nullptr;

  };


  auto ApplyOffset = [&](Value *V, unsigned BinOpc,

                         Value *RHS) -> OffsetResult {

    if (auto *Sel = dyn_cast<SelectInst>(V)) {

      if (!Sel->hasOneUse())

        return OffsetResult::invalid();

      Value *TrueVal = ApplyOffsetImpl(Sel->getTrueValue(), BinOpc, RHS);

      if (!TrueVal)

        return OffsetResult::invalid();

      Value *FalseVal = ApplyOffsetImpl(Sel->getFalseValue(), BinOpc, RHS);

      if (!FalseVal)

        return OffsetResult::invalid();

      return OffsetResult::select(Sel->getCondition(), TrueVal, FalseVal);

    }

    if (Value *Simplified = ApplyOffsetImpl(V, BinOpc, RHS))

      return OffsetResult::value(Simplified);

    return OffsetResult::invalid();

  };


  for (auto [BinOp, RHS] : OffsetOps) {

    auto BinOpc = static_cast<unsigned>(BinOp);


    auto Op0Result = ApplyOffset(Op0, BinOpc, RHS);

    if (!Op0Result.isValid())

      continue;

    auto Op1Result = ApplyOffset(Op1, BinOpc, RHS);

    if (!Op1Result.isValid())

      continue;


    Value *NewLHS = Op0Result.materialize(Builder);

    Value *NewRHS = Op1Result.materialize(Builder);

    return new ICmpInst(I.getPredicate(), NewLHS, NewRHS);

  }


  return nullptr;

}


Instruction *InstCombinerImpl::foldICmpEquality(ICmpInst &I) {

  if (!I.isEquality())

    return nullptr;


  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);

  const CmpInst::Predicate Pred = I.getPredicate();

  Value *A, *B, *C, *D;

  if (match(Op0, m_Xor(m_Value(A), m_Value(B)))) {

    if (A == Op1 || B == Op1) { // (A^B) == A  ->  B == 0

      Value *OtherVal = A == Op1 ? B : A;

      return new ICmpInst(Pred, OtherVal, Constant::getNullValue(A->getType()));

    }


    if (match(Op1, m_Xor(m_Value(C), m_Value(D)))) {

      // A^c1 == C^c2 --> A == C^(c1^c2)

      ConstantInt *C1, *C2;

      if (match(B, m_ConstantInt(C1)) && match(D, m_ConstantInt(C2)) &&

          Op1->hasOneUse()) {

        Constant *NC = Builder.getInt(C1->getValue() ^ C2->getValue());

        Value *Xor = Builder.CreateXor(C, NC);

        return new ICmpInst(Pred, A, Xor);

      }


      // A^B == A^D -> B == D

      if (A == C)

        return new ICmpInst(Pred, B, D);

      if (A == D)

        return new ICmpInst(Pred, B, C);

      if (B == C)

        return new ICmpInst(Pred, A, D);

      if (B == D)

        return new ICmpInst(Pred, A, C);

    }

  }


  if (match(Op1, m_Xor(m_Value(A), m_Value(B))) && (A == Op0 || B == Op0)) {

    // A == (A^B)  ->  B == 0

    Value *OtherVal = A == Op0 ? B : A;

    return new ICmpInst(Pred, OtherVal, Constant::getNullValue(A->getType()));

  }


  // (X&Z) == (Y&Z) -> (X^Y) & Z == 0

  if (match(Op0, m_And(m_Value(A), m_Value(B))) &&

      match(Op1, m_And(m_Value(C), m_Value(D)))) {

    Value *X = nullptr, *Y = nullptr, *Z = nullptr;


    if (A == C) {

      X = B;

      Y = D;

      Z = A;

    } else if (A == D) {

      X = B;

      Y = C;

      Z = A;

    } else if (B == C) {

      X = A;

      Y = D;

      Z = B;

    } else if (B == D) {

      X = A;

      Y = C;

      Z = B;

    }


    if (X) {

      // If X^Y is a negative power of two, then `icmp eq/ne (Z & NegP2), 0`

      // will fold to `icmp ult/uge Z, -NegP2` incurringb no additional

      // instructions.

      const APInt *C0, *C1;

      bool XorIsNegP2 = match(X, m_APInt(C0)) && match(Y, m_APInt(C1)) &&

                        (*C0 ^ *C1).isNegatedPowerOf2();


      // If either Op0/Op1 are both one use or X^Y will constant fold and one of

      // Op0/Op1 are one use, proceed. In those cases we are instruction neutral

      // but `icmp eq/ne A, 0` is easier to analyze than `icmp eq/ne A, B`.

      int UseCnt =

          int(Op0->hasOneUse()) + int(Op1->hasOneUse()) +

          (int(match(X, m_ImmConstant()) && match(Y, m_ImmConstant())));

      if (XorIsNegP2 || UseCnt >= 2) {

        // Build (X^Y) & Z

        Op1 = Builder.CreateXor(X, Y);

        Op1 = Builder.CreateAnd(Op1, Z);

        return new ICmpInst(Pred, Op1, Constant::getNullValue(Op1->getType()));

      }

    }

  }


  {

    // Similar to above, but specialized for constant because invert is needed:

    // (X | C) == (Y | C) --> (X ^ Y) & ~C == 0

    Value *X, *Y;

    Constant *C;

    if (match(Op0, m_OneUse(m_Or(m_Value(X), m_Constant(C)))) &&

        match(Op1, m_OneUse(m_Or(m_Value(Y), m_Specific(C))))) {

      Value *Xor = Builder.CreateXor(X, Y);

      Value *And = Builder.CreateAnd(Xor, ConstantExpr::getNot(C));

      return new ICmpInst(Pred, And, Constant::getNullValue(And->getType()));

    }

  }


  if (match(Op1, m_ZExt(m_Value(A))) &&

      (Op0->hasOneUse() || Op1->hasOneUse())) {

    // (B & (Pow2C-1)) == zext A --> A == trunc B

    // (B & (Pow2C-1)) != zext A --> A != trunc B

    const APInt *MaskC;

    if (match(Op0, m_And(m_Value(B), m_LowBitMask(MaskC))) &&

        MaskC->countr_one() == A->getType()->getScalarSizeInBits())

      return new ICmpInst(Pred, A, Builder.CreateTrunc(B, A->getType()));

  }


  // (A >> C) == (B >> C) --> (A^B) u< (1 << C)

  // For lshr and ashr pairs.

  const APInt *AP1, *AP2;

  if ((match(Op0, m_OneUse(m_LShr(m_Value(A), m_APIntAllowPoison(AP1)))) &&

       match(Op1, m_OneUse(m_LShr(m_Value(B), m_APIntAllowPoison(AP2))))) ||

      (match(Op0, m_OneUse(m_AShr(m_Value(A), m_APIntAllowPoison(AP1)))) &&

       match(Op1, m_OneUse(m_AShr(m_Value(B), m_APIntAllowPoison(AP2)))))) {

    if (*AP1 != *AP2)

      return nullptr;

    unsigned TypeBits = AP1->getBitWidth();

    unsigned ShAmt = AP1->getLimitedValue(TypeBits);

    if (ShAmt < TypeBits && ShAmt != 0) {

      ICmpInst::Predicate NewPred =

          Pred == ICmpInst::ICMP_NE ? ICmpInst::ICMP_UGE : ICmpInst::ICMP_ULT;

      Value *Xor = Builder.CreateXor(A, B, I.getName() + ".unshifted");

      APInt CmpVal = APInt::getOneBitSet(TypeBits, ShAmt);

      return new ICmpInst(NewPred, Xor, ConstantInt::get(A->getType(), CmpVal));

    }

  }


  // (A << C) == (B << C) --> ((A^B) & (~0U >> C)) == 0

  ConstantInt *Cst1;

  if (match(Op0, m_OneUse(m_Shl(m_Value(A), m_ConstantInt(Cst1)))) &&

      match(Op1, m_OneUse(m_Shl(m_Value(B), m_Specific(Cst1))))) {

    unsigned TypeBits = Cst1->getBitWidth();

    unsigned ShAmt = (unsigned)Cst1->getLimitedValue(TypeBits);

    if (ShAmt < TypeBits && ShAmt != 0) {

      Value *Xor = Builder.CreateXor(A, B, I.getName() + ".unshifted");

      APInt AndVal = APInt::getLowBitsSet(TypeBits, TypeBits - ShAmt);

      Value *And =

          Builder.CreateAnd(Xor, Builder.getInt(AndVal), I.getName() + ".mask");

      return new ICmpInst(Pred, And, Constant::getNullValue(Cst1->getType()));

    }

  }


  // Transform "icmp eq (trunc (lshr(X, cst1)), cst" to

  // "icmp (and X, mask), cst"

  uint64_t ShAmt = 0;

  if (Op0->hasOneUse() &&

      match(Op0, m_Trunc(m_OneUse(m_LShr(m_Value(A), m_ConstantInt(ShAmt))))) &&

      match(Op1, m_ConstantInt(Cst1)) &&

      // Only do this when A has multiple uses.  This is most important to do

      // when it exposes other optimizations.

      !A->hasOneUse()) {

    unsigned ASize = cast<IntegerType>(A->getType())->getPrimitiveSizeInBits();


    if (ShAmt < ASize) {

      APInt MaskV =

          APInt::getLowBitsSet(ASize, Op0->getType()->getPrimitiveSizeInBits());

      MaskV <<= ShAmt;


      APInt CmpV = Cst1->getValue().zext(ASize);

      CmpV <<= ShAmt;


      Value *Mask = Builder.CreateAnd(A, Builder.getInt(MaskV));

      return new ICmpInst(Pred, Mask, Builder.getInt(CmpV));

    }

  }


  if (Instruction *ICmp = foldICmpIntrinsicWithIntrinsic(I, Builder))

    return ICmp;


  // Match icmp eq (trunc (lshr A, BW), (ashr (trunc A), BW-1)), which checks

  // the top BW/2 + 1 bits are all the same. Create "A >=s INT_MIN && A <=s

  // INT_MAX", which we generate as "icmp ult (add A, 2^(BW-1)), 2^BW" to skip a

  // few steps of instcombine.

  unsigned BitWidth = Op0->getType()->getScalarSizeInBits();

  if (match(Op0, m_AShr(m_Trunc(m_Value(A)), m_SpecificInt(BitWidth - 1))) &&

      match(Op1, m_Trunc(m_LShr(m_Specific(A), m_SpecificInt(BitWidth)))) &&

      A->getType()->getScalarSizeInBits() == BitWidth * 2 &&

      (I.getOperand(0)->hasOneUse() || I.getOperand(1)->hasOneUse())) {

    APInt C = APInt::getOneBitSet(BitWidth * 2, BitWidth - 1);

    Value *Add = Builder.CreateAdd(A, ConstantInt::get(A->getType(), C));

    return new ICmpInst(Pred == ICmpInst::ICMP_EQ ? ICmpInst::ICMP_ULT

                                                  : ICmpInst::ICMP_UGE,

                        Add, ConstantInt::get(A->getType(), C.shl(1)));

  }


  // Canonicalize:

  // Assume B_Pow2 != 0

  // 1. A & B_Pow2 != B_Pow2 -> A & B_Pow2 == 0

  // 2. A & B_Pow2 == B_Pow2 -> A & B_Pow2 != 0

  if (match(Op0, m_c_And(m_Specific(Op1), m_Value())) &&

      isKnownToBeAPowerOfTwo(Op1, /* OrZero */ false, &I))

    return new ICmpInst(CmpInst::getInversePredicate(Pred), Op0,

                        ConstantInt::getNullValue(Op0->getType()));


  if (match(Op1, m_c_And(m_Specific(Op0), m_Value())) &&

      isKnownToBeAPowerOfTwo(Op0, /* OrZero */ false, &I))

    return new ICmpInst(CmpInst::getInversePredicate(Pred), Op1,

                        ConstantInt::getNullValue(Op1->getType()));


  // Canonicalize:

  // icmp eq/ne X, OneUse(rotate-right(X))

  //    -> icmp eq/ne X, rotate-left(X)

  // We generally try to convert rotate-right -> rotate-left, this just

  // canonicalizes another case.

  if (match(&I, m_c_ICmp(m_Value(A),

                         m_OneUse(m_Intrinsic<Intrinsic::fshr>(

                             m_Deferred(A), m_Deferred(A), m_Value(B))))))

    return new ICmpInst(

        Pred, A,

        Builder.CreateIntrinsic(Op0->getType(), Intrinsic::fshl, {A, A, B}));


  // Canonicalize:

  // icmp eq/ne OneUse(A ^ Cst), B --> icmp eq/ne (A ^ B), Cst

  Constant *Cst;

  if (match(&I, m_c_ICmp(m_OneUse(m_Xor(m_Value(A), m_ImmConstant(Cst))),

                         m_CombineAnd(m_Value(B), m_Unless(m_ImmConstant())))))

    return new ICmpInst(Pred, Builder.CreateXor(A, B), Cst);


  {

    // (icmp eq/ne (and (add/sub/xor X, P2), P2), P2)

    auto m_Matcher =

        m_CombineOr(m_CombineOr(m_c_Add(m_Value(B), m_Deferred(A)),

                                m_c_Xor(m_Value(B), m_Deferred(A))),

                    m_Sub(m_Value(B), m_Deferred(A)));

    std::optional<bool> IsZero = std::nullopt;

    if (match(&I, m_c_ICmp(m_OneUse(m_c_And(m_Value(A), m_Matcher)),

                           m_Deferred(A))))

      IsZero = false;

    // (icmp eq/ne (and (add/sub/xor X, P2), P2), 0)

    else if (match(&I,

                   m_ICmp(m_OneUse(m_c_And(m_Value(A), m_Matcher)), m_Zero())))

      IsZero = true;


    if (IsZero && isKnownToBeAPowerOfTwo(A, /* OrZero */ true, &I))

      // (icmp eq/ne (and (add/sub/xor X, P2), P2), P2)

      //    -> (icmp eq/ne (and X, P2), 0)

      // (icmp eq/ne (and (add/sub/xor X, P2), P2), 0)

      //    -> (icmp eq/ne (and X, P2), P2)

      return new ICmpInst(Pred, Builder.CreateAnd(B, A),

                          *IsZero ? A

                                  : ConstantInt::getNullValue(A->getType()));

  }


  if (auto *Res = foldICmpEqualityWithOffset(

          I, Builder, getSimplifyQuery().getWithInstruction(&I)))

    return Res;


  return nullptr;

}


Instruction *InstCombinerImpl::foldICmpWithTrunc(ICmpInst &ICmp) {

  ICmpInst::Predicate Pred = ICmp.getPredicate();

  Value *Op0 = ICmp.getOperand(0), *Op1 = ICmp.getOperand(1);


  // Try to canonicalize trunc + compare-to-constant into a mask + cmp.

  // The trunc masks high bits while the compare may effectively mask low bits.

  Value *X;

  const APInt *C;

  if (!match(Op0, m_OneUse(m_Trunc(m_Value(X)))) || !match(Op1, m_APInt(C)))

    return nullptr;


  // This matches patterns corresponding to tests of the signbit as well as:

  // (trunc X) pred C2 --> (X & Mask) == C

  if (auto Res = decomposeBitTestICmp(Op0, Op1, Pred, /*WithTrunc=*/true,

                                      /*AllowNonZeroC=*/true)) {

    Value *And = Builder.CreateAnd(Res->X, Res->Mask);

    Constant *C = ConstantInt::get(Res->X->getType(), Res->C);

    return new ICmpInst(Res->Pred, And, C);

  }


  unsigned SrcBits = X->getType()->getScalarSizeInBits();

  if (auto *II = dyn_cast<IntrinsicInst>(X)) {

    if (II->getIntrinsicID() == Intrinsic::cttz ||

        II->getIntrinsicID() == Intrinsic::ctlz) {

      unsigned MaxRet = SrcBits;

      // If the "is_zero_poison" argument is set, then we know at least

      // one bit is set in the input, so the result is always at least one

      // less than the full bitwidth of that input.

      if (match(II->getArgOperand(1), m_One()))

        MaxRet--;


      // Make sure the destination is wide enough to hold the largest output of

      // the intrinsic.

      if (llvm::Log2_32(MaxRet) + 1 <= Op0->getType()->getScalarSizeInBits())

        if (Instruction *I =

                foldICmpIntrinsicWithConstant(ICmp, II, C->zext(SrcBits)))

          return I;

    }

  }


  return nullptr;

}


Instruction *InstCombinerImpl::foldICmpWithZextOrSext(ICmpInst &ICmp) {

  assert(isa<CastInst>(ICmp.getOperand(0)) && "Expected cast for operand 0");

  auto *CastOp0 = cast<CastInst>(ICmp.getOperand(0));

  Value *X;

  if (!match(CastOp0, m_ZExtOrSExt(m_Value(X))))

    return nullptr;


  bool IsSignedExt = CastOp0->getOpcode() == Instruction::SExt;

  bool IsSignedCmp = ICmp.isSigned();


  // icmp Pred (ext X), (ext Y)

  Value *Y;

  if (match(ICmp.getOperand(1), m_ZExtOrSExt(m_Value(Y)))) {

    bool IsZext0 = isa<ZExtInst>(ICmp.getOperand(0));

    bool IsZext1 = isa<ZExtInst>(ICmp.getOperand(1));


    if (IsZext0 != IsZext1) {

      // If X and Y and both i1

      // (icmp eq/ne (zext X) (sext Y))

      //      eq -> (icmp eq (or X, Y), 0)

      //      ne -> (icmp ne (or X, Y), 0)

      if (ICmp.isEquality() && X->getType()->isIntOrIntVectorTy(1) &&

          Y->getType()->isIntOrIntVectorTy(1))

        return new ICmpInst(ICmp.getPredicate(), Builder.CreateOr(X, Y),

                            Constant::getNullValue(X->getType()));


      // If we have mismatched casts and zext has the nneg flag, we can

      //  treat the "zext nneg" as "sext". Otherwise, we cannot fold and quit.


      auto *NonNegInst0 = dyn_cast<PossiblyNonNegInst>(ICmp.getOperand(0));

      auto *NonNegInst1 = dyn_cast<PossiblyNonNegInst>(ICmp.getOperand(1));


      bool IsNonNeg0 = NonNegInst0 && NonNegInst0->hasNonNeg();

      bool IsNonNeg1 = NonNegInst1 && NonNegInst1->hasNonNeg();


      if ((IsZext0 && IsNonNeg0) || (IsZext1 && IsNonNeg1))

        IsSignedExt = true;

      else

        return nullptr;

    }


    // Not an extension from the same type?

    Type *XTy = X->getType(), *YTy = Y->getType();

    if (XTy != YTy) {

      // One of the casts must have one use because we are creating a new cast.

      if (!ICmp.getOperand(0)->hasOneUse() && !ICmp.getOperand(1)->hasOneUse())

        return nullptr;

      // Extend the narrower operand to the type of the wider operand.

      CastInst::CastOps CastOpcode =

          IsSignedExt ? Instruction::SExt : Instruction::ZExt;

      if (XTy->getScalarSizeInBits() < YTy->getScalarSizeInBits())

        X = Builder.CreateCast(CastOpcode, X, YTy);

      else if (YTy->getScalarSizeInBits() < XTy->getScalarSizeInBits())

        Y = Builder.CreateCast(CastOpcode, Y, XTy);

      else

        return nullptr;

    }


    // (zext X) == (zext Y) --> X == Y

    // (sext X) == (sext Y) --> X == Y

    if (ICmp.isEquality())

      return new ICmpInst(ICmp.getPredicate(), X, Y);


    // A signed comparison of sign extended values simplifies into a

    // signed comparison.

    if (IsSignedCmp && IsSignedExt)

      return new ICmpInst(ICmp.getPredicate(), X, Y);


    // The other three cases all fold into an unsigned comparison.

    return new ICmpInst(ICmp.getUnsignedPredicate(), X, Y);

  }


  // Below here, we are only folding a compare with constant.

  auto *C = dyn_cast<Constant>(ICmp.getOperand(1));

  if (!C)

    return nullptr;


  // If a lossless truncate is possible...

  Type *SrcTy = CastOp0->getSrcTy();

  Constant *Res = getLosslessInvCast(C, SrcTy, CastOp0->getOpcode(), DL);

  if (Res) {

    if (ICmp.isEquality())

      return new ICmpInst(ICmp.getPredicate(), X, Res);


    // A signed comparison of sign extended values simplifies into a

    // signed comparison.

    if (IsSignedExt && IsSignedCmp)

      return new ICmpInst(ICmp.getPredicate(), X, Res);


    // The other three cases all fold into an unsigned comparison.

    return new ICmpInst(ICmp.getUnsignedPredicate(), X, Res);

  }


  // The re-extended constant changed, partly changed (in the case of a vector),

  // or could not be determined to be equal (in the case of a constant

  // expression), so the constant cannot be represented in the shorter type.

  // All the cases that fold to true or false will have already been handled

  // by simplifyICmpInst, so only deal with the tricky case.

  if (IsSignedCmp || !IsSignedExt || !isa<ConstantInt>(C))

    return nullptr;


  // Is source op positive?

  // icmp ult (sext X), C --> icmp sgt X, -1

  if (ICmp.getPredicate() == ICmpInst::ICMP_ULT)

    return new ICmpInst(CmpInst::ICMP_SGT, X, Constant::getAllOnesValue(SrcTy));


  // Is source op negative?

  // icmp ugt (sext X), C --> icmp slt X, 0

  assert(ICmp.getPredicate() == ICmpInst::ICMP_UGT && "ICmp should be folded!");

  return new ICmpInst(CmpInst::ICMP_SLT, X, Constant::getNullValue(SrcTy));

}


/// Handle icmp (cast x), (cast or constant).


Instruction *InstCombinerImpl::foldICmpWithCastOp(ICmpInst &ICmp) {

  // If any operand of ICmp is a inttoptr roundtrip cast then remove it as

  // icmp compares only pointer's value.

  // icmp (inttoptr (ptrtoint p1)), p2 --> icmp p1, p2.

  Value *SimplifiedOp0 = simplifyIntToPtrRoundTripCast(ICmp.getOperand(0));

  Value *SimplifiedOp1 = simplifyIntToPtrRoundTripCast(ICmp.getOperand(1));

  if (SimplifiedOp0 || SimplifiedOp1)

    return new ICmpInst(ICmp.getPredicate(),

                        SimplifiedOp0 ? SimplifiedOp0 : ICmp.getOperand(0),

                        SimplifiedOp1 ? SimplifiedOp1 : ICmp.getOperand(1));


  auto *CastOp0 = dyn_cast<CastInst>(ICmp.getOperand(0));

  if (!CastOp0)

    return nullptr;

  if (!isa<Constant>(ICmp.getOperand(1)) && !isa<CastInst>(ICmp.getOperand(1)))

    return nullptr;


  Value *Op0Src = CastOp0->getOperand(0);

  Type *SrcTy = CastOp0->getSrcTy();

  Type *DestTy = CastOp0->getDestTy();


  // Turn icmp (ptrtoint x), (ptrtoint/c) into a compare of the input if the

  // integer type is the same size as the pointer type.

  auto CompatibleSizes = [&](Type *PtrTy, Type *IntTy) {

    if (isa<VectorType>(PtrTy)) {

      PtrTy = cast<VectorType>(PtrTy)->getElementType();

      IntTy = cast<VectorType>(IntTy)->getElementType();

    }

    return DL.getPointerTypeSizeInBits(PtrTy) == IntTy->getIntegerBitWidth();

  };

  if (CastOp0->getOpcode() == Instruction::PtrToInt &&

      CompatibleSizes(SrcTy, DestTy)) {

    Value *NewOp1 = nullptr;

    if (auto *PtrToIntOp1 = dyn_cast<PtrToIntOperator>(ICmp.getOperand(1))) {

      Value *PtrSrc = PtrToIntOp1->getOperand(0);

      if (PtrSrc->getType() == Op0Src->getType())

        NewOp1 = PtrToIntOp1->getOperand(0);

    } else if (auto *RHSC = dyn_cast<Constant>(ICmp.getOperand(1))) {

      NewOp1 = ConstantExpr::getIntToPtr(RHSC, SrcTy);

    }


    if (NewOp1)

      return new ICmpInst(ICmp.getPredicate(), Op0Src, NewOp1);

  }


  // Do the same in the other direction for icmp (inttoptr x), (inttoptr/c).

  if (CastOp0->getOpcode() == Instruction::IntToPtr &&

      CompatibleSizes(DestTy, SrcTy)) {

    Value *NewOp1 = nullptr;

    if (auto *IntToPtrOp1 = dyn_cast<IntToPtrInst>(ICmp.getOperand(1))) {

      Value *IntSrc = IntToPtrOp1->getOperand(0);

      if (IntSrc->getType() == Op0Src->getType())

        NewOp1 = IntToPtrOp1->getOperand(0);

    } else if (auto *RHSC = dyn_cast<Constant>(ICmp.getOperand(1))) {

      NewOp1 = ConstantFoldConstant(ConstantExpr::getPtrToInt(RHSC, SrcTy), DL);

    }


    if (NewOp1)

      return new ICmpInst(ICmp.getPredicate(), Op0Src, NewOp1);

  }


  if (Instruction *R = foldICmpWithTrunc(ICmp))

    return R;


  return foldICmpWithZextOrSext(ICmp);

}


static bool isNeutralValue(Instruction::BinaryOps BinaryOp, Value *RHS,

                           bool IsSigned) {

  switch (BinaryOp) {

  default:

    llvm_unreachable("Unsupported binary op");

  case Instruction::Add:

  case Instruction::Sub:

    return match(RHS, m_Zero());

  case Instruction::Mul:

    return !(RHS->getType()->isIntOrIntVectorTy(1) && IsSigned) &&

           match(RHS, m_One());

  }

}


OverflowResult


InstCombinerImpl::computeOverflow(Instruction::BinaryOps BinaryOp,

                                  bool IsSigned, Value *LHS, Value *RHS,

                                  Instruction *CxtI) const {

  switch (BinaryOp) {

  default:

    llvm_unreachable("Unsupported binary op");

  case Instruction::Add:

    if (IsSigned)

      return computeOverflowForSignedAdd(LHS, RHS, CxtI);

    else

      return computeOverflowForUnsignedAdd(LHS, RHS, CxtI);

  case Instruction::Sub:

    if (IsSigned)

      return computeOverflowForSignedSub(LHS, RHS, CxtI);

    else

      return computeOverflowForUnsignedSub(LHS, RHS, CxtI);

  case Instruction::Mul:

    if (IsSigned)

      return computeOverflowForSignedMul(LHS, RHS, CxtI);

    else

      return computeOverflowForUnsignedMul(LHS, RHS, CxtI);

  }

}


bool InstCombinerImpl::OptimizeOverflowCheck(Instruction::BinaryOps BinaryOp,

                                             bool IsSigned, Value *LHS,

                                             Value *RHS, Instruction &OrigI,

                                             Value *&Result,

                                             Constant *&Overflow) {

  if (OrigI.isCommutative() && isa<Constant>(LHS) && !isa<Constant>(RHS))

    std::swap(LHS, RHS);


  // If the overflow check was an add followed by a compare, the insertion point

  // may be pointing to the compare.  We want to insert the new instructions

  // before the add in case there are uses of the add between the add and the

  // compare.

  Builder.SetInsertPoint(&OrigI);


  Type *OverflowTy = Type::getInt1Ty(LHS->getContext());

  if (auto *LHSTy = dyn_cast<VectorType>(LHS->getType()))

    OverflowTy = VectorType::get(OverflowTy, LHSTy->getElementCount());


  if (isNeutralValue(BinaryOp, RHS, IsSigned)) {

    Result = LHS;

    Overflow = ConstantInt::getFalse(OverflowTy);

    return true;

  }


  switch (computeOverflow(BinaryOp, IsSigned, LHS, RHS, &OrigI)) {

  case OverflowResult::MayOverflow:

    return false;

  case OverflowResult::AlwaysOverflowsLow:

  case OverflowResult::AlwaysOverflowsHigh:

    Result = Builder.CreateBinOp(BinaryOp, LHS, RHS);

    Result->takeName(&OrigI);

    Overflow = ConstantInt::getTrue(OverflowTy);

    return true;

  case OverflowResult::NeverOverflows:

    Result = Builder.CreateBinOp(BinaryOp, LHS, RHS);

    Result->takeName(&OrigI);

    Overflow = ConstantInt::getFalse(OverflowTy);

    if (auto *Inst = dyn_cast<Instruction>(Result)) {

      if (IsSigned)

        Inst->setHasNoSignedWrap();

      else

        Inst->setHasNoUnsignedWrap();

    }

    return true;

  }


  llvm_unreachable("Unexpected overflow result");

}


/// Recognize and process idiom involving test for multiplication

/// overflow.

///

/// The caller has matched a pattern of the form:

///   I = cmp u (mul(zext A, zext B), V

/// The function checks if this is a test for overflow and if so replaces

/// multiplication with call to 'mul.with.overflow' intrinsic.

///

/// \param I Compare instruction.

/// \param MulVal Result of 'mult' instruction.  It is one of the arguments of

///               the compare instruction.  Must be of integer type.

/// \param OtherVal The other argument of compare instruction.

/// \returns Instruction which must replace the compare instruction, NULL if no

///          replacement required.


static Instruction *processUMulZExtIdiom(ICmpInst &I, Value *MulVal,

                                         const APInt *OtherVal,

                                         InstCombinerImpl &IC) {

  // Don't bother doing this transformation for pointers, don't do it for

  // vectors.

  if (!isa<IntegerType>(MulVal->getType()))

    return nullptr;


  auto *MulInstr = dyn_cast<Instruction>(MulVal);

  if (!MulInstr)

    return nullptr;

  assert(MulInstr->getOpcode() == Instruction::Mul);


  auto *LHS = cast<ZExtInst>(MulInstr->getOperand(0)),

       *RHS = cast<ZExtInst>(MulInstr->getOperand(1));

  assert(LHS->getOpcode() == Instruction::ZExt);

  assert(RHS->getOpcode() == Instruction::ZExt);

  Value *A = LHS->getOperand(0), *B = RHS->getOperand(0);


  // Calculate type and width of the result produced by mul.with.overflow.

  Type *TyA = A->getType(), *TyB = B->getType();

  unsigned WidthA = TyA->getPrimitiveSizeInBits(),

           WidthB = TyB->getPrimitiveSizeInBits();

  unsigned MulWidth;

  Type *MulType;

  if (WidthB > WidthA) {

    MulWidth = WidthB;

    MulType = TyB;

  } else {

    MulWidth = WidthA;

    MulType = TyA;

  }


  // In order to replace the original mul with a narrower mul.with.overflow,

  // all uses must ignore upper bits of the product.  The number of used low

  // bits must be not greater than the width of mul.with.overflow.

  if (MulVal->hasNUsesOrMore(2))

    for (User *U : MulVal->users()) {

      if (U == &I)

        continue;

      if (TruncInst *TI = dyn_cast<TruncInst>(U)) {

        // Check if truncation ignores bits above MulWidth.

        unsigned TruncWidth = TI->getType()->getPrimitiveSizeInBits();

        if (TruncWidth > MulWidth)

          return nullptr;

      } else if (BinaryOperator *BO = dyn_cast<BinaryOperator>(U)) {

        // Check if AND ignores bits above MulWidth.

        if (BO->getOpcode() != Instruction::And)

          return nullptr;

        if (ConstantInt *CI = dyn_cast<ConstantInt>(BO->getOperand(1))) {

          const APInt &CVal = CI->getValue();

          if (CVal.getBitWidth() - CVal.countl_zero() > MulWidth)

            return nullptr;

        } else {

          // In this case we could have the operand of the binary operation

          // being defined in another block, and performing the replacement

          // could break the dominance relation.

          return nullptr;

        }

      } else {

        // Other uses prohibit this transformation.

        return nullptr;

      }

    }


  // Recognize patterns

  switch (I.getPredicate()) {

  case ICmpInst::ICMP_UGT: {

    // Recognize pattern:

    //   mulval = mul(zext A, zext B)

    //   cmp ugt mulval, max

    APInt MaxVal = APInt::getMaxValue(MulWidth);

    MaxVal = MaxVal.zext(OtherVal->getBitWidth());

    if (MaxVal.eq(*OtherVal))

      break; // Recognized

    return nullptr;

  }


  case ICmpInst::ICMP_ULT: {

    // Recognize pattern:

    //   mulval = mul(zext A, zext B)

    //   cmp ule mulval, max + 1

    APInt MaxVal = APInt::getOneBitSet(OtherVal->getBitWidth(), MulWidth);

    if (MaxVal.eq(*OtherVal))

      break; // Recognized

    return nullptr;

  }


  default:

    return nullptr;

  }


  InstCombiner::BuilderTy &Builder = IC.Builder;

  Builder.SetInsertPoint(MulInstr);


  // Replace: mul(zext A, zext B) --> mul.with.overflow(A, B)

  Value *MulA = A, *MulB = B;

  if (WidthA < MulWidth)

    MulA = Builder.CreateZExt(A, MulType);

  if (WidthB < MulWidth)

    MulB = Builder.CreateZExt(B, MulType);

  CallInst *Call =

      Builder.CreateIntrinsic(Intrinsic::umul_with_overflow, MulType,

                              {MulA, MulB}, /*FMFSource=*/nullptr, "umul");

  IC.addToWorklist(MulInstr);


  // If there are uses of mul result other than the comparison, we know that

  // they are truncation or binary AND. Change them to use result of

  // mul.with.overflow and adjust properly mask/size.

  if (MulVal->hasNUsesOrMore(2)) {

    Value *Mul = Builder.CreateExtractValue(Call, 0, "umul.value");

    for (User *U : make_early_inc_range(MulVal->users())) {

      if (U == &I)

        continue;

      if (TruncInst *TI = dyn_cast<TruncInst>(U)) {

        if (TI->getType()->getPrimitiveSizeInBits() == MulWidth)

          IC.replaceInstUsesWith(*TI, Mul);

        else

          TI->setOperand(0, Mul);

      } else if (BinaryOperator *BO = dyn_cast<BinaryOperator>(U)) {

        assert(BO->getOpcode() == Instruction::And);

        // Replace (mul & mask) --> zext (mul.with.overflow & short_mask)

        ConstantInt *CI = cast<ConstantInt>(BO->getOperand(1));

        APInt ShortMask = CI->getValue().trunc(MulWidth);

        Value *ShortAnd = Builder.CreateAnd(Mul, ShortMask);

        Value *Zext = Builder.CreateZExt(ShortAnd, BO->getType());

        IC.replaceInstUsesWith(*BO, Zext);

      } else {

        llvm_unreachable("Unexpected Binary operation");

      }

      IC.addToWorklist(cast<Instruction>(U));

    }

  }


  // The original icmp gets replaced with the overflow value, maybe inverted

  // depending on predicate.

  if (I.getPredicate() == ICmpInst::ICMP_ULT) {

    Value *Res = Builder.CreateExtractValue(Call, 1);

    return BinaryOperator::CreateNot(Res);

  }


  return ExtractValueInst::Create(Call, 1);

}


/// When performing a comparison against a constant, it is possible that not all

/// the bits in the LHS are demanded. This helper method computes the mask that

/// IS demanded.


static APInt getDemandedBitsLHSMask(ICmpInst &I, unsigned BitWidth) {

  const APInt *RHS;

  if (!match(I.getOperand(1), m_APInt(RHS)))

    return APInt::getAllOnes(BitWidth);


  // If this is a normal comparison, it demands all bits. If it is a sign bit

  // comparison, it only demands the sign bit.

  bool UnusedBit;

  if (isSignBitCheck(I.getPredicate(), *RHS, UnusedBit))

    return APInt::getSignMask(BitWidth);


  switch (I.getPredicate()) {

  // For a UGT comparison, we don't care about any bits that

  // correspond to the trailing ones of the comparand.  The value of these

  // bits doesn't impact the outcome of the comparison, because any value

  // greater than the RHS must differ in a bit higher than these due to carry.

  case ICmpInst::ICMP_UGT:

    return APInt::getBitsSetFrom(BitWidth, RHS->countr_one());


  // Similarly, for a ULT comparison, we don't care about the trailing zeros.

  // Any value less than the RHS must differ in a higher bit because of carries.

  case ICmpInst::ICMP_ULT:

    return APInt::getBitsSetFrom(BitWidth, RHS->countr_zero());


  default:

    return APInt::getAllOnes(BitWidth);

  }

}


/// Check that one use is in the same block as the definition and all

/// other uses are in blocks dominated by a given block.

///

/// \param DI Definition

/// \param UI Use

/// \param DB Block that must dominate all uses of \p DI outside

///           the parent block

/// \return true when \p UI is the only use of \p DI in the parent block

/// and all other uses of \p DI are in blocks dominated by \p DB.

///


bool InstCombinerImpl::dominatesAllUses(const Instruction *DI,

                                        const Instruction *UI,

                                        const BasicBlock *DB) const {

  assert(DI && UI && "Instruction not defined\n");

  // Ignore incomplete definitions.

  if (!DI->getParent())

    return false;

  // DI and UI must be in the same block.

  if (DI->getParent() != UI->getParent())

    return false;

  // Protect from self-referencing blocks.

  if (DI->getParent() == DB)

    return false;

  for (const User *U : DI->users()) {

    auto *Usr = cast<Instruction>(U);

    if (Usr != UI && !DT.dominates(DB, Usr->getParent()))

      return false;

  }

  return true;

}


/// Return true when the instruction sequence within a block is select-cmp-br.


static bool isChainSelectCmpBranch(const SelectInst *SI) {

  const BasicBlock *BB = SI->getParent();

  if (!BB)

    return false;

  auto *BI = dyn_cast_or_null<BranchInst>(BB->getTerminator());

  if (!BI || BI->getNumSuccessors() != 2)

    return false;

  auto *IC = dyn_cast<ICmpInst>(BI->getCondition());

  if (!IC || (IC->getOperand(0) != SI && IC->getOperand(1) != SI))

    return false;

  return true;

}


/// True when a select result is replaced by one of its operands

/// in select-icmp sequence. This will eventually result in the elimination

/// of the select.

///

/// \param SI    Select instruction

/// \param Icmp  Compare instruction

/// \param SIOpd Operand that replaces the select

///

/// Notes:

/// - The replacement is global and requires dominator information

/// - The caller is responsible for the actual replacement

///

/// Example:

///

/// entry:

///  %4 = select i1 %3, %C* %0, %C* null

///  %5 = icmp eq %C* %4, null

///  br i1 %5, label %9, label %7

///  ...

///  ; <label>:7                                       ; preds = %entry

///  %8 = getelementptr inbounds %C* %4, i64 0, i32 0

///  ...

///

/// can be transformed to

///

///  %5 = icmp eq %C* %0, null

///  %6 = select i1 %3, i1 %5, i1 true

///  br i1 %6, label %9, label %7

///  ...

///  ; <label>:7                                       ; preds = %entry

///  %8 = getelementptr inbounds %C* %0, i64 0, i32 0  // replace by %0!

///

/// Similar when the first operand of the select is a constant or/and

/// the compare is for not equal rather than equal.

///

/// NOTE: The function is only called when the select and compare constants

/// are equal, the optimization can work only for EQ predicates. This is not a

/// major restriction since a NE compare should be 'normalized' to an equal

/// compare, which usually happens in the combiner and test case

/// select-cmp-br.ll checks for it.


bool InstCombinerImpl::replacedSelectWithOperand(SelectInst *SI,

                                                 const ICmpInst *Icmp,

                                                 const unsigned SIOpd) {

  assert((SIOpd == 1 || SIOpd == 2) && "Invalid select operand!");

  if (isChainSelectCmpBranch(SI) && Icmp->getPredicate() == ICmpInst::ICMP_EQ) {

    BasicBlock *Succ = SI->getParent()->getTerminator()->getSuccessor(1);

    // The check for the single predecessor is not the best that can be

    // done. But it protects efficiently against cases like when SI's

    // home block has two successors, Succ and Succ1, and Succ1 predecessor

    // of Succ. Then SI can't be replaced by SIOpd because the use that gets

    // replaced can be reached on either path. So the uniqueness check

    // guarantees that the path all uses of SI (outside SI's parent) are on

    // is disjoint from all other paths out of SI. But that information

    // is more expensive to compute, and the trade-off here is in favor

    // of compile-time. It should also be noticed that we check for a single

    // predecessor and not only uniqueness. This to handle the situation when

    // Succ and Succ1 points to the same basic block.

    if (Succ->getSinglePredecessor() && dominatesAllUses(SI, Icmp, Succ)) {

      NumSel++;

      SI->replaceUsesOutsideBlock(SI->getOperand(SIOpd), SI->getParent());

      return true;

    }

  }

  return false;

}


/// Try to fold the comparison based on range information we can get by checking

/// whether bits are known to be zero or one in the inputs.


Instruction *InstCombinerImpl::foldICmpUsingKnownBits(ICmpInst &I) {

  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);

  Type *Ty = Op0->getType();

  ICmpInst::Predicate Pred = I.getPredicate();


  // Get scalar or pointer size.

  unsigned BitWidth = Ty->isIntOrIntVectorTy()

                          ? Ty->getScalarSizeInBits()

                          : DL.getPointerTypeSizeInBits(Ty->getScalarType());


  if (!BitWidth)

    return nullptr;


  KnownBits Op0Known(BitWidth);

  KnownBits Op1Known(BitWidth);


  {

    // Don't use dominating conditions when folding icmp using known bits. This

    // may convert signed into unsigned predicates in ways that other passes

    // (especially IndVarSimplify) may not be able to reliably undo.

    SimplifyQuery Q = SQ.getWithoutDomCondCache().getWithInstruction(&I);

    if (SimplifyDemandedBits(&I, 0, getDemandedBitsLHSMask(I, BitWidth),

                             Op0Known, Q))

      return &I;


    if (SimplifyDemandedBits(&I, 1, APInt::getAllOnes(BitWidth), Op1Known, Q))

      return &I;

  }


  if (!isa<Constant>(Op0) && Op0Known.isConstant())

    return new ICmpInst(

        Pred, ConstantExpr::getIntegerValue(Ty, Op0Known.getConstant()), Op1);

  if (!isa<Constant>(Op1) && Op1Known.isConstant())

    return new ICmpInst(

        Pred, Op0, ConstantExpr::getIntegerValue(Ty, Op1Known.getConstant()));


  if (std::optional<bool> Res = ICmpInst::compare(Op0Known, Op1Known, Pred))

    return replaceInstUsesWith(I, ConstantInt::getBool(I.getType(), *Res));


  // Given the known and unknown bits, compute a range that the LHS could be

  // in.  Compute the Min, Max and RHS values based on the known bits. For the

  // EQ and NE we use unsigned values.

  APInt Op0Min(BitWidth, 0), Op0Max(BitWidth, 0);

  APInt Op1Min(BitWidth, 0), Op1Max(BitWidth, 0);

  if (I.isSigned()) {

    Op0Min = Op0Known.getSignedMinValue();

    Op0Max = Op0Known.getSignedMaxValue();

    Op1Min = Op1Known.getSignedMinValue();

    Op1Max = Op1Known.getSignedMaxValue();

  } else {

    Op0Min = Op0Known.getMinValue();

    Op0Max = Op0Known.getMaxValue();

    Op1Min = Op1Known.getMinValue();

    Op1Max = Op1Known.getMaxValue();

  }


  // Don't break up a clamp pattern -- (min(max X, Y), Z) -- by replacing a

  // min/max canonical compare with some other compare. That could lead to

  // conflict with select canonicalization and infinite looping.

  // FIXME: This constraint may go away if min/max intrinsics are canonical.

  auto isMinMaxCmp = [&](Instruction &Cmp) {

    if (!Cmp.hasOneUse())

      return false;

    Value *A, *B;

    SelectPatternFlavor SPF = matchSelectPattern(Cmp.user_back(), A, B).Flavor;

    if (!SelectPatternResult::isMinOrMax(SPF))

      return false;

    return match(Op0, m_MaxOrMin(m_Value(), m_Value())) ||

           match(Op1, m_MaxOrMin(m_Value(), m_Value()));

  };

  if (!isMinMaxCmp(I)) {

    switch (Pred) {

    default:

      break;

    case ICmpInst::ICMP_ULT: {

      if (Op1Min == Op0Max) // A <u B -> A != B if max(A) == min(B)

        return new ICmpInst(ICmpInst::ICMP_NE, Op0, Op1);

      const APInt *CmpC;

      if (match(Op1, m_APInt(CmpC))) {

        // A <u C -> A == C-1 if min(A)+1 == C

        if (*CmpC == Op0Min + 1)

          return new ICmpInst(ICmpInst::ICMP_EQ, Op0,

                              ConstantInt::get(Op1->getType(), *CmpC - 1));

        // X <u C --> X == 0, if the number of zero bits in the bottom of X

        // exceeds the log2 of C.

        if (Op0Known.countMinTrailingZeros() >= CmpC->ceilLogBase2())

          return new ICmpInst(ICmpInst::ICMP_EQ, Op0,

                              Constant::getNullValue(Op1->getType()));

      }

      break;

    }

    case ICmpInst::ICMP_UGT: {

      if (Op1Max == Op0Min) // A >u B -> A != B if min(A) == max(B)

        return new ICmpInst(ICmpInst::ICMP_NE, Op0, Op1);

      const APInt *CmpC;

      if (match(Op1, m_APInt(CmpC))) {

        // A >u C -> A == C+1 if max(a)-1 == C

        if (*CmpC == Op0Max - 1)

          return new ICmpInst(ICmpInst::ICMP_EQ, Op0,

                              ConstantInt::get(Op1->getType(), *CmpC + 1));

        // X >u C --> X != 0, if the number of zero bits in the bottom of X

        // exceeds the log2 of C.

        if (Op0Known.countMinTrailingZeros() >= CmpC->getActiveBits())

          return new ICmpInst(ICmpInst::ICMP_NE, Op0,

                              Constant::getNullValue(Op1->getType()));

      }

      break;

    }

    case ICmpInst::ICMP_SLT: {

      if (Op1Min == Op0Max) // A <s B -> A != B if max(A) == min(B)

        return new ICmpInst(ICmpInst::ICMP_NE, Op0, Op1);

      const APInt *CmpC;

      if (match(Op1, m_APInt(CmpC))) {

        if (*CmpC == Op0Min + 1) // A <s C -> A == C-1 if min(A)+1 == C

          return new ICmpInst(ICmpInst::ICMP_EQ, Op0,

                              ConstantInt::get(Op1->getType(), *CmpC - 1));

      }

      break;

    }

    case ICmpInst::ICMP_SGT: {

      if (Op1Max == Op0Min) // A >s B -> A != B if min(A) == max(B)

        return new ICmpInst(ICmpInst::ICMP_NE, Op0, Op1);

      const APInt *CmpC;

      if (match(Op1, m_APInt(CmpC))) {

        if (*CmpC == Op0Max - 1) // A >s C -> A == C+1 if max(A)-1 == C

          return new ICmpInst(ICmpInst::ICMP_EQ, Op0,

                              ConstantInt::get(Op1->getType(), *CmpC + 1));

      }

      break;

    }

    }

  }


  // Based on the range information we know about the LHS, see if we can

  // simplify this comparison.  For example, (x&4) < 8 is always true.

  switch (Pred) {

  default:

    break;

  case ICmpInst::ICMP_EQ:

  case ICmpInst::ICMP_NE: {

    // If all bits are known zero except for one, then we know at most one bit

    // is set. If the comparison is against zero, then this is a check to see if

    // *that* bit is set.

    APInt Op0KnownZeroInverted = ~Op0Known.Zero;

    if (Op1Known.isZero()) {

      // If the LHS is an AND with the same constant, look through it.

      Value *LHS = nullptr;

      const APInt *LHSC;

      if (!match(Op0, m_And(m_Value(LHS), m_APInt(LHSC))) ||

          *LHSC != Op0KnownZeroInverted)

        LHS = Op0;


      Value *X;

      const APInt *C1;

      if (match(LHS, m_Shl(m_Power2(C1), m_Value(X)))) {

        Type *XTy = X->getType();

        unsigned Log2C1 = C1->countr_zero();

        APInt C2 = Op0KnownZeroInverted;

        APInt C2Pow2 = (C2 & ~(*C1 - 1)) + *C1;

        if (C2Pow2.isPowerOf2()) {

          // iff (C1 is pow2) & ((C2 & ~(C1-1)) + C1) is pow2):

          // ((C1 << X) & C2) == 0 -> X >= (Log2(C2+C1) - Log2(C1))

          // ((C1 << X) & C2) != 0 -> X  < (Log2(C2+C1) - Log2(C1))

          unsigned Log2C2 = C2Pow2.countr_zero();

          auto *CmpC = ConstantInt::get(XTy, Log2C2 - Log2C1);

          auto NewPred =

              Pred == CmpInst::ICMP_EQ ? CmpInst::ICMP_UGE : CmpInst::ICMP_ULT;

          return new ICmpInst(NewPred, X, CmpC);

        }

      }

    }


    // Op0 eq C_Pow2 -> Op0 ne 0 if Op0 is known to be C_Pow2 or zero.

    if (Op1Known.isConstant() && Op1Known.getConstant().isPowerOf2() &&

        (Op0Known & Op1Known) == Op0Known)

      return new ICmpInst(CmpInst::getInversePredicate(Pred), Op0,

                          ConstantInt::getNullValue(Op1->getType()));

    break;

  }

  case ICmpInst::ICMP_SGE:

    if (Op1Min == Op0Max) // A >=s B -> A == B if max(A) == min(B)

      return new ICmpInst(ICmpInst::ICMP_EQ, Op0, Op1);

    break;

  case ICmpInst::ICMP_SLE:

    if (Op1Max == Op0Min) // A <=s B -> A == B if min(A) == max(B)

      return new ICmpInst(ICmpInst::ICMP_EQ, Op0, Op1);

    break;

  case ICmpInst::ICMP_UGE:

    if (Op1Min == Op0Max) // A >=u B -> A == B if max(A) == min(B)

      return new ICmpInst(ICmpInst::ICMP_EQ, Op0, Op1);

    break;

  case ICmpInst::ICMP_ULE:

    if (Op1Max == Op0Min) // A <=u B -> A == B if min(A) == max(B)

      return new ICmpInst(ICmpInst::ICMP_EQ, Op0, Op1);

    break;

  }


  // Turn a signed comparison into an unsigned one if both operands are known to

  // have the same sign. Set samesign if possible (except for equality

  // predicates).

  if ((I.isSigned() || (I.isUnsigned() && !I.hasSameSign())) &&

      ((Op0Known.Zero.isNegative() && Op1Known.Zero.isNegative()) ||

       (Op0Known.One.isNegative() && Op1Known.One.isNegative()))) {

    I.setPredicate(I.getUnsignedPredicate());

    I.setSameSign();

    return &I;

  }


  return nullptr;

}


/// If one operand of an icmp is effectively a bool (value range of {0,1}),

/// then try to reduce patterns based on that limit.


Instruction *InstCombinerImpl::foldICmpUsingBoolRange(ICmpInst &I) {

  Value *X, *Y;

  CmpPredicate Pred;


  // X must be 0 and bool must be true for "ULT":

  // X <u (zext i1 Y) --> (X == 0) & Y

  if (match(&I, m_c_ICmp(Pred, m_Value(X), m_OneUse(m_ZExt(m_Value(Y))))) &&

      Y->getType()->isIntOrIntVectorTy(1) && Pred == ICmpInst::ICMP_ULT)

    return BinaryOperator::CreateAnd(Builder.CreateIsNull(X), Y);


  // X must be 0 or bool must be true for "ULE":

  // X <=u (sext i1 Y) --> (X == 0) | Y

  if (match(&I, m_c_ICmp(Pred, m_Value(X), m_OneUse(m_SExt(m_Value(Y))))) &&

      Y->getType()->isIntOrIntVectorTy(1) && Pred == ICmpInst::ICMP_ULE)

    return BinaryOperator::CreateOr(Builder.CreateIsNull(X), Y);


  // icmp eq/ne X, (zext/sext (icmp eq/ne X, C))

  CmpPredicate Pred1, Pred2;

  const APInt *C;

  Instruction *ExtI;

  if (match(&I, m_c_ICmp(Pred1, m_Value(X),

                         m_CombineAnd(m_Instruction(ExtI),

                                      m_ZExtOrSExt(m_ICmp(Pred2, m_Deferred(X),

                                                          m_APInt(C)))))) &&

      ICmpInst::isEquality(Pred1) && ICmpInst::isEquality(Pred2)) {

    bool IsSExt = ExtI->getOpcode() == Instruction::SExt;

    bool HasOneUse = ExtI->hasOneUse() && ExtI->getOperand(0)->hasOneUse();

    auto CreateRangeCheck = [&] {

      Value *CmpV1 =

          Builder.CreateICmp(Pred1, X, Constant::getNullValue(X->getType()));

      Value *CmpV2 = Builder.CreateICmp(

          Pred1, X, ConstantInt::getSigned(X->getType(), IsSExt ? -1 : 1));

      return BinaryOperator::Create(

          Pred1 == ICmpInst::ICMP_EQ ? Instruction::Or : Instruction::And,

          CmpV1, CmpV2);

    };

    if (C->isZero()) {

      if (Pred2 == ICmpInst::ICMP_EQ) {

        // icmp eq X, (zext/sext (icmp eq X, 0)) --> false

        // icmp ne X, (zext/sext (icmp eq X, 0)) --> true

        return replaceInstUsesWith(

            I, ConstantInt::getBool(I.getType(), Pred1 == ICmpInst::ICMP_NE));

      } else if (!IsSExt || HasOneUse) {

        // icmp eq X, (zext (icmp ne X, 0)) --> X == 0 || X == 1

        // icmp ne X, (zext (icmp ne X, 0)) --> X != 0 && X != 1

        // icmp eq X, (sext (icmp ne X, 0)) --> X == 0 || X == -1

        // icmp ne X, (sext (icmp ne X, 0)) --> X != 0 && X != -1

        return CreateRangeCheck();

      }

    } else if (IsSExt ? C->isAllOnes() : C->isOne()) {

      if (Pred2 == ICmpInst::ICMP_NE) {

        // icmp eq X, (zext (icmp ne X, 1)) --> false

        // icmp ne X, (zext (icmp ne X, 1)) --> true

        // icmp eq X, (sext (icmp ne X, -1)) --> false

        // icmp ne X, (sext (icmp ne X, -1)) --> true

        return replaceInstUsesWith(

            I, ConstantInt::getBool(I.getType(), Pred1 == ICmpInst::ICMP_NE));

      } else if (!IsSExt || HasOneUse) {

        // icmp eq X, (zext (icmp eq X, 1)) --> X == 0 || X == 1

        // icmp ne X, (zext (icmp eq X, 1)) --> X != 0 && X != 1

        // icmp eq X, (sext (icmp eq X, -1)) --> X == 0 || X == -1

        // icmp ne X, (sext (icmp eq X, -1)) --> X != 0 && X == -1

        return CreateRangeCheck();

      }

    } else {

      // when C != 0 && C != 1:

      //   icmp eq X, (zext (icmp eq X, C)) --> icmp eq X, 0

      //   icmp eq X, (zext (icmp ne X, C)) --> icmp eq X, 1

      //   icmp ne X, (zext (icmp eq X, C)) --> icmp ne X, 0

      //   icmp ne X, (zext (icmp ne X, C)) --> icmp ne X, 1

      // when C != 0 && C != -1:

      //   icmp eq X, (sext (icmp eq X, C)) --> icmp eq X, 0

      //   icmp eq X, (sext (icmp ne X, C)) --> icmp eq X, -1

      //   icmp ne X, (sext (icmp eq X, C)) --> icmp ne X, 0

      //   icmp ne X, (sext (icmp ne X, C)) --> icmp ne X, -1

      return ICmpInst::Create(

          Instruction::ICmp, Pred1, X,

          ConstantInt::getSigned(X->getType(), Pred2 == ICmpInst::ICMP_NE

                                                   ? (IsSExt ? -1 : 1)

                                                   : 0));

    }

  }


  return nullptr;

}


/// If we have an icmp le or icmp ge instruction with a constant operand, turn

/// it into the appropriate icmp lt or icmp gt instruction. This transform

/// allows them to be folded in visitICmpInst.


static ICmpInst *canonicalizeCmpWithConstant(ICmpInst &I) {

  ICmpInst::Predicate Pred = I.getPredicate();

  if (ICmpInst::isEquality(Pred) || !ICmpInst::isIntPredicate(Pred) ||

      InstCombiner::isCanonicalPredicate(Pred))

    return nullptr;


  Value *Op0 = I.getOperand(0);

  Value *Op1 = I.getOperand(1);

  auto *Op1C = dyn_cast<Constant>(Op1);

  if (!Op1C)

    return nullptr;


  auto FlippedStrictness = getFlippedStrictnessPredicateAndConstant(Pred, Op1C);

  if (!FlippedStrictness)

    return nullptr;


  return new ICmpInst(FlippedStrictness->first, Op0, FlippedStrictness->second);

}


/// If we have a comparison with a non-canonical predicate, if we can update

/// all the users, invert the predicate and adjust all the users.


CmpInst *InstCombinerImpl::canonicalizeICmpPredicate(CmpInst &I) {

  // Is the predicate already canonical?

  CmpInst::Predicate Pred = I.getPredicate();

  if (InstCombiner::isCanonicalPredicate(Pred))

    return nullptr;


  // Can all users be adjusted to predicate inversion?

  if (!InstCombiner::canFreelyInvertAllUsersOf(&I, /*IgnoredUser=*/nullptr))

    return nullptr;


  // Ok, we can canonicalize comparison!

  // Let's first invert the comparison's predicate.

  I.setPredicate(CmpInst::getInversePredicate(Pred));

  I.setName(I.getName() + ".not");


  // And, adapt users.

  freelyInvertAllUsersOf(&I);


  return &I;

}


/// Integer compare with boolean values can always be turned into bitwise ops.


static Instruction *canonicalizeICmpBool(ICmpInst &I,

                                         InstCombiner::BuilderTy &Builder) {

  Value *A = I.getOperand(0), *B = I.getOperand(1);

  assert(A->getType()->isIntOrIntVectorTy(1) && "Bools only");


  // A boolean compared to true/false can be simplified to Op0/true/false in

  // 14 out of the 20 (10 predicates * 2 constants) possible combinations.

  // Cases not handled by InstSimplify are always 'not' of Op0.

  if (match(B, m_Zero())) {

    switch (I.getPredicate()) {

    case CmpInst::ICMP_EQ:  // A ==   0 -> !A

    case CmpInst::ICMP_ULE: // A <=u  0 -> !A

    case CmpInst::ICMP_SGE: // A >=s  0 -> !A

      return BinaryOperator::CreateNot(A);

    default:

      llvm_unreachable("ICmp i1 X, C not simplified as expected.");

    }

  } else if (match(B, m_One())) {

    switch (I.getPredicate()) {

    case CmpInst::ICMP_NE:  // A !=  1 -> !A

    case CmpInst::ICMP_ULT: // A <u  1 -> !A

    case CmpInst::ICMP_SGT: // A >s -1 -> !A

      return BinaryOperator::CreateNot(A);

    default:

      llvm_unreachable("ICmp i1 X, C not simplified as expected.");

    }

  }


  switch (I.getPredicate()) {

  default:

    llvm_unreachable("Invalid icmp instruction!");

  case ICmpInst::ICMP_EQ:

    // icmp eq i1 A, B -> ~(A ^ B)

    return BinaryOperator::CreateNot(Builder.CreateXor(A, B));


  case ICmpInst::ICMP_NE:

    // icmp ne i1 A, B -> A ^ B

    return BinaryOperator::CreateXor(A, B);


  case ICmpInst::ICMP_UGT:

    // icmp ugt -> icmp ult

    std::swap(A, B);

    [[fallthrough]];

  case ICmpInst::ICMP_ULT:

    // icmp ult i1 A, B -> ~A & B

    return BinaryOperator::CreateAnd(Builder.CreateNot(A), B);


  case ICmpInst::ICMP_SGT:

    // icmp sgt -> icmp slt

    std::swap(A, B);

    [[fallthrough]];

  case ICmpInst::ICMP_SLT:

    // icmp slt i1 A, B -> A & ~B

    return BinaryOperator::CreateAnd(Builder.CreateNot(B), A);


  case ICmpInst::ICMP_UGE:

    // icmp uge -> icmp ule

    std::swap(A, B);

    [[fallthrough]];

  case ICmpInst::ICMP_ULE:

    // icmp ule i1 A, B -> ~A | B

    return BinaryOperator::CreateOr(Builder.CreateNot(A), B);


  case ICmpInst::ICMP_SGE:

    // icmp sge -> icmp sle

    std::swap(A, B);

    [[fallthrough]];

  case ICmpInst::ICMP_SLE:

    // icmp sle i1 A, B -> A | ~B

    return BinaryOperator::CreateOr(Builder.CreateNot(B), A);

  }

}


// Transform pattern like:

//   (1 << Y) u<= X  or  ~(-1 << Y) u<  X  or  ((1 << Y)+(-1)) u<  X

//   (1 << Y) u>  X  or  ~(-1 << Y) u>= X  or  ((1 << Y)+(-1)) u>= X

// Into:

//   (X l>> Y) != 0

//   (X l>> Y) == 0


static Instruction *foldICmpWithHighBitMask(ICmpInst &Cmp,

                                            InstCombiner::BuilderTy &Builder) {

  CmpPredicate Pred, NewPred;

  Value *X, *Y;

  if (match(&Cmp,

            m_c_ICmp(Pred, m_OneUse(m_Shl(m_One(), m_Value(Y))), m_Value(X)))) {

    switch (Pred) {

    case ICmpInst::ICMP_ULE:

      NewPred = ICmpInst::ICMP_NE;

      break;

    case ICmpInst::ICMP_UGT:

      NewPred = ICmpInst::ICMP_EQ;

      break;

    default:

      return nullptr;

    }

  } else if (match(&Cmp, m_c_ICmp(Pred,

                                  m_OneUse(m_CombineOr(

                                      m_Not(m_Shl(m_AllOnes(), m_Value(Y))),

                                      m_Add(m_Shl(m_One(), m_Value(Y)),

                                            m_AllOnes()))),

                                  m_Value(X)))) {

    // The variant with 'add' is not canonical, (the variant with 'not' is)

    // we only get it because it has extra uses, and can't be canonicalized,


    switch (Pred) {

    case ICmpInst::ICMP_ULT:

      NewPred = ICmpInst::ICMP_NE;

      break;

    case ICmpInst::ICMP_UGE:

      NewPred = ICmpInst::ICMP_EQ;

      break;

    default:

      return nullptr;

    }

  } else

    return nullptr;


  Value *NewX = Builder.CreateLShr(X, Y, X->getName() + ".highbits");

  Constant *Zero = Constant::getNullValue(NewX->getType());

  return CmpInst::Create(Instruction::ICmp, NewPred, NewX, Zero);

}


static Instruction *foldVectorCmp(CmpInst &Cmp,

                                  InstCombiner::BuilderTy &Builder) {

  const CmpInst::Predicate Pred = Cmp.getPredicate();

  Value *LHS = Cmp.getOperand(0), *RHS = Cmp.getOperand(1);

  Value *V1, *V2;


  auto createCmpReverse = [&](CmpInst::Predicate Pred, Value *X, Value *Y) {

    Value *V = Builder.CreateCmp(Pred, X, Y, Cmp.getName());

    if (auto *I = dyn_cast<Instruction>(V))

      I->copyIRFlags(&Cmp);

    Module *M = Cmp.getModule();

    Function *F = Intrinsic::getOrInsertDeclaration(

        M, Intrinsic::vector_reverse, V->getType());

    return CallInst::Create(F, V);

  };


  if (match(LHS, m_VecReverse(m_Value(V1)))) {

    // cmp Pred, rev(V1), rev(V2) --> rev(cmp Pred, V1, V2)

    if (match(RHS, m_VecReverse(m_Value(V2))) &&

        (LHS->hasOneUse() || RHS->hasOneUse()))

      return createCmpReverse(Pred, V1, V2);


    // cmp Pred, rev(V1), RHSSplat --> rev(cmp Pred, V1, RHSSplat)

    if (LHS->hasOneUse() && isSplatValue(RHS))

      return createCmpReverse(Pred, V1, RHS);

  }

  // cmp Pred, LHSSplat, rev(V2) --> rev(cmp Pred, LHSSplat, V2)

  else if (isSplatValue(LHS) && match(RHS, m_OneUse(m_VecReverse(m_Value(V2)))))

    return createCmpReverse(Pred, LHS, V2);


  ArrayRef<int> M;

  if (!match(LHS, m_Shuffle(m_Value(V1), m_Undef(), m_Mask(M))))

    return nullptr;


  // If both arguments of the cmp are shuffles that use the same mask and

  // shuffle within a single vector, move the shuffle after the cmp:

  // cmp (shuffle V1, M), (shuffle V2, M) --> shuffle (cmp V1, V2), M

  Type *V1Ty = V1->getType();

  if (match(RHS, m_Shuffle(m_Value(V2), m_Undef(), m_SpecificMask(M))) &&

      V1Ty == V2->getType() && (LHS->hasOneUse() || RHS->hasOneUse())) {

    Value *NewCmp = Builder.CreateCmp(Pred, V1, V2);

    return new ShuffleVectorInst(NewCmp, M);

  }


  // Try to canonicalize compare with splatted operand and splat constant.

  // TODO: We could generalize this for more than splats. See/use the code in

  //       InstCombiner::foldVectorBinop().

  Constant *C;

  if (!LHS->hasOneUse() || !match(RHS, m_Constant(C)))

    return nullptr;


  // Length-changing splats are ok, so adjust the constants as needed:

  // cmp (shuffle V1, M), C --> shuffle (cmp V1, C'), M

  Constant *ScalarC = C->getSplatValue(/* AllowPoison */ true);

  int MaskSplatIndex;

  if (ScalarC && match(M, m_SplatOrPoisonMask(MaskSplatIndex))) {

    // We allow poison in matching, but this transform removes it for safety.

    // Demanded elements analysis should be able to recover some/all of that.

    C = ConstantVector::getSplat(cast<VectorType>(V1Ty)->getElementCount(),

                                 ScalarC);

    SmallVector<int, 8> NewM(M.size(), MaskSplatIndex);

    Value *NewCmp = Builder.CreateCmp(Pred, V1, C);

    return new ShuffleVectorInst(NewCmp, NewM);

  }


  return nullptr;

}


// extract(uadd.with.overflow(A, B), 0) ult A

//  -> extract(uadd.with.overflow(A, B), 1)


static Instruction *foldICmpOfUAddOv(ICmpInst &I) {

  CmpInst::Predicate Pred = I.getPredicate();

  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);


  Value *UAddOv;

  Value *A, *B;

  auto UAddOvResultPat = m_ExtractValue<0>(

      m_Intrinsic<Intrinsic::uadd_with_overflow>(m_Value(A), m_Value(B)));

  if (match(Op0, UAddOvResultPat) &&

      ((Pred == ICmpInst::ICMP_ULT && (Op1 == A || Op1 == B)) ||

       (Pred == ICmpInst::ICMP_EQ && match(Op1, m_ZeroInt()) &&

        (match(A, m_One()) || match(B, m_One()))) ||

       (Pred == ICmpInst::ICMP_NE && match(Op1, m_AllOnes()) &&

        (match(A, m_AllOnes()) || match(B, m_AllOnes())))))

    // extract(uadd.with.overflow(A, B), 0) < A

    // extract(uadd.with.overflow(A, 1), 0) == 0

    // extract(uadd.with.overflow(A, -1), 0) != -1

    UAddOv = cast<ExtractValueInst>(Op0)->getAggregateOperand();

  else if (match(Op1, UAddOvResultPat) && Pred == ICmpInst::ICMP_UGT &&

           (Op0 == A || Op0 == B))

    // A > extract(uadd.with.overflow(A, B), 0)

    UAddOv = cast<ExtractValueInst>(Op1)->getAggregateOperand();

  else

    return nullptr;


  return ExtractValueInst::Create(UAddOv, 1);

}


static Instruction *foldICmpInvariantGroup(ICmpInst &I) {

  if (!I.getOperand(0)->getType()->isPointerTy() ||

      NullPointerIsDefined(

          I.getParent()->getParent(),

          I.getOperand(0)->getType()->getPointerAddressSpace())) {

    return nullptr;

  }

  Instruction *Op;

  if (match(I.getOperand(0), m_Instruction(Op)) &&

      match(I.getOperand(1), m_Zero()) &&

      Op->isLaunderOrStripInvariantGroup()) {

    return ICmpInst::Create(Instruction::ICmp, I.getPredicate(),

                            Op->getOperand(0), I.getOperand(1));

  }

  return nullptr;

}


/// This function folds patterns produced by lowering of reduce idioms, such as

/// llvm.vector.reduce.and which are lowered into instruction chains. This code

/// attempts to generate fewer number of scalar comparisons instead of vector

/// comparisons when possible.


static Instruction *foldReductionIdiom(ICmpInst &I,

                                       InstCombiner::BuilderTy &Builder,

                                       const DataLayout &DL) {

  if (I.getType()->isVectorTy())

    return nullptr;

  CmpPredicate OuterPred, InnerPred;

  Value *LHS, *RHS;


  // Match lowering of @llvm.vector.reduce.and. Turn

  ///   %vec_ne = icmp ne <8 x i8> %lhs, %rhs

  ///   %scalar_ne = bitcast <8 x i1> %vec_ne to i8

  ///   %res = icmp <pred> i8 %scalar_ne, 0

  ///

  /// into

  ///

  ///   %lhs.scalar = bitcast <8 x i8> %lhs to i64

  ///   %rhs.scalar = bitcast <8 x i8> %rhs to i64

  ///   %res = icmp <pred> i64 %lhs.scalar, %rhs.scalar

  ///

  /// for <pred> in {ne, eq}.

  if (!match(&I, m_ICmp(OuterPred,

                        m_OneUse(m_BitCast(m_OneUse(

                            m_ICmp(InnerPred, m_Value(LHS), m_Value(RHS))))),

                        m_Zero())))

    return nullptr;

  auto *LHSTy = dyn_cast<FixedVectorType>(LHS->getType());

  if (!LHSTy || !LHSTy->getElementType()->isIntegerTy())

    return nullptr;

  unsigned NumBits =

      LHSTy->getNumElements() * LHSTy->getElementType()->getIntegerBitWidth();

  // TODO: Relax this to "not wider than max legal integer type"?

  if (!DL.isLegalInteger(NumBits))

    return nullptr;


  if (ICmpInst::isEquality(OuterPred) && InnerPred == ICmpInst::ICMP_NE) {

    auto *ScalarTy = Builder.getIntNTy(NumBits);

    LHS = Builder.CreateBitCast(LHS, ScalarTy, LHS->getName() + ".scalar");

    RHS = Builder.CreateBitCast(RHS, ScalarTy, RHS->getName() + ".scalar");

    return ICmpInst::Create(Instruction::ICmp, OuterPred, LHS, RHS,

                            I.getName());

  }


  return nullptr;

}


// This helper will be called with icmp operands in both orders.


Instruction *InstCombinerImpl::foldICmpCommutative(CmpPredicate Pred,

                                                   Value *Op0, Value *Op1,

                                                   ICmpInst &CxtI) {

  // Try to optimize 'icmp GEP, P' or 'icmp P, GEP'.

  if (auto *GEP = dyn_cast<GEPOperator>(Op0))

    if (Instruction *NI = foldGEPICmp(GEP, Op1, Pred, CxtI))

      return NI;


  if (auto *SI = dyn_cast<SelectInst>(Op0))

    if (Instruction *NI = foldSelectICmp(Pred, SI, Op1, CxtI))

      return NI;


  if (auto *MinMax = dyn_cast<MinMaxIntrinsic>(Op0))

    if (Instruction *Res = foldICmpWithMinMax(CxtI, MinMax, Op1, Pred))

      return Res;


  {

    Value *X;

    const APInt *C;

    // icmp X+Cst, X

    if (match(Op0, m_Add(m_Value(X), m_APInt(C))) && Op1 == X)

      return foldICmpAddOpConst(X, *C, Pred);

  }


  // abs(X) >=  X --> true

  // abs(X) u<= X --> true

  // abs(X) <   X --> false

  // abs(X) u>  X --> false

  // abs(X) u>= X --> IsIntMinPosion ? `X > -1`: `X u<= INTMIN`

  // abs(X) <=  X --> IsIntMinPosion ? `X > -1`: `X u<= INTMIN`

  // abs(X) ==  X --> IsIntMinPosion ? `X > -1`: `X u<= INTMIN`

  // abs(X) u<  X --> IsIntMinPosion ? `X < 0` : `X >   INTMIN`

  // abs(X) >   X --> IsIntMinPosion ? `X < 0` : `X >   INTMIN`

  // abs(X) !=  X --> IsIntMinPosion ? `X < 0` : `X >   INTMIN`

  {

    Value *X;

    Constant *C;

    if (match(Op0, m_Intrinsic<Intrinsic::abs>(m_Value(X), m_Constant(C))) &&

        match(Op1, m_Specific(X))) {

      Value *NullValue = Constant::getNullValue(X->getType());

      Value *AllOnesValue = Constant::getAllOnesValue(X->getType());

      const APInt SMin =

          APInt::getSignedMinValue(X->getType()->getScalarSizeInBits());

      bool IsIntMinPosion = C->isAllOnesValue();

      switch (Pred) {

      case CmpInst::ICMP_ULE:

      case CmpInst::ICMP_SGE:

        return replaceInstUsesWith(CxtI, ConstantInt::getTrue(CxtI.getType()));

      case CmpInst::ICMP_UGT:

      case CmpInst::ICMP_SLT:

        return replaceInstUsesWith(CxtI, ConstantInt::getFalse(CxtI.getType()));

      case CmpInst::ICMP_UGE:

      case CmpInst::ICMP_SLE:

      case CmpInst::ICMP_EQ: {

        return replaceInstUsesWith(

            CxtI, IsIntMinPosion

                      ? Builder.CreateICmpSGT(X, AllOnesValue)

                      : Builder.CreateICmpULT(

                            X, ConstantInt::get(X->getType(), SMin + 1)));

      }

      case CmpInst::ICMP_ULT:

      case CmpInst::ICMP_SGT:

      case CmpInst::ICMP_NE: {

        return replaceInstUsesWith(

            CxtI, IsIntMinPosion

                      ? Builder.CreateICmpSLT(X, NullValue)

                      : Builder.CreateICmpUGT(

                            X, ConstantInt::get(X->getType(), SMin)));

      }

      default:

        llvm_unreachable("Invalid predicate!");

      }

    }

  }


  const SimplifyQuery Q = SQ.getWithInstruction(&CxtI);

  if (Value *V = foldICmpWithLowBitMaskedVal(Pred, Op0, Op1, Q, *this))

    return replaceInstUsesWith(CxtI, V);


  // Folding (X / Y) pred X => X swap(pred) 0 for constant Y other than 0 or 1

  auto CheckUGT1 = [](const APInt &Divisor) { return Divisor.ugt(1); };

  {

    if (match(Op0, m_UDiv(m_Specific(Op1), m_CheckedInt(CheckUGT1)))) {

      return new ICmpInst(ICmpInst::getSwappedPredicate(Pred), Op1,

                          Constant::getNullValue(Op1->getType()));

    }


    if (!ICmpInst::isUnsigned(Pred) &&

        match(Op0, m_SDiv(m_Specific(Op1), m_CheckedInt(CheckUGT1)))) {

      return new ICmpInst(ICmpInst::getSwappedPredicate(Pred), Op1,

                          Constant::getNullValue(Op1->getType()));

    }

  }


  // Another case of this fold is (X >> Y) pred X => X swap(pred) 0 if Y != 0

  auto CheckNE0 = [](const APInt &Shift) { return !Shift.isZero(); };

  {

    if (match(Op0, m_LShr(m_Specific(Op1), m_CheckedInt(CheckNE0)))) {

      return new ICmpInst(ICmpInst::getSwappedPredicate(Pred), Op1,

                          Constant::getNullValue(Op1->getType()));

    }


    if ((Pred == CmpInst::ICMP_SLT || Pred == CmpInst::ICMP_SGE) &&

        match(Op0, m_AShr(m_Specific(Op1), m_CheckedInt(CheckNE0)))) {

      return new ICmpInst(ICmpInst::getSwappedPredicate(Pred), Op1,

                          Constant::getNullValue(Op1->getType()));

    }

  }


  return nullptr;

}


Instruction *InstCombinerImpl::visitICmpInst(ICmpInst &I) {

  bool Changed = false;

  const SimplifyQuery Q = SQ.getWithInstruction(&I);

  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);

  unsigned Op0Cplxity = getComplexity(Op0);

  unsigned Op1Cplxity = getComplexity(Op1);


  /// Orders the operands of the compare so that they are listed from most

  /// complex to least complex.  This puts constants before unary operators,

  /// before binary operators.

  if (Op0Cplxity < Op1Cplxity) {

    I.swapOperands();

    std::swap(Op0, Op1);

    Changed = true;

  }


  if (Value *V = simplifyICmpInst(I.getCmpPredicate(), Op0, Op1, Q))

    return replaceInstUsesWith(I, V);


  // Comparing -val or val with non-zero is the same as just comparing val

  // ie, abs(val) != 0 -> val != 0

  if (I.getPredicate() == ICmpInst::ICMP_NE && match(Op1, m_Zero())) {

    Value *Cond, *SelectTrue, *SelectFalse;

    if (match(Op0, m_Select(m_Value(Cond), m_Value(SelectTrue),

                            m_Value(SelectFalse)))) {

      if (Value *V = dyn_castNegVal(SelectTrue)) {

        if (V == SelectFalse)

          return CmpInst::Create(Instruction::ICmp, I.getPredicate(), V, Op1);

      } else if (Value *V = dyn_castNegVal(SelectFalse)) {

        if (V == SelectTrue)

          return CmpInst::Create(Instruction::ICmp, I.getPredicate(), V, Op1);

      }

    }

  }


  if (Instruction *Res = foldICmpTruncWithTruncOrExt(I, Q))

    return Res;


  if (Op0->getType()->isIntOrIntVectorTy(1))

    if (Instruction *Res = canonicalizeICmpBool(I, Builder))

      return Res;


  if (Instruction *Res = canonicalizeCmpWithConstant(I))

    return Res;


  if (Instruction *Res = canonicalizeICmpPredicate(I))

    return Res;


  if (Instruction *Res = foldICmpWithConstant(I))

    return Res;


  if (Instruction *Res = foldICmpWithDominatingICmp(I))

    return Res;


  if (Instruction *Res = foldICmpUsingBoolRange(I))

    return Res;


  if (Instruction *Res = foldICmpUsingKnownBits(I))

    return Res;


  if (Instruction *Res = foldIsMultipleOfAPowerOfTwo(I))

    return Res;


  // Test if the ICmpInst instruction is used exclusively by a select as

  // part of a minimum or maximum operation. If so, refrain from doing

  // any other folding. This helps out other analyses which understand

  // non-obfuscated minimum and maximum idioms, such as ScalarEvolution

  // and CodeGen. And in this case, at least one of the comparison

  // operands has at least one user besides the compare (the select),

  // which would often largely negate the benefit of folding anyway.

  //

  // Do the same for the other patterns recognized by matchSelectPattern.

  if (I.hasOneUse())

    if (SelectInst *SI = dyn_cast<SelectInst>(I.user_back())) {

      Value *A, *B;

      SelectPatternResult SPR = matchSelectPattern(SI, A, B);

      if (SPR.Flavor != SPF_UNKNOWN)

        return nullptr;

    }


  // Do this after checking for min/max to prevent infinite looping.

  if (Instruction *Res = foldICmpWithZero(I))

    return Res;


  // FIXME: We only do this after checking for min/max to prevent infinite

  // looping caused by a reverse canonicalization of these patterns for min/max.

  // FIXME: The organization of folds is a mess. These would naturally go into

  // canonicalizeCmpWithConstant(), but we can't move all of the above folds

  // down here after the min/max restriction.

  ICmpInst::Predicate Pred = I.getPredicate();

  const APInt *C;

  if (match(Op1, m_APInt(C))) {

    // For i32: x >u 2147483647 -> x <s 0  -> true if sign bit set

    if (Pred == ICmpInst::ICMP_UGT && C->isMaxSignedValue()) {

      Constant *Zero = Constant::getNullValue(Op0->getType());

      return new ICmpInst(ICmpInst::ICMP_SLT, Op0, Zero);

    }


    // For i32: x <u 2147483648 -> x >s -1  -> true if sign bit clear

    if (Pred == ICmpInst::ICMP_ULT && C->isMinSignedValue()) {

      Constant *AllOnes = Constant::getAllOnesValue(Op0->getType());

      return new ICmpInst(ICmpInst::ICMP_SGT, Op0, AllOnes);

    }

  }


  // The folds in here may rely on wrapping flags and special constants, so

  // they can break up min/max idioms in some cases but not seemingly similar

  // patterns.

  // FIXME: It may be possible to enhance select folding to make this

  //        unnecessary. It may also be moot if we canonicalize to min/max

  //        intrinsics.

  if (Instruction *Res = foldICmpBinOp(I, Q))

    return Res;


  if (Instruction *Res = foldICmpInstWithConstant(I))

    return Res;


  // Try to match comparison as a sign bit test. Intentionally do this after

  // foldICmpInstWithConstant() to potentially let other folds to happen first.

  if (Instruction *New = foldSignBitTest(I))

    return New;


  if (auto *PN = dyn_cast<PHINode>(Op0))

    if (Instruction *NV = foldOpIntoPhi(I, PN))

      return NV;

  if (auto *PN = dyn_cast<PHINode>(Op1))

    if (Instruction *NV = foldOpIntoPhi(I, PN))

      return NV;


  if (Instruction *Res = foldICmpInstWithConstantNotInt(I))

    return Res;


  if (Instruction *Res = foldICmpCommutative(I.getCmpPredicate(), Op0, Op1, I))

    return Res;

  if (Instruction *Res =

          foldICmpCommutative(I.getSwappedCmpPredicate(), Op1, Op0, I))

    return Res;


  if (I.isCommutative()) {

    if (auto Pair = matchSymmetricPair(I.getOperand(0), I.getOperand(1))) {

      replaceOperand(I, 0, Pair->first);

      replaceOperand(I, 1, Pair->second);

      return &I;

    }

  }


  // In case of a comparison with two select instructions having the same

  // condition, check whether one of the resulting branches can be simplified.

  // If so, just compare the other branch and select the appropriate result.

  // For example:

  //   %tmp1 = select i1 %cmp, i32 %y, i32 %x

  //   %tmp2 = select i1 %cmp, i32 %z, i32 %x

  //   %cmp2 = icmp slt i32 %tmp2, %tmp1

  // The icmp will result false for the false value of selects and the result

  // will depend upon the comparison of true values of selects if %cmp is

  // true. Thus, transform this into:

  //   %cmp = icmp slt i32 %y, %z

  //   %sel = select i1 %cond, i1 %cmp, i1 false

  // This handles similar cases to transform.

  {

    Value *Cond, *A, *B, *C, *D;

    if (match(Op0, m_Select(m_Value(Cond), m_Value(A), m_Value(B))) &&

        match(Op1, m_Select(m_Specific(Cond), m_Value(C), m_Value(D))) &&

        (Op0->hasOneUse() || Op1->hasOneUse())) {

      // Check whether comparison of TrueValues can be simplified

      if (Value *Res = simplifyICmpInst(Pred, A, C, SQ)) {

        Value *NewICMP = Builder.CreateICmp(Pred, B, D);

        return SelectInst::Create(Cond, Res, NewICMP);

      }

      // Check whether comparison of FalseValues can be simplified

      if (Value *Res = simplifyICmpInst(Pred, B, D, SQ)) {

        Value *NewICMP = Builder.CreateICmp(Pred, A, C);

        return SelectInst::Create(Cond, NewICMP, Res);

      }

    }

  }


  // icmp slt (sub nsw x, y), (add nsw x, y)  -->  icmp sgt y, 0

  // icmp ult (sub nuw x, y), (add nuw x, y)  -->  icmp ugt y, 0

  // icmp eq (sub nsw/nuw x, y), (add nsw/nuw x, y)   -->  icmp eq y, 0

  {

    Value *A, *B;

    CmpPredicate CmpPred;

    if (match(&I, m_c_ICmp(CmpPred, m_Sub(m_Value(A), m_Value(B)),

                           m_c_Add(m_Deferred(A), m_Deferred(B))))) {

      auto *I0 = cast<OverflowingBinaryOperator>(Op0);

      auto *I1 = cast<OverflowingBinaryOperator>(Op1);

      bool I0NUW = I0->hasNoUnsignedWrap();

      bool I1NUW = I1->hasNoUnsignedWrap();

      bool I0NSW = I0->hasNoSignedWrap();

      bool I1NSW = I1->hasNoSignedWrap();

      if ((ICmpInst::isUnsigned(Pred) && I0NUW && I1NUW) ||

          (ICmpInst::isSigned(Pred) && I0NSW && I1NSW) ||

          (ICmpInst::isEquality(Pred) &&

           ((I0NUW || I0NSW) && (I1NUW || I1NSW)))) {

        return new ICmpInst(CmpPredicate::getSwapped(CmpPred), B,

                            ConstantInt::get(Op0->getType(), 0));

      }

    }

  }


  // Try to optimize equality comparisons against alloca-based pointers.

  if (Op0->getType()->isPointerTy() && I.isEquality()) {

    assert(Op1->getType()->isPointerTy() &&

           "Comparing pointer with non-pointer?");

    if (auto *Alloca = dyn_cast<AllocaInst>(getUnderlyingObject(Op0)))

      if (foldAllocaCmp(Alloca))

        return nullptr;

    if (auto *Alloca = dyn_cast<AllocaInst>(getUnderlyingObject(Op1)))

      if (foldAllocaCmp(Alloca))

        return nullptr;

  }


  if (Instruction *Res = foldICmpBitCast(I))

    return Res;


  // TODO: Hoist this above the min/max bailout.

  if (Instruction *R = foldICmpWithCastOp(I))

    return R;


  {

    Value *X, *Y;

    // Transform (X & ~Y) == 0 --> (X & Y) != 0

    // and       (X & ~Y) != 0 --> (X & Y) == 0

    // if A is a power of 2.

    if (match(Op0, m_And(m_Value(X), m_Not(m_Value(Y)))) &&

        match(Op1, m_Zero()) && isKnownToBeAPowerOfTwo(X, false, &I) &&

        I.isEquality())

      return new ICmpInst(I.getInversePredicate(), Builder.CreateAnd(X, Y),

                          Op1);


    // Op0 pred Op1 -> ~Op1 pred ~Op0, if this allows us to drop an instruction.

    if (Op0->getType()->isIntOrIntVectorTy()) {

      bool ConsumesOp0, ConsumesOp1;

      if (isFreeToInvert(Op0, Op0->hasOneUse(), ConsumesOp0) &&

          isFreeToInvert(Op1, Op1->hasOneUse(), ConsumesOp1) &&

          (ConsumesOp0 || ConsumesOp1)) {

        Value *InvOp0 = getFreelyInverted(Op0, Op0->hasOneUse(), &Builder);

        Value *InvOp1 = getFreelyInverted(Op1, Op1->hasOneUse(), &Builder);

        assert(InvOp0 && InvOp1 &&

               "Mismatch between isFreeToInvert and getFreelyInverted");

        return new ICmpInst(I.getSwappedPredicate(), InvOp0, InvOp1);

      }

    }


    Instruction *AddI = nullptr;

    if (match(&I, m_UAddWithOverflow(m_Value(X), m_Value(Y),

                                     m_Instruction(AddI))) &&

        isa<IntegerType>(X->getType())) {

      Value *Result;

      Constant *Overflow;

      // m_UAddWithOverflow can match patterns that do not include  an explicit

      // "add" instruction, so check the opcode of the matched op.

      if (AddI->getOpcode() == Instruction::Add &&

          OptimizeOverflowCheck(Instruction::Add, /*Signed*/ false, X, Y, *AddI,

                                Result, Overflow)) {

        replaceInstUsesWith(*AddI, Result);

        eraseInstFromFunction(*AddI);

        return replaceInstUsesWith(I, Overflow);

      }

    }


    // (zext X) * (zext Y)  --> llvm.umul.with.overflow.

    if (match(Op0, m_NUWMul(m_ZExt(m_Value(X)), m_ZExt(m_Value(Y)))) &&

        match(Op1, m_APInt(C))) {

      if (Instruction *R = processUMulZExtIdiom(I, Op0, C, *this))

        return R;

    }


    // Signbit test folds

    // Fold (X u>> BitWidth - 1 Pred ZExt(i1))  -->  X s< 0 Pred i1

    // Fold (X s>> BitWidth - 1 Pred SExt(i1))  -->  X s< 0 Pred i1

    Instruction *ExtI;

    if ((I.isUnsigned() || I.isEquality()) &&

        match(Op1,

              m_CombineAnd(m_Instruction(ExtI), m_ZExtOrSExt(m_Value(Y)))) &&

        Y->getType()->getScalarSizeInBits() == 1 &&

        (Op0->hasOneUse() || Op1->hasOneUse())) {

      unsigned OpWidth = Op0->getType()->getScalarSizeInBits();

      Instruction *ShiftI;

      if (match(Op0, m_CombineAnd(m_Instruction(ShiftI),

                                  m_Shr(m_Value(X), m_SpecificIntAllowPoison(

                                                        OpWidth - 1))))) {

        unsigned ExtOpc = ExtI->getOpcode();

        unsigned ShiftOpc = ShiftI->getOpcode();

        if ((ExtOpc == Instruction::ZExt && ShiftOpc == Instruction::LShr) ||

            (ExtOpc == Instruction::SExt && ShiftOpc == Instruction::AShr)) {

          Value *SLTZero =

              Builder.CreateICmpSLT(X, Constant::getNullValue(X->getType()));

          Value *Cmp = Builder.CreateICmp(Pred, SLTZero, Y, I.getName());

          return replaceInstUsesWith(I, Cmp);

        }

      }

    }

  }


  if (Instruction *Res = foldICmpEquality(I))

    return Res;


  if (Instruction *Res = foldICmpPow2Test(I, Builder))

    return Res;


  if (Instruction *Res = foldICmpOfUAddOv(I))

    return Res;


  // The 'cmpxchg' instruction returns an aggregate containing the old value and

  // an i1 which indicates whether or not we successfully did the swap.

  //

  // Replace comparisons between the old value and the expected value with the

  // indicator that 'cmpxchg' returns.

  //

  // N.B.  This transform is only valid when the 'cmpxchg' is not permitted to

  // spuriously fail.  In those cases, the old value may equal the expected

  // value but it is possible for the swap to not occur.

  if (I.getPredicate() == ICmpInst::ICMP_EQ)

    if (auto *EVI = dyn_cast<ExtractValueInst>(Op0))

      if (auto *ACXI = dyn_cast<AtomicCmpXchgInst>(EVI->getAggregateOperand()))

        if (EVI->getIndices()[0] == 0 && ACXI->getCompareOperand() == Op1 &&

            !ACXI->isWeak())

          return ExtractValueInst::Create(ACXI, 1);


  if (Instruction *Res = foldICmpWithHighBitMask(I, Builder))

    return Res;


  if (I.getType()->isVectorTy())

    if (Instruction *Res = foldVectorCmp(I, Builder))

      return Res;


  if (Instruction *Res = foldICmpInvariantGroup(I))

    return Res;


  if (Instruction *Res = foldReductionIdiom(I, Builder, DL))

    return Res;


  {

    Value *A;

    const APInt *C1, *C2;

    ICmpInst::Predicate Pred = I.getPredicate();

    if (ICmpInst::isEquality(Pred)) {

      // sext(a) & c1 == c2 --> a & c3 == trunc(c2)

      // sext(a) & c1 != c2 --> a & c3 != trunc(c2)

      if (match(Op0, m_And(m_SExt(m_Value(A)), m_APInt(C1))) &&

          match(Op1, m_APInt(C2))) {

        Type *InputTy = A->getType();

        unsigned InputBitWidth = InputTy->getScalarSizeInBits();

        // c2 must be non-negative at the bitwidth of a.

        if (C2->getActiveBits() < InputBitWidth) {

          APInt TruncC1 = C1->trunc(InputBitWidth);

          // Check if there are 1s in C1 high bits of size InputBitWidth.

          if (C1->uge(APInt::getOneBitSet(C1->getBitWidth(), InputBitWidth)))

            TruncC1.setBit(InputBitWidth - 1);

          Value *AndInst = Builder.CreateAnd(A, TruncC1);

          return new ICmpInst(

              Pred, AndInst,

              ConstantInt::get(InputTy, C2->trunc(InputBitWidth)));

        }

      }

    }

  }


  return Changed ? &I : nullptr;

}


/// Fold fcmp ([us]itofp x, cst) if possible.


Instruction *InstCombinerImpl::foldFCmpIntToFPConst(FCmpInst &I,

                                                    Instruction *LHSI,

                                                    Constant *RHSC) {

  const APFloat *RHS;

  if (!match(RHSC, m_APFloat(RHS)))

    return nullptr;


  // Get the width of the mantissa.  We don't want to hack on conversions that

  // might lose information from the integer, e.g. "i64 -> float"

  int MantissaWidth = LHSI->getType()->getFPMantissaWidth();

  if (MantissaWidth == -1)

    return nullptr; // Unknown.


  Type *IntTy = LHSI->getOperand(0)->getType();

  unsigned IntWidth = IntTy->getScalarSizeInBits();

  bool LHSUnsigned = isa<UIToFPInst>(LHSI);


  if (I.isEquality()) {

    FCmpInst::Predicate P = I.getPredicate();

    bool IsExact = false;

    APSInt RHSCvt(IntWidth, LHSUnsigned);

    RHS->convertToInteger(RHSCvt, APFloat::rmNearestTiesToEven, &IsExact);


    // If the floating point constant isn't an integer value, we know if we will

    // ever compare equal / not equal to it.

    if (!IsExact) {

      // TODO: Can never be -0.0 and other non-representable values

      APFloat RHSRoundInt(*RHS);

      RHSRoundInt.roundToIntegral(APFloat::rmNearestTiesToEven);

      if (*RHS != RHSRoundInt) {

        if (P == FCmpInst::FCMP_OEQ || P == FCmpInst::FCMP_UEQ)

          return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));


        assert(P == FCmpInst::FCMP_ONE || P == FCmpInst::FCMP_UNE);

        return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));

      }

    }


    // TODO: If the constant is exactly representable, is it always OK to do

    // equality compares as integer?

  }


  // Check to see that the input is converted from an integer type that is small

  // enough that preserves all bits.  TODO: check here for "known" sign bits.

  // This would allow us to handle (fptosi (x >>s 62) to float) if x is i64 f.e.


  // Following test does NOT adjust IntWidth downwards for signed inputs,

  // because the most negative value still requires all the mantissa bits

  // to distinguish it from one less than that value.

  if ((int)IntWidth > MantissaWidth) {

    // Conversion would lose accuracy. Check if loss can impact comparison.

    int Exp = ilogb(*RHS);

    if (Exp == APFloat::IEK_Inf) {

      int MaxExponent = ilogb(APFloat::getLargest(RHS->getSemantics()));

      if (MaxExponent < (int)IntWidth - !LHSUnsigned)

        // Conversion could create infinity.

        return nullptr;

    } else {

      // Note that if RHS is zero or NaN, then Exp is negative

      // and first condition is trivially false.

      if (MantissaWidth <= Exp && Exp <= (int)IntWidth - !LHSUnsigned)

        // Conversion could affect comparison.

        return nullptr;

    }

  }


  // Otherwise, we can potentially simplify the comparison.  We know that it

  // will always come through as an integer value and we know the constant is

  // not a NAN (it would have been previously simplified).

  assert(!RHS->isNaN() && "NaN comparison not already folded!");


  ICmpInst::Predicate Pred;

  switch (I.getPredicate()) {

  default:

    llvm_unreachable("Unexpected predicate!");

  case FCmpInst::FCMP_UEQ:

  case FCmpInst::FCMP_OEQ:

    Pred = ICmpInst::ICMP_EQ;

    break;

  case FCmpInst::FCMP_UGT:

  case FCmpInst::FCMP_OGT:

    Pred = LHSUnsigned ? ICmpInst::ICMP_UGT : ICmpInst::ICMP_SGT;

    break;

  case FCmpInst::FCMP_UGE:

  case FCmpInst::FCMP_OGE:

    Pred = LHSUnsigned ? ICmpInst::ICMP_UGE : ICmpInst::ICMP_SGE;

    break;

  case FCmpInst::FCMP_ULT:

  case FCmpInst::FCMP_OLT:

    Pred = LHSUnsigned ? ICmpInst::ICMP_ULT : ICmpInst::ICMP_SLT;

    break;

  case FCmpInst::FCMP_ULE:

  case FCmpInst::FCMP_OLE:

    Pred = LHSUnsigned ? ICmpInst::ICMP_ULE : ICmpInst::ICMP_SLE;

    break;

  case FCmpInst::FCMP_UNE:

  case FCmpInst::FCMP_ONE:

    Pred = ICmpInst::ICMP_NE;

    break;

  case FCmpInst::FCMP_ORD:

    return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));

  case FCmpInst::FCMP_UNO:

    return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));

  }


  // Now we know that the APFloat is a normal number, zero or inf.


  // See if the FP constant is too large for the integer.  For example,

  // comparing an i8 to 300.0.

  if (!LHSUnsigned) {

    // If the RHS value is > SignedMax, fold the comparison.  This handles +INF

    // and large values.

    APFloat SMax(RHS->getSemantics());

    SMax.convertFromAPInt(APInt::getSignedMaxValue(IntWidth), true,

                          APFloat::rmNearestTiesToEven);

    if (SMax < *RHS) { // smax < 13123.0

      if (Pred == ICmpInst::ICMP_NE || Pred == ICmpInst::ICMP_SLT ||

          Pred == ICmpInst::ICMP_SLE)

        return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));

      return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));

    }

  } else {

    // If the RHS value is > UnsignedMax, fold the comparison. This handles

    // +INF and large values.

    APFloat UMax(RHS->getSemantics());

    UMax.convertFromAPInt(APInt::getMaxValue(IntWidth), false,

                          APFloat::rmNearestTiesToEven);

    if (UMax < *RHS) { // umax < 13123.0

      if (Pred == ICmpInst::ICMP_NE || Pred == ICmpInst::ICMP_ULT ||

          Pred == ICmpInst::ICMP_ULE)

        return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));

      return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));

    }

  }


  if (!LHSUnsigned) {

    // See if the RHS value is < SignedMin.

    APFloat SMin(RHS->getSemantics());

    SMin.convertFromAPInt(APInt::getSignedMinValue(IntWidth), true,

                          APFloat::rmNearestTiesToEven);

    if (SMin > *RHS) { // smin > 12312.0

      if (Pred == ICmpInst::ICMP_NE || Pred == ICmpInst::ICMP_SGT ||

          Pred == ICmpInst::ICMP_SGE)

        return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));

      return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));

    }

  } else {

    // See if the RHS value is < UnsignedMin.

    APFloat UMin(RHS->getSemantics());

    UMin.convertFromAPInt(APInt::getMinValue(IntWidth), false,

                          APFloat::rmNearestTiesToEven);

    if (UMin > *RHS) { // umin > 12312.0

      if (Pred == ICmpInst::ICMP_NE || Pred == ICmpInst::ICMP_UGT ||

          Pred == ICmpInst::ICMP_UGE)

        return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));

      return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));

    }

  }


  // Okay, now we know that the FP constant fits in the range [SMIN, SMAX] or

  // [0, UMAX], but it may still be fractional. Check whether this is the case

  // using the IsExact flag.

  // Don't do this for zero, because -0.0 is not fractional.

  APSInt RHSInt(IntWidth, LHSUnsigned);

  bool IsExact;

  RHS->convertToInteger(RHSInt, APFloat::rmTowardZero, &IsExact);

  if (!RHS->isZero()) {

    if (!IsExact) {

      // If we had a comparison against a fractional value, we have to adjust

      // the compare predicate and sometimes the value.  RHSC is rounded towards

      // zero at this point.

      switch (Pred) {

      default:

        llvm_unreachable("Unexpected integer comparison!");

      case ICmpInst::ICMP_NE: // (float)int != 4.4   --> true

        return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));

      case ICmpInst::ICMP_EQ: // (float)int == 4.4   --> false

        return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));

      case ICmpInst::ICMP_ULE:

        // (float)int <= 4.4   --> int <= 4

        // (float)int <= -4.4  --> false

        if (RHS->isNegative())

          return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));

        break;

      case ICmpInst::ICMP_SLE:

        // (float)int <= 4.4   --> int <= 4

        // (float)int <= -4.4  --> int < -4

        if (RHS->isNegative())

          Pred = ICmpInst::ICMP_SLT;

        break;

      case ICmpInst::ICMP_ULT:

        // (float)int < -4.4   --> false

        // (float)int < 4.4    --> int <= 4

        if (RHS->isNegative())

          return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));

        Pred = ICmpInst::ICMP_ULE;

        break;

      case ICmpInst::ICMP_SLT:

        // (float)int < -4.4   --> int < -4

        // (float)int < 4.4    --> int <= 4

        if (!RHS->isNegative())

          Pred = ICmpInst::ICMP_SLE;

        break;

      case ICmpInst::ICMP_UGT:

        // (float)int > 4.4    --> int > 4

        // (float)int > -4.4   --> true

        if (RHS->isNegative())

          return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));

        break;

      case ICmpInst::ICMP_SGT:

        // (float)int > 4.4    --> int > 4

        // (float)int > -4.4   --> int >= -4

        if (RHS->isNegative())

          Pred = ICmpInst::ICMP_SGE;

        break;

      case ICmpInst::ICMP_UGE:

        // (float)int >= -4.4   --> true

        // (float)int >= 4.4    --> int > 4

        if (RHS->isNegative())

          return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));

        Pred = ICmpInst::ICMP_UGT;

        break;

      case ICmpInst::ICMP_SGE:

        // (float)int >= -4.4   --> int >= -4

        // (float)int >= 4.4    --> int > 4

        if (!RHS->isNegative())

          Pred = ICmpInst::ICMP_SGT;

        break;

      }

    }

  }


  // Lower this FP comparison into an appropriate integer version of the

  // comparison.

  return new ICmpInst(Pred, LHSI->getOperand(0),

                      ConstantInt::get(LHSI->getOperand(0)->getType(), RHSInt));

}


/// Fold (C / X) < 0.0 --> X < 0.0 if possible. Swap predicate if necessary.


static Instruction *foldFCmpReciprocalAndZero(FCmpInst &I, Instruction *LHSI,

                                              Constant *RHSC) {

  // When C is not 0.0 and infinities are not allowed:

  // (C / X) < 0.0 is a sign-bit test of X

  // (C / X) < 0.0 --> X < 0.0 (if C is positive)

  // (C / X) < 0.0 --> X > 0.0 (if C is negative, swap the predicate)

  //

  // Proof:

  // Multiply (C / X) < 0.0 by X * X / C.

  // - X is non zero, if it is the flag 'ninf' is violated.

  // - C defines the sign of X * X * C. Thus it also defines whether to swap

  //   the predicate. C is also non zero by definition.

  //

  // Thus X * X / C is non zero and the transformation is valid. [qed]


  FCmpInst::Predicate Pred = I.getPredicate();


  // Check that predicates are valid.

  if ((Pred != FCmpInst::FCMP_OGT) && (Pred != FCmpInst::FCMP_OLT) &&

      (Pred != FCmpInst::FCMP_OGE) && (Pred != FCmpInst::FCMP_OLE))

    return nullptr;


  // Check that RHS operand is zero.

  if (!match(RHSC, m_AnyZeroFP()))

    return nullptr;


  // Check fastmath flags ('ninf').

  if (!LHSI->hasNoInfs() || !I.hasNoInfs())

    return nullptr;


  // Check the properties of the dividend. It must not be zero to avoid a

  // division by zero (see Proof).

  const APFloat *C;

  if (!match(LHSI->getOperand(0), m_APFloat(C)))

    return nullptr;


  if (C->isZero())

    return nullptr;


  // Get swapped predicate if necessary.

  if (C->isNegative())

    Pred = I.getSwappedPredicate();


  return new FCmpInst(Pred, LHSI->getOperand(1), RHSC, "", &I);

}


// Transform 'fptrunc(x) cmp C' to 'x cmp ext(C)' if possible.

// Patterns include:

//    fptrunc(x) <  C  -->  x <  ext(C)

//    fptrunc(x) <= C  -->  x <= ext(C)

//    fptrunc(x) >  C  -->  x >  ext(C)

//    fptrunc(x) >= C  -->  x >= ext(C)

// where 'ext(C)' is the extension of 'C' to the type of 'x' with a small bias

// due to precision loss.


static Instruction *foldFCmpFpTrunc(FCmpInst &I, const Instruction &FPTrunc,

                                    const Constant &C) {

  FCmpInst::Predicate Pred = I.getPredicate();

  bool RoundDown = false;


  if (Pred == FCmpInst::FCMP_OGE || Pred == FCmpInst::FCMP_UGE ||

      Pred == FCmpInst::FCMP_OLT || Pred == FCmpInst::FCMP_ULT)

    RoundDown = true;

  else if (Pred == FCmpInst::FCMP_OGT || Pred == FCmpInst::FCMP_UGT ||

           Pred == FCmpInst::FCMP_OLE || Pred == FCmpInst::FCMP_ULE)

    RoundDown = false;

  else

    return nullptr;


  const APFloat *CValue;

  if (!match(&C, m_APFloat(CValue)))

    return nullptr;


  if (CValue->isNaN() || CValue->isInfinity())

    return nullptr;


  auto ConvertFltSema = [](const APFloat &Src, const fltSemantics &Sema) {

    bool LosesInfo;

    APFloat Dest = Src;

    Dest.convert(Sema, APFloat::rmNearestTiesToEven, &LosesInfo);

    return Dest;

  };


  auto NextValue = [](const APFloat &Value, bool RoundDown) {

    APFloat NextValue = Value;

    NextValue.next(RoundDown);

    return NextValue;

  };


  APFloat NextCValue = NextValue(*CValue, RoundDown);


  Type *DestType = FPTrunc.getOperand(0)->getType();

  const fltSemantics &DestFltSema =

      DestType->getScalarType()->getFltSemantics();


  APFloat ExtCValue = ConvertFltSema(*CValue, DestFltSema);

  APFloat ExtNextCValue = ConvertFltSema(NextCValue, DestFltSema);


  // When 'NextCValue' is infinity, use an imaged 'NextCValue' that equals

  // 'CValue + bias' to avoid the infinity after conversion. The bias is

  // estimated as 'CValue - PrevCValue', where 'PrevCValue' is the previous

  // value of 'CValue'.

  if (NextCValue.isInfinity()) {

    APFloat PrevCValue = NextValue(*CValue, !RoundDown);

    APFloat Bias = ConvertFltSema(*CValue - PrevCValue, DestFltSema);


    ExtNextCValue = ExtCValue + Bias;

  }


  APFloat ExtMidValue =

      scalbn(ExtCValue + ExtNextCValue, -1, APFloat::rmNearestTiesToEven);


  const fltSemantics &SrcFltSema =

      C.getType()->getScalarType()->getFltSemantics();


  // 'MidValue' might be rounded to 'NextCValue'. Correct it here.

  APFloat MidValue = ConvertFltSema(ExtMidValue, SrcFltSema);

  if (MidValue != *CValue)

    ExtMidValue.next(!RoundDown);


  // Check whether 'ExtMidValue' is a valid result since the assumption on

  // imaged 'NextCValue' might not hold for new float types.

  // ppc_fp128 can't pass here when converting from max float because of

  // APFloat implementation.

  if (NextCValue.isInfinity()) {

    // ExtMidValue --- narrowed ---> Finite

    if (ConvertFltSema(ExtMidValue, SrcFltSema).isInfinity())

      return nullptr;


    // NextExtMidValue --- narrowed ---> Infinity

    APFloat NextExtMidValue = NextValue(ExtMidValue, RoundDown);

    if (ConvertFltSema(NextExtMidValue, SrcFltSema).isFinite())

      return nullptr;

  }


  return new FCmpInst(Pred, FPTrunc.getOperand(0),

                      ConstantFP::get(DestType, ExtMidValue), "", &I);

}


/// Optimize fabs(X) compared with zero.


static Instruction *foldFabsWithFcmpZero(FCmpInst &I, InstCombinerImpl &IC) {

  Value *X;

  if (!match(I.getOperand(0), m_FAbs(m_Value(X))))

    return nullptr;


  const APFloat *C;

  if (!match(I.getOperand(1), m_APFloat(C)))

    return nullptr;


  if (!C->isPosZero()) {

    if (!C->isSmallestNormalized())

      return nullptr;


    const Function *F = I.getFunction();

    DenormalMode Mode = F->getDenormalMode(C->getSemantics());

    if (Mode.Input == DenormalMode::PreserveSign ||

        Mode.Input == DenormalMode::PositiveZero) {


      auto replaceFCmp = [](FCmpInst *I, FCmpInst::Predicate P, Value *X) {

        Constant *Zero = ConstantFP::getZero(X->getType());

        return new FCmpInst(P, X, Zero, "", I);

      };


      switch (I.getPredicate()) {

      case FCmpInst::FCMP_OLT:

        // fcmp olt fabs(x), smallest_normalized_number -> fcmp oeq x, 0.0

        return replaceFCmp(&I, FCmpInst::FCMP_OEQ, X);

      case FCmpInst::FCMP_UGE:

        // fcmp uge fabs(x), smallest_normalized_number -> fcmp une x, 0.0

        return replaceFCmp(&I, FCmpInst::FCMP_UNE, X);

      case FCmpInst::FCMP_OGE:

        // fcmp oge fabs(x), smallest_normalized_number -> fcmp one x, 0.0

        return replaceFCmp(&I, FCmpInst::FCMP_ONE, X);

      case FCmpInst::FCMP_ULT:

        // fcmp ult fabs(x), smallest_normalized_number -> fcmp ueq x, 0.0

        return replaceFCmp(&I, FCmpInst::FCMP_UEQ, X);

      default:

        break;

      }

    }


    return nullptr;

  }


  auto replacePredAndOp0 = [&IC](FCmpInst *I, FCmpInst::Predicate P, Value *X) {

    I->setPredicate(P);

    return IC.replaceOperand(*I, 0, X);

  };


  switch (I.getPredicate()) {

  case FCmpInst::FCMP_UGE:

  case FCmpInst::FCMP_OLT:

    // fabs(X) >= 0.0 --> true

    // fabs(X) <  0.0 --> false

    llvm_unreachable("fcmp should have simplified");


  case FCmpInst::FCMP_OGT:

    // fabs(X) > 0.0 --> X != 0.0

    return replacePredAndOp0(&I, FCmpInst::FCMP_ONE, X);


  case FCmpInst::FCMP_UGT:

    // fabs(X) u> 0.0 --> X u!= 0.0

    return replacePredAndOp0(&I, FCmpInst::FCMP_UNE, X);


  case FCmpInst::FCMP_OLE:

    // fabs(X) <= 0.0 --> X == 0.0

    return replacePredAndOp0(&I, FCmpInst::FCMP_OEQ, X);


  case FCmpInst::FCMP_ULE:

    // fabs(X) u<= 0.0 --> X u== 0.0

    return replacePredAndOp0(&I, FCmpInst::FCMP_UEQ, X);


  case FCmpInst::FCMP_OGE:

    // fabs(X) >= 0.0 --> !isnan(X)

    assert(!I.hasNoNaNs() && "fcmp should have simplified");

    return replacePredAndOp0(&I, FCmpInst::FCMP_ORD, X);


  case FCmpInst::FCMP_ULT:

    // fabs(X) u< 0.0 --> isnan(X)

    assert(!I.hasNoNaNs() && "fcmp should have simplified");

    return replacePredAndOp0(&I, FCmpInst::FCMP_UNO, X);


  case FCmpInst::FCMP_OEQ:

  case FCmpInst::FCMP_UEQ:

  case FCmpInst::FCMP_ONE:

  case FCmpInst::FCMP_UNE:

  case FCmpInst::FCMP_ORD:

  case FCmpInst::FCMP_UNO:

    // Look through the fabs() because it doesn't change anything but the sign.

    // fabs(X) == 0.0 --> X == 0.0,

    // fabs(X) != 0.0 --> X != 0.0

    // isnan(fabs(X)) --> isnan(X)

    // !isnan(fabs(X) --> !isnan(X)

    return replacePredAndOp0(&I, I.getPredicate(), X);


  default:

    return nullptr;

  }

}


/// Optimize sqrt(X) compared with zero.


static Instruction *foldSqrtWithFcmpZero(FCmpInst &I, InstCombinerImpl &IC) {

  Value *X;

  if (!match(I.getOperand(0), m_Sqrt(m_Value(X))))

    return nullptr;


  if (!match(I.getOperand(1), m_PosZeroFP()))

    return nullptr;


  auto ReplacePredAndOp0 = [&](FCmpInst::Predicate P) {

    I.setPredicate(P);

    return IC.replaceOperand(I, 0, X);

  };


  // Clear ninf flag if sqrt doesn't have it.

  if (!cast<Instruction>(I.getOperand(0))->hasNoInfs())

    I.setHasNoInfs(false);


  switch (I.getPredicate()) {

  case FCmpInst::FCMP_OLT:

  case FCmpInst::FCMP_UGE:

    // sqrt(X) < 0.0 --> false

    // sqrt(X) u>= 0.0 --> true

    llvm_unreachable("fcmp should have simplified");

  case FCmpInst::FCMP_ULT:

  case FCmpInst::FCMP_ULE:

  case FCmpInst::FCMP_OGT:

  case FCmpInst::FCMP_OGE:

  case FCmpInst::FCMP_OEQ:

  case FCmpInst::FCMP_UNE:

    // sqrt(X) u< 0.0 --> X u< 0.0

    // sqrt(X) u<= 0.0 --> X u<= 0.0

    // sqrt(X) > 0.0 --> X > 0.0

    // sqrt(X) >= 0.0 --> X >= 0.0

    // sqrt(X) == 0.0 --> X == 0.0

    // sqrt(X) u!= 0.0 --> X u!= 0.0

    return IC.replaceOperand(I, 0, X);


  case FCmpInst::FCMP_OLE:

    // sqrt(X) <= 0.0 --> X == 0.0

    return ReplacePredAndOp0(FCmpInst::FCMP_OEQ);

  case FCmpInst::FCMP_UGT:

    // sqrt(X) u> 0.0 --> X u!= 0.0

    return ReplacePredAndOp0(FCmpInst::FCMP_UNE);

  case FCmpInst::FCMP_UEQ:

    // sqrt(X) u== 0.0 --> X u<= 0.0

    return ReplacePredAndOp0(FCmpInst::FCMP_ULE);

  case FCmpInst::FCMP_ONE:

    // sqrt(X) != 0.0 --> X > 0.0

    return ReplacePredAndOp0(FCmpInst::FCMP_OGT);

  case FCmpInst::FCMP_ORD:

    // !isnan(sqrt(X)) --> X >= 0.0

    return ReplacePredAndOp0(FCmpInst::FCMP_OGE);

  case FCmpInst::FCMP_UNO:

    // isnan(sqrt(X)) --> X u< 0.0

    return ReplacePredAndOp0(FCmpInst::FCMP_ULT);

  default:

    llvm_unreachable("Unexpected predicate!");

  }

}


static Instruction *foldFCmpFNegCommonOp(FCmpInst &I) {

  CmpInst::Predicate Pred = I.getPredicate();

  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);


  // Canonicalize fneg as Op1.

  if (match(Op0, m_FNeg(m_Value())) && !match(Op1, m_FNeg(m_Value()))) {

    std::swap(Op0, Op1);

    Pred = I.getSwappedPredicate();

  }


  if (!match(Op1, m_FNeg(m_Specific(Op0))))

    return nullptr;


  // Replace the negated operand with 0.0:

  // fcmp Pred Op0, -Op0 --> fcmp Pred Op0, 0.0

  Constant *Zero = ConstantFP::getZero(Op0->getType());

  return new FCmpInst(Pred, Op0, Zero, "", &I);

}


static Instruction *foldFCmpFSubIntoFCmp(FCmpInst &I, Instruction *LHSI,

                                         Constant *RHSC, InstCombinerImpl &CI) {

  const CmpInst::Predicate Pred = I.getPredicate();

  Value *X = LHSI->getOperand(0);

  Value *Y = LHSI->getOperand(1);

  switch (Pred) {

  default:

    break;

  case FCmpInst::FCMP_UGT:

  case FCmpInst::FCMP_ULT:

  case FCmpInst::FCMP_UNE:

  case FCmpInst::FCMP_OEQ:

  case FCmpInst::FCMP_OGE:

  case FCmpInst::FCMP_OLE:

    // The optimization is not valid if X and Y are infinities of the same

    // sign, i.e. the inf - inf = nan case. If the fsub has the ninf or nnan

    // flag then we can assume we do not have that case. Otherwise we might be

    // able to prove that either X or Y is not infinity.

    if (!LHSI->hasNoNaNs() && !LHSI->hasNoInfs() &&

        !isKnownNeverInfinity(Y,

                              CI.getSimplifyQuery().getWithInstruction(&I)) &&

        !isKnownNeverInfinity(X, CI.getSimplifyQuery().getWithInstruction(&I)))

      break;


    [[fallthrough]];

  case FCmpInst::FCMP_OGT:

  case FCmpInst::FCMP_OLT:

  case FCmpInst::FCMP_ONE:

  case FCmpInst::FCMP_UEQ:

  case FCmpInst::FCMP_UGE:

  case FCmpInst::FCMP_ULE:

    // fcmp pred (x - y), 0 --> fcmp pred x, y

    if (match(RHSC, m_AnyZeroFP()) &&

        I.getFunction()->getDenormalMode(

            LHSI->getType()->getScalarType()->getFltSemantics()) ==

            DenormalMode::getIEEE()) {

      CI.replaceOperand(I, 0, X);

      CI.replaceOperand(I, 1, Y);

      return &I;

    }

    break;

  }


  return nullptr;

}


static Instruction *foldFCmpWithFloorAndCeil(FCmpInst &I,

                                             InstCombinerImpl &IC) {

  Value *LHS = I.getOperand(0), *RHS = I.getOperand(1);

  Type *OpType = LHS->getType();

  CmpInst::Predicate Pred = I.getPredicate();


  bool FloorX = match(LHS, m_Intrinsic<Intrinsic::floor>(m_Specific(RHS)));

  bool CeilX = match(LHS, m_Intrinsic<Intrinsic::ceil>(m_Specific(RHS)));


  if (!FloorX && !CeilX) {

    if ((FloorX = match(RHS, m_Intrinsic<Intrinsic::floor>(m_Specific(LHS)))) ||

        (CeilX = match(RHS, m_Intrinsic<Intrinsic::ceil>(m_Specific(LHS))))) {

      std::swap(LHS, RHS);

      Pred = I.getSwappedPredicate();

    }

  }


  switch (Pred) {

  case FCmpInst::FCMP_OLE:

    // fcmp ole floor(x), x => fcmp ord x, 0

    if (FloorX)

      return new FCmpInst(FCmpInst::FCMP_ORD, RHS, ConstantFP::getZero(OpType),

                          "", &I);

    break;

  case FCmpInst::FCMP_OGT:

    // fcmp ogt floor(x), x => false

    if (FloorX)

      return IC.replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));

    break;

  case FCmpInst::FCMP_OGE:

    // fcmp oge ceil(x), x => fcmp ord x, 0

    if (CeilX)

      return new FCmpInst(FCmpInst::FCMP_ORD, RHS, ConstantFP::getZero(OpType),

                          "", &I);

    break;

  case FCmpInst::FCMP_OLT:

    // fcmp olt ceil(x), x => false

    if (CeilX)

      return IC.replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));

    break;

  case FCmpInst::FCMP_ULE:

    // fcmp ule floor(x), x => true

    if (FloorX)

      return IC.replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));

    break;

  case FCmpInst::FCMP_UGT:

    // fcmp ugt floor(x), x => fcmp uno x, 0

    if (FloorX)

      return new FCmpInst(FCmpInst::FCMP_UNO, RHS, ConstantFP::getZero(OpType),

                          "", &I);

    break;

  case FCmpInst::FCMP_UGE:

    // fcmp uge ceil(x), x => true

    if (CeilX)

      return IC.replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));

    break;

  case FCmpInst::FCMP_ULT:

    // fcmp ult ceil(x), x => fcmp uno x, 0

    if (CeilX)

      return new FCmpInst(FCmpInst::FCMP_UNO, RHS, ConstantFP::getZero(OpType),

                          "", &I);

    break;

  default:

    break;

  }


  return nullptr;

}


Instruction *InstCombinerImpl::visitFCmpInst(FCmpInst &I) {

  bool Changed = false;


  /// Orders the operands of the compare so that they are listed from most

  /// complex to least complex.  This puts constants before unary operators,

  /// before binary operators.

  if (getComplexity(I.getOperand(0)) < getComplexity(I.getOperand(1))) {

    I.swapOperands();

    Changed = true;

  }


  const CmpInst::Predicate Pred = I.getPredicate();

  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);

  if (Value *V = simplifyFCmpInst(Pred, Op0, Op1, I.getFastMathFlags(),

                                  SQ.getWithInstruction(&I)))

    return replaceInstUsesWith(I, V);


  // Simplify 'fcmp pred X, X'

  Type *OpType = Op0->getType();

  assert(OpType == Op1->getType() && "fcmp with different-typed operands?");

  if (Op0 == Op1) {

    switch (Pred) {

    default:

      break;

    case FCmpInst::FCMP_UNO: // True if unordered: isnan(X) | isnan(Y)

    case FCmpInst::FCMP_ULT: // True if unordered or less than

    case FCmpInst::FCMP_UGT: // True if unordered or greater than

    case FCmpInst::FCMP_UNE: // True if unordered or not equal

      // Canonicalize these to be 'fcmp uno %X, 0.0'.

      I.setPredicate(FCmpInst::FCMP_UNO);

      I.setOperand(1, Constant::getNullValue(OpType));

      return &I;


    case FCmpInst::FCMP_ORD: // True if ordered (no nans)

    case FCmpInst::FCMP_OEQ: // True if ordered and equal

    case FCmpInst::FCMP_OGE: // True if ordered and greater than or equal

    case FCmpInst::FCMP_OLE: // True if ordered and less than or equal

      // Canonicalize these to be 'fcmp ord %X, 0.0'.

      I.setPredicate(FCmpInst::FCMP_ORD);

      I.setOperand(1, Constant::getNullValue(OpType));

      return &I;

    }

  }


  if (I.isCommutative()) {

    if (auto Pair = matchSymmetricPair(I.getOperand(0), I.getOperand(1))) {

      replaceOperand(I, 0, Pair->first);

      replaceOperand(I, 1, Pair->second);

      return &I;

    }

  }


  // If we're just checking for a NaN (ORD/UNO) and have a non-NaN operand,

  // then canonicalize the operand to 0.0.

  if (Pred == CmpInst::FCMP_ORD || Pred == CmpInst::FCMP_UNO) {

    if (!match(Op0, m_PosZeroFP()) &&

        isKnownNeverNaN(Op0, getSimplifyQuery().getWithInstruction(&I)))

      return replaceOperand(I, 0, ConstantFP::getZero(OpType));


    if (!match(Op1, m_PosZeroFP()) &&

        isKnownNeverNaN(Op1, getSimplifyQuery().getWithInstruction(&I)))

      return replaceOperand(I, 1, ConstantFP::getZero(OpType));

  }


  // fcmp pred (fneg X), (fneg Y) -> fcmp swap(pred) X, Y

  Value *X, *Y;

  if (match(Op0, m_FNeg(m_Value(X))) && match(Op1, m_FNeg(m_Value(Y))))

    return new FCmpInst(I.getSwappedPredicate(), X, Y, "", &I);


  if (Instruction *R = foldFCmpFNegCommonOp(I))

    return R;


  // Test if the FCmpInst instruction is used exclusively by a select as

  // part of a minimum or maximum operation. If so, refrain from doing

  // any other folding. This helps out other analyses which understand

  // non-obfuscated minimum and maximum idioms, such as ScalarEvolution

  // and CodeGen. And in this case, at least one of the comparison

  // operands has at least one user besides the compare (the select),

  // which would often largely negate the benefit of folding anyway.

  if (I.hasOneUse())

    if (SelectInst *SI = dyn_cast<SelectInst>(I.user_back())) {

      Value *A, *B;

      SelectPatternResult SPR = matchSelectPattern(SI, A, B);

      if (SPR.Flavor != SPF_UNKNOWN)

        return nullptr;

    }


  // The sign of 0.0 is ignored by fcmp, so canonicalize to +0.0:

  // fcmp Pred X, -0.0 --> fcmp Pred X, 0.0

  if (match(Op1, m_AnyZeroFP()) && !match(Op1, m_PosZeroFP()))

    return replaceOperand(I, 1, ConstantFP::getZero(OpType));


  // Canonicalize:

  // fcmp olt X, +inf -> fcmp one X, +inf

  // fcmp ole X, +inf -> fcmp ord X, 0

  // fcmp ogt X, +inf -> false

  // fcmp oge X, +inf -> fcmp oeq X, +inf

  // fcmp ult X, +inf -> fcmp une X, +inf

  // fcmp ule X, +inf -> true

  // fcmp ugt X, +inf -> fcmp uno X, 0

  // fcmp uge X, +inf -> fcmp ueq X, +inf

  // fcmp olt X, -inf -> false

  // fcmp ole X, -inf -> fcmp oeq X, -inf

  // fcmp ogt X, -inf -> fcmp one X, -inf

  // fcmp oge X, -inf -> fcmp ord X, 0

  // fcmp ult X, -inf -> fcmp uno X, 0

  // fcmp ule X, -inf -> fcmp ueq X, -inf

  // fcmp ugt X, -inf -> fcmp une X, -inf

  // fcmp uge X, -inf -> true

  const APFloat *C;

  if (match(Op1, m_APFloat(C)) && C->isInfinity()) {

    switch (C->isNegative() ? FCmpInst::getSwappedPredicate(Pred) : Pred) {

    default:

      break;

    case FCmpInst::FCMP_ORD:

    case FCmpInst::FCMP_UNO:

    case FCmpInst::FCMP_TRUE:

    case FCmpInst::FCMP_FALSE:

    case FCmpInst::FCMP_OGT:

    case FCmpInst::FCMP_ULE:

      llvm_unreachable("Should be simplified by InstSimplify");

    case FCmpInst::FCMP_OLT:

      return new FCmpInst(FCmpInst::FCMP_ONE, Op0, Op1, "", &I);

    case FCmpInst::FCMP_OLE:

      return new FCmpInst(FCmpInst::FCMP_ORD, Op0, ConstantFP::getZero(OpType),

                          "", &I);

    case FCmpInst::FCMP_OGE:

      return new FCmpInst(FCmpInst::FCMP_OEQ, Op0, Op1, "", &I);

    case FCmpInst::FCMP_ULT:

      return new FCmpInst(FCmpInst::FCMP_UNE, Op0, Op1, "", &I);

    case FCmpInst::FCMP_UGT:

      return new FCmpInst(FCmpInst::FCMP_UNO, Op0, ConstantFP::getZero(OpType),

                          "", &I);

    case FCmpInst::FCMP_UGE:

      return new FCmpInst(FCmpInst::FCMP_UEQ, Op0, Op1, "", &I);

    }

  }


  // Ignore signbit of bitcasted int when comparing equality to FP 0.0:

  // fcmp oeq/une (bitcast X), 0.0 --> (and X, SignMaskC) ==/!= 0

  if (match(Op1, m_PosZeroFP()) &&

      match(Op0, m_OneUse(m_ElementWiseBitCast(m_Value(X))))) {

    ICmpInst::Predicate IntPred = ICmpInst::BAD_ICMP_PREDICATE;

    if (Pred == FCmpInst::FCMP_OEQ)

      IntPred = ICmpInst::ICMP_EQ;

    else if (Pred == FCmpInst::FCMP_UNE)

      IntPred = ICmpInst::ICMP_NE;


    if (IntPred != ICmpInst::BAD_ICMP_PREDICATE) {

      Type *IntTy = X->getType();

      const APInt &SignMask = ~APInt::getSignMask(IntTy->getScalarSizeInBits());

      Value *MaskX = Builder.CreateAnd(X, ConstantInt::get(IntTy, SignMask));

      return new ICmpInst(IntPred, MaskX, ConstantInt::getNullValue(IntTy));

    }

  }


  // Handle fcmp with instruction LHS and constant RHS.

  Instruction *LHSI;

  Constant *RHSC;

  if (match(Op0, m_Instruction(LHSI)) && match(Op1, m_Constant(RHSC))) {

    switch (LHSI->getOpcode()) {

    case Instruction::Select:

      // fcmp eq (cond ? x : -x), 0 --> fcmp eq x, 0

      if (FCmpInst::isEquality(Pred) && match(RHSC, m_AnyZeroFP()) &&

          match(LHSI, m_c_Select(m_FNeg(m_Value(X)), m_Deferred(X))))

        return replaceOperand(I, 0, X);

      if (Instruction *NV = FoldOpIntoSelect(I, cast<SelectInst>(LHSI)))

        return NV;

      break;

    case Instruction::FSub:

      if (LHSI->hasOneUse())

        if (Instruction *NV = foldFCmpFSubIntoFCmp(I, LHSI, RHSC, *this))

          return NV;

      break;

    case Instruction::PHI:

      if (Instruction *NV = foldOpIntoPhi(I, cast<PHINode>(LHSI)))

        return NV;

      break;

    case Instruction::SIToFP:

    case Instruction::UIToFP:

      if (Instruction *NV = foldFCmpIntToFPConst(I, LHSI, RHSC))

        return NV;

      break;

    case Instruction::FDiv:

      if (Instruction *NV = foldFCmpReciprocalAndZero(I, LHSI, RHSC))

        return NV;

      break;

    case Instruction::Load:

      if (auto *GEP = dyn_cast<GetElementPtrInst>(LHSI->getOperand(0)))

        if (Instruction *Res =

                foldCmpLoadFromIndexedGlobal(cast<LoadInst>(LHSI), GEP, I))

          return Res;

      break;

    case Instruction::FPTrunc:

      if (Instruction *NV = foldFCmpFpTrunc(I, *LHSI, *RHSC))

        return NV;

      break;

    }

  }


  if (Instruction *R = foldFabsWithFcmpZero(I, *this))

    return R;


  if (Instruction *R = foldSqrtWithFcmpZero(I, *this))

    return R;


  if (Instruction *R = foldFCmpWithFloorAndCeil(I, *this))

    return R;


  if (match(Op0, m_FNeg(m_Value(X)))) {

    // fcmp pred (fneg X), C --> fcmp swap(pred) X, -C

    Constant *C;

    if (match(Op1, m_Constant(C)))

      if (Constant *NegC = ConstantFoldUnaryOpOperand(Instruction::FNeg, C, DL))

        return new FCmpInst(I.getSwappedPredicate(), X, NegC, "", &I);

  }


  // fcmp (fadd X, 0.0), Y --> fcmp X, Y

  if (match(Op0, m_FAdd(m_Value(X), m_AnyZeroFP())))

    return new FCmpInst(Pred, X, Op1, "", &I);


  // fcmp X, (fadd Y, 0.0) --> fcmp X, Y

  if (match(Op1, m_FAdd(m_Value(Y), m_AnyZeroFP())))

    return new FCmpInst(Pred, Op0, Y, "", &I);


  if (match(Op0, m_FPExt(m_Value(X)))) {

    // fcmp (fpext X), (fpext Y) -> fcmp X, Y

    if (match(Op1, m_FPExt(m_Value(Y))) && X->getType() == Y->getType())

      return new FCmpInst(Pred, X, Y, "", &I);


    const APFloat *C;

    if (match(Op1, m_APFloat(C))) {

      const fltSemantics &FPSem =

          X->getType()->getScalarType()->getFltSemantics();

      bool Lossy;

      APFloat TruncC = *C;

      TruncC.convert(FPSem, APFloat::rmNearestTiesToEven, &Lossy);


      if (Lossy) {

        // X can't possibly equal the higher-precision constant, so reduce any

        // equality comparison.

        // TODO: Other predicates can be handled via getFCmpCode().

        switch (Pred) {

        case FCmpInst::FCMP_OEQ:

          // X is ordered and equal to an impossible constant --> false

          return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));

        case FCmpInst::FCMP_ONE:

          // X is ordered and not equal to an impossible constant --> ordered

          return new FCmpInst(FCmpInst::FCMP_ORD, X,

                              ConstantFP::getZero(X->getType()));

        case FCmpInst::FCMP_UEQ:

          // X is unordered or equal to an impossible constant --> unordered

          return new FCmpInst(FCmpInst::FCMP_UNO, X,

                              ConstantFP::getZero(X->getType()));

        case FCmpInst::FCMP_UNE:

          // X is unordered or not equal to an impossible constant --> true

          return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));

        default:

          break;

        }

      }


      // fcmp (fpext X), C -> fcmp X, (fptrunc C) if fptrunc is lossless

      // Avoid lossy conversions and denormals.

      // Zero is a special case that's OK to convert.

      APFloat Fabs = TruncC;

      Fabs.clearSign();

      if (!Lossy &&

          (Fabs.isZero() || !(Fabs < APFloat::getSmallestNormalized(FPSem)))) {

        Constant *NewC = ConstantFP::get(X->getType(), TruncC);

        return new FCmpInst(Pred, X, NewC, "", &I);

      }

    }

  }


  // Convert a sign-bit test of an FP value into a cast and integer compare.

  // TODO: Simplify if the copysign constant is 0.0 or NaN.

  // TODO: Handle non-zero compare constants.

  // TODO: Handle other predicates.

  if (match(Op0, m_OneUse(m_Intrinsic<Intrinsic::copysign>(m_APFloat(C),

                                                           m_Value(X)))) &&

      match(Op1, m_AnyZeroFP()) && !C->isZero() && !C->isNaN()) {

    Type *IntType = Builder.getIntNTy(X->getType()->getScalarSizeInBits());

    if (auto *VecTy = dyn_cast<VectorType>(OpType))

      IntType = VectorType::get(IntType, VecTy->getElementCount());


    // copysign(non-zero constant, X) < 0.0 --> (bitcast X) < 0

    if (Pred == FCmpInst::FCMP_OLT) {

      Value *IntX = Builder.CreateBitCast(X, IntType);

      return new ICmpInst(ICmpInst::ICMP_SLT, IntX,

                          ConstantInt::getNullValue(IntType));

    }

  }


  {

    Value *CanonLHS = nullptr;

    match(Op0, m_Intrinsic<Intrinsic::canonicalize>(m_Value(CanonLHS)));

    // (canonicalize(x) == x) => (x == x)

    if (CanonLHS == Op1)

      return new FCmpInst(Pred, Op1, Op1, "", &I);


    Value *CanonRHS = nullptr;

    match(Op1, m_Intrinsic<Intrinsic::canonicalize>(m_Value(CanonRHS)));

    // (x == canonicalize(x)) => (x == x)

    if (CanonRHS == Op0)

      return new FCmpInst(Pred, Op0, Op0, "", &I);


    // (canonicalize(x) == canonicalize(y)) => (x == y)

    if (CanonLHS && CanonRHS)

      return new FCmpInst(Pred, CanonLHS, CanonRHS, "", &I);

  }


  if (I.getType()->isVectorTy())

    if (Instruction *Res = foldVectorCmp(I, Builder))

      return Res;


  return Changed ? &I : nullptr;

}


assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

Select
AMDGPU Register Bank Select
Definition AMDGPURegBankSelect.cpp:68

PHI
Rewrite undef for PHI
Definition AMDGPURewriteUndefForPHI.cpp:98

APFloat.h
This file declares a class to represent arbitrary precision floating point values and provide a varie...

APSInt.h
This file implements the APSInt class, which is a simple class that represents an arbitrary sized int...

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition ARMSLSHardening.cpp:73

Local.h

A
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")

D
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")

E
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")

B
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")

CaptureTracking.h

CmpInstAnalysis.h

ConstantFolding.h

ConstantRange.h

Constants.h
This file contains the declarations for the subclasses of Constant, which represent the different fla...

DataLayout.h

Check
#define Check(C,...)
Definition GenericConvergenceVerifierImpl.h:34

GEP
Hexagon Common GEP
Definition HexagonCommonGEP.cpp:164

IntrinsicInst.h

foldFCmpReciprocalAndZero
static Instruction * foldFCmpReciprocalAndZero(FCmpInst &I, Instruction *LHSI, Constant *RHSC)
Fold (C / X) < 0.0 --> X < 0.0 if possible. Swap predicate if necessary.
Definition InstCombineCompares.cpp:8173

foldFabsWithFcmpZero
static Instruction * foldFabsWithFcmpZero(FCmpInst &I, InstCombinerImpl &IC)
Optimize fabs(X) compared with zero.
Definition InstCombineCompares.cpp:8312

collectOffsetOp
static void collectOffsetOp(Value *V, SmallVectorImpl< OffsetOp > &Offsets, bool AllowRecursion)
Definition InstCombineCompares.cpp:5838

rewriteGEPAsOffset
static Value * rewriteGEPAsOffset(Value *Start, Value *Base, GEPNoWrapFlags NW, const DataLayout &DL, SetVector< Value * > &Explored, InstCombiner &IC)
Returns a re-written value of Start as an indexed GEP using Base as a pointer.
Definition InstCombineCompares.cpp:507

foldICmpEqualityWithOffset
static Instruction * foldICmpEqualityWithOffset(ICmpInst &I, InstCombiner::BuilderTy &Builder, const SimplifyQuery &SQ)
Offset both sides of an equality icmp to see if we can save some instructions: icmp eq/ne X,...
Definition InstCombineCompares.cpp:5899

addWithOverflow
static bool addWithOverflow(APInt &Result, const APInt &In1, const APInt &In2, bool IsSigned=false)
Compute Result = In1+In2, returning true if the result overflowed for this type.
Definition InstCombineCompares.cpp:46

foldICmpAndXX
static Instruction * foldICmpAndXX(ICmpInst &I, const SimplifyQuery &Q, InstCombinerImpl &IC)
Definition InstCombineCompares.cpp:4969

foldVectorCmp
static Instruction * foldVectorCmp(CmpInst &Cmp, InstCombiner::BuilderTy &Builder)
Definition InstCombineCompares.cpp:7293

isMaskOrZero
static bool isMaskOrZero(const Value *V, bool Not, const SimplifyQuery &Q, unsigned Depth=0)
Definition InstCombineCompares.cpp:4385

createLogicFromTable
static Value * createLogicFromTable(const std::bitset< 4 > &Table, Value *Op0, Value *Op1, IRBuilderBase &Builder, bool HasOneUse)
Definition InstCombineCompares.cpp:3044

foldICmpOfUAddOv
static Instruction * foldICmpOfUAddOv(ICmpInst &I)
Definition InstCombineCompares.cpp:7363

isChainSelectCmpBranch
static bool isChainSelectCmpBranch(const SelectInst *SI)
Return true when the instruction sequence within a block is select-cmp-br.
Definition InstCombineCompares.cpp:6745

foldICmpInvariantGroup
static Instruction * foldICmpInvariantGroup(ICmpInst &I)
Definition InstCombineCompares.cpp:7391

OffsetOp
std::pair< Instruction::BinaryOps, Value * > OffsetOp
Find all possible pairs (BinOp, RHS) that BinOp V, RHS can be simplified.
Definition InstCombineCompares.cpp:5837

foldReductionIdiom
static Instruction * foldReductionIdiom(ICmpInst &I, InstCombiner::BuilderTy &Builder, const DataLayout &DL)
This function folds patterns produced by lowering of reduce idioms, such as llvm.vector....
Definition InstCombineCompares.cpp:7412

canonicalizeICmpBool
static Instruction * canonicalizeICmpBool(ICmpInst &I, InstCombiner::BuilderTy &Builder)
Integer compare with boolean values can always be turned into bitwise ops.
Definition InstCombineCompares.cpp:7171

OffsetKind
OffsetKind
Definition InstCombineCompares.cpp:5867

OffsetKind::Invalid
@ Invalid
Definition InstCombineCompares.cpp:5867

OffsetKind::Value
@ Value
Definition InstCombineCompares.cpp:5867

OffsetKind::Select
@ Select
Definition InstCombineCompares.cpp:5867

foldFCmpFSubIntoFCmp
static Instruction * foldFCmpFSubIntoFCmp(FCmpInst &I, Instruction *LHSI, Constant *RHSC, InstCombinerImpl &CI)
Definition InstCombineCompares.cpp:8492

foldICmpOrXorSubChain
static Value * foldICmpOrXorSubChain(ICmpInst &Cmp, BinaryOperator *Or, InstCombiner::BuilderTy &Builder)
Fold icmp eq/ne (or (xor/sub (X1, X2), xor/sub (X3, X4))), 0.
Definition InstCombineCompares.cpp:2018

hasBranchUse
static bool hasBranchUse(ICmpInst &I)
Given an icmp instruction, return true if any use of this comparison is a branch on sign bit comparis...
Definition InstCombineCompares.cpp:72

foldICmpWithLowBitMaskedVal
static Value * foldICmpWithLowBitMaskedVal(CmpPredicate Pred, Value *Op0, Value *Op1, const SimplifyQuery &Q, InstCombiner &IC)
Some comparisons can be simplified.
Definition InstCombineCompares.cpp:4492

getDemandedBitsLHSMask
static APInt getDemandedBitsLHSMask(ICmpInst &I, unsigned BitWidth)
When performing a comparison against a constant, it is possible that not all the bits in the LHS are ...
Definition InstCombineCompares.cpp:6684

foldICmpShlLHSC
static Instruction * foldICmpShlLHSC(ICmpInst &Cmp, Instruction *Shl, const APInt &C)
Fold icmp (shl nuw C2, Y), C.
Definition InstCombineCompares.cpp:2269

foldFCmpWithFloorAndCeil
static Instruction * foldFCmpWithFloorAndCeil(FCmpInst &I, InstCombinerImpl &IC)
Definition InstCombineCompares.cpp:8538

foldICmpXorXX
static Instruction * foldICmpXorXX(ICmpInst &I, const SimplifyQuery &Q, InstCombinerImpl &IC)
Definition InstCombineCompares.cpp:5066

foldICmpOfCmpIntrinsicWithConstant
static Instruction * foldICmpOfCmpIntrinsicWithConstant(CmpPredicate Pred, IntrinsicInst *I, const APInt &C, InstCombiner::BuilderTy &Builder)
Definition InstCombineCompares.cpp:4128

processUMulZExtIdiom
static Instruction * processUMulZExtIdiom(ICmpInst &I, Value *MulVal, const APInt *OtherVal, InstCombinerImpl &IC)
Recognize and process idiom involving test for multiplication overflow.
Definition InstCombineCompares.cpp:6537

foldSqrtWithFcmpZero
static Instruction * foldSqrtWithFcmpZero(FCmpInst &I, InstCombinerImpl &IC)
Optimize sqrt(X) compared with zero.
Definition InstCombineCompares.cpp:8413

foldFCmpFNegCommonOp
static Instruction * foldFCmpFNegCommonOp(FCmpInst &I)
Definition InstCombineCompares.cpp:8473

foldICmpWithHighBitMask
static Instruction * foldICmpWithHighBitMask(ICmpInst &Cmp, InstCombiner::BuilderTy &Builder)
Definition InstCombineCompares.cpp:7250

canonicalizeCmpWithConstant
static ICmpInst * canonicalizeCmpWithConstant(ICmpInst &I)
If we have an icmp le or icmp ge instruction with a constant operand, turn it into the appropriate ic...
Definition InstCombineCompares.cpp:7128

foldICmpIntrinsicWithIntrinsic
static Instruction * foldICmpIntrinsicWithIntrinsic(ICmpInst &Cmp, InstCombiner::BuilderTy &Builder)
Fold an icmp with LLVM intrinsics.
Definition InstCombineCompares.cpp:3901

foldICmpUSubSatOrUAddSatWithConstant
static Instruction * foldICmpUSubSatOrUAddSatWithConstant(CmpPredicate Pred, SaturatingInst *II, const APInt &C, InstCombiner::BuilderTy &Builder)
Definition InstCombineCompares.cpp:4043

foldICmpPow2Test
static Instruction * foldICmpPow2Test(ICmpInst &I, InstCombiner::BuilderTy &Builder)
Definition InstCombineCompares.cpp:5784

subWithOverflow
static bool subWithOverflow(APInt &Result, const APInt &In1, const APInt &In2, bool IsSigned=false)
Compute Result = In1-In2, returning true if the result overflowed for this type.
Definition InstCombineCompares.cpp:59

canRewriteGEPAsOffset
static bool canRewriteGEPAsOffset(Value *Start, Value *Base, GEPNoWrapFlags &NW, const DataLayout &DL, SetVector< Value * > &Explored)
Returns true if we can rewrite Start as a GEP with pointer Base and some integer offset.
Definition InstCombineCompares.cpp:393

foldFCmpFpTrunc
static Instruction * foldFCmpFpTrunc(FCmpInst &I, const Instruction &FPTrunc, const Constant &C)
Definition InstCombineCompares.cpp:8227

foldICmpXNegX
static Instruction * foldICmpXNegX(ICmpInst &I, InstCombiner::BuilderTy &Builder)
Definition InstCombineCompares.cpp:4937

processUGT_ADDCST_ADD
static Instruction * processUGT_ADDCST_ADD(ICmpInst &I, Value *A, Value *B, ConstantInt *CI2, ConstantInt *CI1, InstCombinerImpl &IC)
The caller has matched a pattern of the form: I = icmp ugt (add (add A, B), CI2), CI1 If this is of t...
Definition InstCombineCompares.cpp:1060

foldShiftIntoShiftInAnotherHandOfAndInICmp
static Value * foldShiftIntoShiftInAnotherHandOfAndInICmp(ICmpInst &I, const SimplifyQuery SQ, InstCombiner::BuilderTy &Builder)
Definition InstCombineCompares.cpp:4696

isSignTest
static bool isSignTest(ICmpInst::Predicate &Pred, const APInt &C)
Returns true if the exploded icmp can be expressed as a signed comparison to zero and updates the pre...
Definition InstCombineCompares.cpp:83

transformToIndexedCompare
static Instruction * transformToIndexedCompare(GEPOperator *GEPLHS, Value *RHS, CmpPredicate Cond, const DataLayout &DL, InstCombiner &IC)
Converts (CMP GEPLHS, RHS) if this change would make RHS a constant.
Definition InstCombineCompares.cpp:601

foldCtpopPow2Test
static Instruction * foldCtpopPow2Test(ICmpInst &I, IntrinsicInst *CtpopLhs, const APInt &CRhs, InstCombiner::BuilderTy &Builder, const SimplifyQuery &Q)
Definition InstCombineCompares.cpp:3755

setInsertionPoint
static void setInsertionPoint(IRBuilder<> &Builder, Value *V, bool Before=true)
Definition InstCombineCompares.cpp:481

isNeutralValue
static bool isNeutralValue(Instruction::BinaryOps BinaryOp, Value *RHS, bool IsSigned)
Definition InstCombineCompares.cpp:6435

isMultipleOf
static bool isMultipleOf(Value *X, const APInt &C, const SimplifyQuery &Q)
Return true if X is a multiple of C.
Definition InstCombineCompares.cpp:5112

foldICmpWithTruncSignExtendedVal
static Value * foldICmpWithTruncSignExtendedVal(ICmpInst &I, InstCombiner::BuilderTy &Builder)
Some comparisons can be simplified.
Definition InstCombineCompares.cpp:4622

foldICmpOrXX
static Instruction * foldICmpOrXX(ICmpInst &I, const SimplifyQuery &Q, InstCombinerImpl &IC)
Definition InstCombineCompares.cpp:5031

InstCombineInternal.h
This file provides internal interfaces used to implement the InstCombine.

InstCombiner.h
This file provides the interface for the instcombine pass implementation.

InstrTypes.h

InstructionSimplify.h

Instructions.h

Ops
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
Definition ItaniumDemangle.h:3368

KnownBits.h

isZero
static bool isZero(Value *V, const DataLayout &DL, DominatorTree *DT, AssumptionCache *AC)
Definition Lint.cpp:546

Loads.h

F
#define F(x, y, z)
Definition MD5.cpp:55

I
#define I(x, y, z)
Definition MD5.cpp:58

Operands
mir Rename Register Operands
Definition MIRNamerPass.cpp:74

T1
#define T1
Definition Mips16ISelLowering.cpp:352

II
uint64_t IntrinsicInst * II
Definition NVVMIntrRange.cpp:46

P
#define P(N)

PatternMatch.h

Cond
const SmallVectorImpl< MachineOperand > & Cond
Definition RISCVRedundantCopyElimination.cpp:71

Mode
static cl::opt< RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode > Mode("regalloc-enable-advisor", cl::Hidden, cl::init(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default), cl::desc("Enable regalloc advisor mode"), cl::values(clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default, "default", "Default"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Release, "release", "precompiled"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Development, "development", "for training")))

SetVector.h
This file implements a set that has insertion order iteration characteristics.

Statistic.h
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...

STATISTIC
#define STATISTIC(VARNAME, DESC)
Definition Statistic.h:167

Y
static TableGen::Emitter::Opt Y("gen-skeleton-entry", EmitSkeleton, "Generate example skeleton entry")

X
static TableGen::Emitter::OptClass< SkeletonEmitter > X("gen-skeleton-class", "Generate example skeleton class")

getType
static SymbolRef::Type getType(const Symbol *Sym)
Definition TapiFile.cpp:39

IntX
@ IntX
Definition TargetLibraryInfo.cpp:68

VectorUtils.h

RHS
Value * RHS
Definition X86PartialReduction.cpp:74

LHS
Value * LHS
Definition X86PartialReduction.cpp:73

Mul
BinaryOperator * Mul
Definition X86PartialReduction.cpp:68

BaseType

llvm::APFloat
Definition APFloat.h:900

llvm::APFloat::convert
LLVM_ABI opStatus convert(const fltSemantics &ToSemantics, roundingMode RM, bool *losesInfo)
Definition APFloat.cpp:6057

llvm::APFloat::clearSign
void clearSign()
Definition APFloat.h:1298

llvm::APFloat::isNaN
bool isNaN() const
Definition APFloat.h:1447

llvm::APFloat::isZero
bool isZero() const
Definition APFloat.h:1445

llvm::APFloat::getSmallestNormalized
static APFloat getSmallestNormalized(const fltSemantics &Sem, bool Negative=false)
Returns the smallest (by magnitude) normalized finite number in the given semantics.
Definition APFloat.h:1158

llvm::APFloat::bitcastToAPInt
APInt bitcastToAPInt() const
Definition APFloat.h:1353

llvm::APFloat::getLargest
static APFloat getLargest(const fltSemantics &Sem, bool Negative=false)
Returns the largest finite number in the given semantics.
Definition APFloat.h:1138

llvm::APFloat::next
opStatus next(bool nextDown)
Definition APFloat.h:1254

llvm::APFloat::getInf
static APFloat getInf(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative Infinity.
Definition APFloat.h:1098

llvm::APFloat::classify
LLVM_ABI FPClassTest classify() const
Return the FPClassTest which will return true for the value.
Definition APFloat.cpp:5986

llvm::APFloat::roundToIntegral
opStatus roundToIntegral(roundingMode RM)
Definition APFloat.h:1248

llvm::APFloat::isInfinity
bool isInfinity() const
Definition APFloat.h:1446

llvm::APInt
Class for arbitrary precision integers.
Definition APInt.h:78

llvm::APInt::udiv
LLVM_ABI APInt udiv(const APInt &RHS) const
Unsigned division operation.
Definition APInt.cpp:1573

llvm::APInt::getAllOnes
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
Definition APInt.h:234

llvm::APInt::udivrem
static LLVM_ABI void udivrem(const APInt &LHS, const APInt &RHS, APInt &Quotient, APInt &Remainder)
Dual division/remainder interface.
Definition APInt.cpp:1758

llvm::APInt::isNegatedPowerOf2
bool isNegatedPowerOf2() const
Check if this APInt's negated value is a power of two greater than zero.
Definition APInt.h:449

llvm::APInt::zext
LLVM_ABI APInt zext(unsigned width) const
Zero extend to a new width.
Definition APInt.cpp:1012

llvm::APInt::getSignMask
static APInt getSignMask(unsigned BitWidth)
Get the SignMask for a specific bit width.
Definition APInt.h:229

llvm::APInt::isMinSignedValue
bool isMinSignedValue() const
Determine if this is the smallest signed value.
Definition APInt.h:423

llvm::APInt::getZExtValue
uint64_t getZExtValue() const
Get zero extended value.
Definition APInt.h:1540

llvm::APInt::getActiveBits
unsigned getActiveBits() const
Compute the number of active bits in the value.
Definition APInt.h:1512

llvm::APInt::trunc
LLVM_ABI APInt trunc(unsigned width) const
Truncate to new width.
Definition APInt.cpp:936

llvm::APInt::getMaxValue
static APInt getMaxValue(unsigned numBits)
Gets maximum unsigned value of APInt for specific bit width.
Definition APInt.h:206

llvm::APInt::setBit
void setBit(unsigned BitPosition)
Set the given bit to 1 whose position is given as "bitPosition".
Definition APInt.h:1330

llvm::APInt::abs
APInt abs() const
Get the absolute value.
Definition APInt.h:1795

llvm::APInt::ceilLogBase2
unsigned ceilLogBase2() const
Definition APInt.h:1764

llvm::APInt::Rounding::DOWN
@ DOWN
Definition APInt.h:89

llvm::APInt::Rounding::UP
@ UP
Definition APInt.h:91

llvm::APInt::sgt
bool sgt(const APInt &RHS) const
Signed greater than comparison.
Definition APInt.h:1201

llvm::APInt::isAllOnes
bool isAllOnes() const
Determine if all bits are set. This is true for zero-width values.
Definition APInt.h:371

llvm::APInt::usub_ov
LLVM_ABI APInt usub_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1948

llvm::APInt::ugt
bool ugt(const APInt &RHS) const
Unsigned greater than comparison.
Definition APInt.h:1182

llvm::APInt::isZero
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
Definition APInt.h:380

llvm::APInt::isSignMask
bool isSignMask() const
Check if the APInt's value is returned by getSignMask.
Definition APInt.h:466

llvm::APInt::getBitWidth
unsigned getBitWidth() const
Return the number of bits in the APInt.
Definition APInt.h:1488

llvm::APInt::ult
bool ult(const APInt &RHS) const
Unsigned less than comparison.
Definition APInt.h:1111

llvm::APInt::getSignedMaxValue
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
Definition APInt.h:209

llvm::APInt::getMinValue
static APInt getMinValue(unsigned numBits)
Gets minimum unsigned value of APInt for a specific bit width.
Definition APInt.h:216

llvm::APInt::isNegative
bool isNegative() const
Determine sign of this APInt.
Definition APInt.h:329

llvm::APInt::sadd_ov
LLVM_ABI APInt sadd_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1928

llvm::APInt::eq
bool eq(const APInt &RHS) const
Equality comparison.
Definition APInt.h:1079

llvm::APInt::sdiv
LLVM_ABI APInt sdiv(const APInt &RHS) const
Signed division function for APInt.
Definition APInt.cpp:1644

llvm::APInt::uadd_ov
LLVM_ABI APInt uadd_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1935

llvm::APInt::negate
void negate()
Negate this APInt in place.
Definition APInt.h:1468

llvm::APInt::countr_zero
unsigned countr_zero() const
Count the number of trailing zero bits.
Definition APInt.h:1639

llvm::APInt::countl_zero
unsigned countl_zero() const
The APInt version of std::countl_zero.
Definition APInt.h:1598

llvm::APInt::getSignedMinValue
static APInt getSignedMinValue(unsigned numBits)
Gets minimum signed value of APInt for a specific bit width.
Definition APInt.h:219

llvm::APInt::isStrictlyPositive
bool isStrictlyPositive() const
Determine if this APInt Value is positive.
Definition APInt.h:356

llvm::APInt::flipAllBits
void flipAllBits()
Toggle every bit to its opposite value.
Definition APInt.h:1452

llvm::APInt::countl_one
unsigned countl_one() const
Count the number of leading one bits.
Definition APInt.h:1615

llvm::APInt::logBase2
unsigned logBase2() const
Definition APInt.h:1761

llvm::APInt::getLimitedValue
uint64_t getLimitedValue(uint64_t Limit=UINT64_MAX) const
If this value is smaller than the specified limit, return it, otherwise return the limit value.
Definition APInt.h:475

llvm::APInt::ashr
APInt ashr(unsigned ShiftAmt) const
Arithmetic right-shift function.
Definition APInt.h:827

llvm::APInt::isMaxSignedValue
bool isMaxSignedValue() const
Determine if this is the largest signed value.
Definition APInt.h:405

llvm::APInt::ule
bool ule(const APInt &RHS) const
Unsigned less or equal comparison.
Definition APInt.h:1150

llvm::APInt::shl
APInt shl(unsigned shiftAmt) const
Left-shift function.
Definition APInt.h:873

llvm::APInt::isPowerOf2
bool isPowerOf2() const
Check if this APInt's value is a power of two greater than zero.
Definition APInt.h:440

llvm::APInt::getLowBitsSet
static APInt getLowBitsSet(unsigned numBits, unsigned loBitsSet)
Constructs an APInt value that has the bottom loBitsSet bits set.
Definition APInt.h:306

llvm::APInt::getHighBitsSet
static APInt getHighBitsSet(unsigned numBits, unsigned hiBitsSet)
Constructs an APInt value that has the top hiBitsSet bits set.
Definition APInt.h:296

llvm::APInt::getZero
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
Definition APInt.h:200

llvm::APInt::sge
bool sge(const APInt &RHS) const
Signed greater or equal comparison.
Definition APInt.h:1237

llvm::APInt::ssub_ov
LLVM_ABI APInt ssub_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1941

llvm::APInt::isOne
bool isOne() const
Determine if this is a value of 1.
Definition APInt.h:389

llvm::APInt::getBitsSetFrom
static APInt getBitsSetFrom(unsigned numBits, unsigned loBit)
Constructs an APInt value that has a contiguous range of bits set.
Definition APInt.h:286

llvm::APInt::getOneBitSet
static APInt getOneBitSet(unsigned numBits, unsigned BitNo)
Return an APInt with exactly one bit set in the result.
Definition APInt.h:239

llvm::APInt::lshr
APInt lshr(unsigned shiftAmt) const
Logical right-shift function.
Definition APInt.h:851

llvm::APInt::countr_one
unsigned countr_one() const
Count the number of trailing one bits.
Definition APInt.h:1656

llvm::APInt::uge
bool uge(const APInt &RHS) const
Unsigned greater or equal comparison.
Definition APInt.h:1221

llvm::APSInt
An arbitrary precision integer that knows its signedness.
Definition APSInt.h:24

llvm::AllocaInst
an instruction to allocate memory on the stack
Definition Instructions.h:64

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:41

llvm::BasicBlockEdge
Definition Dominators.h:97

llvm::BasicBlock
LLVM Basic Block Representation.
Definition BasicBlock.h:62

llvm::BasicBlock::getFirstInsertionPt
LLVM_ABI const_iterator getFirstInsertionPt() const
Returns an iterator to the first instruction in this block that is suitable for inserting a non-PHI i...
Definition BasicBlock.cpp:393

llvm::BasicBlock::getSinglePredecessor
LLVM_ABI const BasicBlock * getSinglePredecessor() const
Return the predecessor of this block if it has a single predecessor block.
Definition BasicBlock.cpp:437

llvm::BasicBlock::getTerminator
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction if the block is well formed or null if the block is not well forme...
Definition BasicBlock.h:233

llvm::BinaryOperator
Definition InstrTypes.h:171

llvm::BinaryOperator::getOpcode
BinaryOps getOpcode() const
Definition InstrTypes.h:374

llvm::BinaryOperator::CreateNot
static LLVM_ABI BinaryOperator * CreateNot(Value *Op, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Definition Instructions.cpp:2724

llvm::BinaryOperator::Create
static LLVM_ABI BinaryOperator * Create(BinaryOps Op, Value *S1, Value *S2, const Twine &Name=Twine(), InsertPosition InsertBefore=nullptr)
Construct a binary instruction, given the opcode and the two operands.
Definition Instructions.cpp:2703

llvm::BranchInst
Conditional or Unconditional Branch instruction.
Definition Instructions.h:3057

llvm::CallBase::getArgOperand
Value * getArgOperand(unsigned i) const
Definition InstrTypes.h:1292

llvm::CallInst
This class represents a function call, abstracting a target machine's calling convention.
Definition Instructions.h:1510

llvm::CallInst::Create
static CallInst * Create(FunctionType *Ty, Value *F, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Definition Instructions.h:1545

llvm::CmpInst
This class is the base class for the comparison instructions.
Definition InstrTypes.h:666

llvm::CmpInst::makeCmpResultType
static Type * makeCmpResultType(Type *opnd_type)
Create a result type for fcmp/icmp.
Definition InstrTypes.h:984

llvm::CmpInst::getStrictPredicate
Predicate getStrictPredicate() const
For example, SGE -> SGT, SLE -> SLT, ULE -> ULT, UGE -> UGT.
Definition InstrTypes.h:860

llvm::CmpInst::getFlippedStrictnessPredicate
static LLVM_ABI Predicate getFlippedStrictnessPredicate(Predicate pred)
This is a static version that you can use without an instruction available.
Definition Instructions.cpp:3793

llvm::CmpInst::Predicate
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:678

llvm::CmpInst::FCMP_OEQ
@ FCMP_OEQ
0 0 0 1 True if ordered and equal
Definition InstrTypes.h:681

llvm::CmpInst::BAD_ICMP_PREDICATE
@ BAD_ICMP_PREDICATE
Definition InstrTypes.h:711

llvm::CmpInst::FCMP_TRUE
@ FCMP_TRUE
1 1 1 1 Always true (always folded)
Definition InstrTypes.h:695

llvm::CmpInst::ICMP_SLT
@ ICMP_SLT
signed less than
Definition InstrTypes.h:707

llvm::CmpInst::ICMP_SLE
@ ICMP_SLE
signed less or equal
Definition InstrTypes.h:708

llvm::CmpInst::FCMP_OLT
@ FCMP_OLT
0 1 0 0 True if ordered and less than
Definition InstrTypes.h:684

llvm::CmpInst::FCMP_ULE
@ FCMP_ULE
1 1 0 1 True if unordered, less than, or equal
Definition InstrTypes.h:693

llvm::CmpInst::FCMP_OGT
@ FCMP_OGT
0 0 1 0 True if ordered and greater than
Definition InstrTypes.h:682

llvm::CmpInst::FCMP_OGE
@ FCMP_OGE
0 0 1 1 True if ordered and greater than or equal
Definition InstrTypes.h:683

llvm::CmpInst::ICMP_UGE
@ ICMP_UGE
unsigned greater or equal
Definition InstrTypes.h:702

llvm::CmpInst::ICMP_UGT
@ ICMP_UGT
unsigned greater than
Definition InstrTypes.h:701

llvm::CmpInst::ICMP_SGT
@ ICMP_SGT
signed greater than
Definition InstrTypes.h:705

llvm::CmpInst::FCMP_ULT
@ FCMP_ULT
1 1 0 0 True if unordered or less than
Definition InstrTypes.h:692

llvm::CmpInst::FCMP_ONE
@ FCMP_ONE
0 1 1 0 True if ordered and operands are unequal
Definition InstrTypes.h:686

llvm::CmpInst::FCMP_UEQ
@ FCMP_UEQ
1 0 0 1 True if unordered or equal
Definition InstrTypes.h:689

llvm::CmpInst::ICMP_ULT
@ ICMP_ULT
unsigned less than
Definition InstrTypes.h:703

llvm::CmpInst::FCMP_UGT
@ FCMP_UGT
1 0 1 0 True if unordered or greater than
Definition InstrTypes.h:690

llvm::CmpInst::FCMP_OLE
@ FCMP_OLE
0 1 0 1 True if ordered and less than or equal
Definition InstrTypes.h:685

llvm::CmpInst::FCMP_ORD
@ FCMP_ORD
0 1 1 1 True if ordered (no nans)
Definition InstrTypes.h:687

llvm::CmpInst::ICMP_EQ
@ ICMP_EQ
equal
Definition InstrTypes.h:699

llvm::CmpInst::ICMP_NE
@ ICMP_NE
not equal
Definition InstrTypes.h:700

llvm::CmpInst::ICMP_SGE
@ ICMP_SGE
signed greater or equal
Definition InstrTypes.h:706

llvm::CmpInst::FCMP_UNE
@ FCMP_UNE
1 1 1 0 True if unordered or not equal
Definition InstrTypes.h:694

llvm::CmpInst::ICMP_ULE
@ ICMP_ULE
unsigned less or equal
Definition InstrTypes.h:704

llvm::CmpInst::FCMP_UGE
@ FCMP_UGE
1 0 1 1 True if unordered, greater than, or equal
Definition InstrTypes.h:691

llvm::CmpInst::FCMP_FALSE
@ FCMP_FALSE
0 0 0 0 Always false (always folded)
Definition InstrTypes.h:680

llvm::CmpInst::FCMP_UNO
@ FCMP_UNO
1 0 0 0 True if unordered: isnan(X) | isnan(Y)
Definition InstrTypes.h:688

llvm::CmpInst::isSigned
bool isSigned() const
Definition InstrTypes.h:932

llvm::CmpInst::getSwappedPredicate
Predicate getSwappedPredicate() const
For example, EQ->EQ, SLE->SGE, ULT->UGT, OEQ->OEQ, ULE->UGE, OLT->OGT, etc.
Definition InstrTypes.h:829

llvm::CmpInst::isTrueWhenEqual
bool isTrueWhenEqual() const
This is just a convenience.
Definition InstrTypes.h:944

llvm::CmpInst::Create
static LLVM_ABI CmpInst * Create(OtherOps Op, Predicate Pred, Value *S1, Value *S2, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Construct a compare instruction, given the opcode, the predicate and the two operands.
Definition Instructions.cpp:3509

llvm::CmpInst::getNonStrictPredicate
Predicate getNonStrictPredicate() const
For example, SGT -> SGE, SLT -> SLE, ULT -> ULE, UGT -> UGE.
Definition InstrTypes.h:873

llvm::CmpInst::isStrictPredicate
static LLVM_ABI bool isStrictPredicate(Predicate predicate)
This is a static version that you can use without an instruction available.
Definition Instructions.cpp:3731

llvm::CmpInst::getInversePredicate
Predicate getInversePredicate() const
For example, EQ -> NE, UGT -> ULE, SLT -> SGE, OEQ -> UNE, UGT -> OLE, OLT -> UGE,...
Definition InstrTypes.h:791

llvm::CmpInst::getPredicate
Predicate getPredicate() const
Return the predicate for this instruction.
Definition InstrTypes.h:767

llvm::CmpInst::isIntPredicate
static bool isIntPredicate(Predicate P)
Definition InstrTypes.h:778

llvm::CmpInst::isUnsigned
bool isUnsigned() const
Definition InstrTypes.h:938

llvm::CmpPredicate
An abstraction over a floating-point predicate, and a pack of an integer predicate with samesign info...
Definition CmpPredicate.h:23

llvm::CmpPredicate::getSwapped
static LLVM_ABI CmpPredicate getSwapped(CmpPredicate P)
Get the swapped predicate of a CmpPredicate.
Definition Instructions.cpp:4038

llvm::ConstantExpr::getIntToPtr
static LLVM_ABI Constant * getIntToPtr(Constant *C, Type *Ty, bool OnlyIfReduced=false)
Definition Constants.cpp:2314

llvm::ConstantExpr::getPointerBitCastOrAddrSpaceCast
static LLVM_ABI Constant * getPointerBitCastOrAddrSpaceCast(Constant *C, Type *Ty)
Create a BitCast or AddrSpaceCast for a pointer type depending on the address space.
Definition Constants.cpp:2261

llvm::ConstantExpr::getSub
static LLVM_ABI Constant * getSub(Constant *C1, Constant *C2, bool HasNUW=false, bool HasNSW=false)
Definition Constants.cpp:2654

llvm::ConstantExpr::getNot
static LLVM_ABI Constant * getNot(Constant *C)
Definition Constants.cpp:2641

llvm::ConstantExpr::getPtrToInt
static LLVM_ABI Constant * getPtrToInt(Constant *C, Type *Ty, bool OnlyIfReduced=false)
Definition Constants.cpp:2300

llvm::ConstantExpr::getXor
static LLVM_ABI Constant * getXor(Constant *C1, Constant *C2)
Definition Constants.cpp:2661

llvm::ConstantExpr::getNeg
static LLVM_ABI Constant * getNeg(Constant *C, bool HasNSW=false)
Definition Constants.cpp:2635

llvm::ConstantFP::getZero
static LLVM_ABI Constant * getZero(Type *Ty, bool Negative=false)
Definition Constants.cpp:1059

llvm::ConstantInt
This is the shared class of boolean and integer constants.
Definition Constants.h:87

llvm::ConstantInt::getLimitedValue
uint64_t getLimitedValue(uint64_t Limit=~0ULL) const
getLimitedValue - If the value is smaller than the specified limit, return it, otherwise return the l...
Definition Constants.h:264

llvm::ConstantInt::getTrue
static LLVM_ABI ConstantInt * getTrue(LLVMContext &Context)
Definition Constants.cpp:868

llvm::ConstantInt::isZero
bool isZero() const
This is just a convenience method to make client code smaller for a common code.
Definition Constants.h:214

llvm::ConstantInt::getSigned
static ConstantInt * getSigned(IntegerType *Ty, int64_t V)
Return a ConstantInt with the specified value for the specified type.
Definition Constants.h:131

llvm::ConstantInt::getFalse
static LLVM_ABI ConstantInt * getFalse(LLVMContext &Context)
Definition Constants.cpp:875

llvm::ConstantInt::getBitWidth
unsigned getBitWidth() const
getBitWidth - Return the scalar bitwidth of this constant.
Definition Constants.h:157

llvm::ConstantInt::getValue
const APInt & getValue() const
Return the constant as an APInt value reference.
Definition Constants.h:154

llvm::ConstantInt::getBool
static LLVM_ABI ConstantInt * getBool(LLVMContext &Context, bool V)
Definition Constants.cpp:882

llvm::ConstantRange
This class represents a range of values.
Definition ConstantRange.h:47

llvm::ConstantRange::add
LLVM_ABI ConstantRange add(const ConstantRange &Other) const
Return a new range representing the possible values resulting from an addition of a value in this ran...
Definition ConstantRange.cpp:1097

llvm::ConstantRange::exactUnionWith
LLVM_ABI std::optional< ConstantRange > exactUnionWith(const ConstantRange &CR) const
Union the two ranges and return the result if it can be represented exactly, otherwise return std::nu...
Definition ConstantRange.cpp:780

llvm::ConstantRange::getEquivalentICmp
LLVM_ABI bool getEquivalentICmp(CmpInst::Predicate &Pred, APInt &RHS) const
Set up Pred and RHS such that ConstantRange::makeExactICmpRegion(Pred, RHS) == *this.
Definition ConstantRange.cpp:246

llvm::ConstantRange::subtract
LLVM_ABI ConstantRange subtract(const APInt &CI) const
Subtract the specified constant from the endpoints of this constant range.
Definition ConstantRange.cpp:559

llvm::ConstantRange::getSingleElement
const APInt * getSingleElement() const
If this set contains a single element, return it, otherwise return null.
Definition ConstantRange.h:257

llvm::ConstantRange::difference
LLVM_ABI ConstantRange difference(const ConstantRange &CR) const
Subtract the specified range from this range (aka relative complement of the sets).
Definition ConstantRange.cpp:567

llvm::ConstantRange::isEmptySet
LLVM_ABI bool isEmptySet() const
Return true if this set contains no members.
Definition ConstantRange.cpp:428

llvm::ConstantRange::truncate
LLVM_ABI ConstantRange truncate(uint32_t BitWidth, unsigned NoWrapKind=0) const
Return a new range in the specified integer type, which must be strictly smaller than the current typ...
Definition ConstantRange.cpp:875

llvm::ConstantRange::makeExactICmpRegion
static LLVM_ABI ConstantRange makeExactICmpRegion(CmpInst::Predicate Pred, const APInt &Other)
Produce the exact range such that all values in the returned range satisfy the given predicate with a...
Definition ConstantRange.cpp:169

llvm::ConstantRange::inverse
LLVM_ABI ConstantRange inverse() const
Return a new range that is the logical not of the current set.
Definition ConstantRange.cpp:1959

llvm::ConstantRange::exactIntersectWith
LLVM_ABI std::optional< ConstantRange > exactIntersectWith(const ConstantRange &CR) const
Intersect the two ranges and return the result if it can be represented exactly, otherwise return std...
Definition ConstantRange.cpp:771

llvm::ConstantRange::intersectWith
LLVM_ABI ConstantRange intersectWith(const ConstantRange &CR, PreferredRangeType Type=Smallest) const
Return the range that results from the intersection of this range with another range.
Definition ConstantRange.cpp:591

llvm::ConstantRange::sub
LLVM_ABI ConstantRange sub(const ConstantRange &Other) const
Return a new range representing the possible values resulting from a subtraction of a value in this r...
Definition ConstantRange.cpp:1144

llvm::ConstantRange::makeExactNoWrapRegion
static LLVM_ABI ConstantRange makeExactNoWrapRegion(Instruction::BinaryOps BinOp, const APInt &Other, unsigned NoWrapKind)
Produce the range that contains X if and only if "X BinOp Other" does not wrap.
Definition ConstantRange.cpp:399

llvm::ConstantVector::getSplat
static LLVM_ABI Constant * getSplat(ElementCount EC, Constant *Elt)
Return a ConstantVector with the specified constant in each element.
Definition Constants.cpp:1474

llvm::Constant
This is an important base class in LLVM.
Definition Constant.h:43

llvm::Constant::getIntegerValue
static LLVM_ABI Constant * getIntegerValue(Type *Ty, const APInt &V)
Return the value for an integer or pointer constant, or a vector thereof, with the given scalar value...
Definition Constants.cpp:403

llvm::Constant::getAllOnesValue
static LLVM_ABI Constant * getAllOnesValue(Type *Ty)
Definition Constants.cpp:420

llvm::Constant::getUniqueInteger
LLVM_ABI const APInt & getUniqueInteger() const
If C is a constant integer then return its value, otherwise C must be a vector of constant integers,...
Definition Constants.cpp:1778

llvm::Constant::getNullValue
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
Definition Constants.cpp:373

llvm::Constant::isNullValue
LLVM_ABI bool isNullValue() const
Return true if this is the value that would be returned by getNullValue.
Definition Constants.cpp:90

llvm::DataLayout
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:63

llvm::DenseMapBase::find
iterator find(const_arg_type_t< KeyT > Val)
Definition DenseMap.h:165

llvm::DenseMapBase::end
iterator end()
Definition DenseMap.h:81

llvm::DenseMapBase::contains
bool contains(const_arg_type_t< KeyT > Val) const
Return true if the specified key is in the map, false otherwise.
Definition DenseMap.h:156

llvm::DenseMap
Definition DenseMap.h:700

llvm::ExtractValueInst::Create
static ExtractValueInst * Create(Value *Agg, ArrayRef< unsigned > Idxs, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Definition Instructions.h:2456

llvm::FCmpInst
This instruction compares its operands according to the predicate given to the constructor.
Definition Instructions.h:1410

llvm::FCmpInst::isEquality
static bool isEquality(Predicate Pred)
Definition Instructions.h:1453

llvm::Function
Definition Function.h:64

llvm::GEPNoWrapFlags
Represents flags for the getelementptr instruction/expression.
Definition GEPNoWrapFlags.h:26

llvm::GEPNoWrapFlags::hasNoUnsignedSignedWrap
bool hasNoUnsignedSignedWrap() const
Definition GEPNoWrapFlags.h:64

llvm::GEPNoWrapFlags::hasNoUnsignedWrap
bool hasNoUnsignedWrap() const
Definition GEPNoWrapFlags.h:65

llvm::GEPNoWrapFlags::isInBounds
bool isInBounds() const
Definition GEPNoWrapFlags.h:63

llvm::GEPNoWrapFlags::intersectForOffsetAdd
GEPNoWrapFlags intersectForOffsetAdd(GEPNoWrapFlags Other) const
Given (gep (gep p, x), y), determine the nowrap flags for (gep p, x+y).
Definition GEPNoWrapFlags.h:78

llvm::GEPNoWrapFlags::none
static GEPNoWrapFlags none()
Definition GEPNoWrapFlags.h:46

llvm::GEPOperator
Definition Operator.h:420

llvm::GEPOperator::isInBounds
bool isInBounds() const
Test whether this is an inbounds GEP, as defined by LangRef.html.
Definition Operator.h:430

llvm::GEPOperator::getSourceElementType
LLVM_ABI Type * getSourceElementType() const
Definition Operator.cpp:70

llvm::GEPOperator::getPointerOperand
Value * getPointerOperand()
Definition Operator.h:457

llvm::GEPOperator::getNoWrapFlags
GEPNoWrapFlags getNoWrapFlags() const
Definition Operator.h:425

llvm::GEPOperator::hasAllConstantIndices
bool hasAllConstantIndices() const
Return true if all of the indices of this GEP are constant integers.
Definition Operator.h:504

llvm::GetElementPtrInst
an instruction for type-safe pointer arithmetic to access elements of arrays and structs
Definition Instructions.h:949

llvm::ICmpInst
This instruction compares its operands according to the predicate given to the constructor.
Definition Instructions.h:1177

llvm::ICmpInst::isGE
static bool isGE(Predicate P)
Return true if the predicate is SGE or UGE.
Definition Instructions.h:1360

llvm::ICmpInst::compare
static LLVM_ABI bool compare(const APInt &LHS, const APInt &RHS, ICmpInst::Predicate Pred)
Return result of LHS Pred RHS comparison.
Definition Instructions.cpp:3820

llvm::ICmpInst::isLT
static bool isLT(Predicate P)
Return true if the predicate is SLT or ULT.
Definition Instructions.h:1354

llvm::ICmpInst::isGT
static bool isGT(Predicate P)
Return true if the predicate is SGT or UGT.
Definition Instructions.h:1348

llvm::ICmpInst::getFlippedSignednessPredicate
Predicate getFlippedSignednessPredicate() const
For example, SLT->ULT, ULT->SLT, SLE->ULE, ULE->SLE, EQ->EQ.
Definition Instructions.h:1296

llvm::ICmpInst::getSignedPredicate
Predicate getSignedPredicate() const
For example, EQ->EQ, SLE->SLE, UGT->SGT, etc.
Definition Instructions.h:1269

llvm::ICmpInst::isEquality
bool isEquality() const
Return true if this predicate is either EQ or NE.
Definition Instructions.h:1322

llvm::ICmpInst::isEquality
static bool isEquality(Predicate P)
Return true if this predicate is either EQ or NE.
Definition Instructions.h:1316

llvm::ICmpInst::isRelational
bool isRelational() const
Return true if the predicate is relational (not EQ or NE).
Definition Instructions.h:1336

llvm::ICmpInst::getUnsignedPredicate
Predicate getUnsignedPredicate() const
For example, EQ->EQ, SLE->ULE, UGT->UGT, etc.
Definition Instructions.h:1280

llvm::ICmpInst::isLE
static bool isLE(Predicate P)
Return true if the predicate is SLE or ULE.
Definition Instructions.h:1366

llvm::IRBuilderBase::InsertPointGuard
Definition IRBuilder.h:409

llvm::IRBuilderBase
Common base class shared among various IRBuilders.
Definition IRBuilder.h:114

llvm::IRBuilderBase::CreateAnd
Value * CreateAnd(Value *LHS, Value *RHS, const Twine &Name="")
Definition IRBuilder.h:1551

llvm::IRBuilderBase::SetInsertPoint
void SetInsertPoint(BasicBlock *TheBB)
This specifies that created instructions should be appended to the end of the specified block.
Definition IRBuilder.h:207

llvm::IRBuilderBase::CreateICmp
Value * CreateICmp(CmpInst::Predicate P, Value *LHS, Value *RHS, const Twine &Name="")
Definition IRBuilder.h:2439

llvm::IRBuilderBase::CreateOr
Value * CreateOr(Value *LHS, Value *RHS, const Twine &Name="", bool IsDisjoint=false)
Definition IRBuilder.h:1573

llvm::IRBuilderBase::getInt
ConstantInt * getInt(const APInt &AI)
Get a constant integer value.
Definition IRBuilder.h:538

llvm::IRBuilder
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition IRBuilder.h:2780

llvm::Init
Definition Record.h:286

llvm::InstCombinerImpl
Definition InstCombineInternal.h:62

llvm::InstCombinerImpl::foldICmpShrConstant
Instruction * foldICmpShrConstant(ICmpInst &Cmp, BinaryOperator *Shr, const APInt &C)
Fold icmp ({al}shr X, Y), C.
Definition InstCombineCompares.cpp:2499

llvm::InstCombinerImpl::FoldOpIntoSelect
Instruction * FoldOpIntoSelect(Instruction &Op, SelectInst *SI, bool FoldWithMultiUse=false)
Given an instruction with a select as one operand and a constant as the other operand,...
Definition InstructionCombining.cpp:1767

llvm::InstCombinerImpl::foldICmpWithZextOrSext
Instruction * foldICmpWithZextOrSext(ICmpInst &ICmp)
Definition InstCombineCompares.cpp:6255

llvm::InstCombinerImpl::foldICmpSelectConstant
Instruction * foldICmpSelectConstant(ICmpInst &Cmp, SelectInst *Select, ConstantInt *C)
Definition InstCombineCompares.cpp:3351

llvm::InstCombinerImpl::foldICmpSRemConstant
Instruction * foldICmpSRemConstant(ICmpInst &Cmp, BinaryOperator *UDiv, const APInt &C)
Definition InstCombineCompares.cpp:2663

llvm::InstCombinerImpl::foldICmpBinOpWithConstant
Instruction * foldICmpBinOpWithConstant(ICmpInst &Cmp, BinaryOperator *BO, const APInt &C)
Fold an icmp with BinaryOp and constant operand: icmp Pred BO, C.
Definition InstCombineCompares.cpp:3979

llvm::InstCombinerImpl::foldICmpOrConstant
Instruction * foldICmpOrConstant(ICmpInst &Cmp, BinaryOperator *Or, const APInt &C)
Fold icmp (or X, Y), C.
Definition InstCombineCompares.cpp:2077

llvm::InstCombinerImpl::foldICmpTruncWithTruncOrExt
Instruction * foldICmpTruncWithTruncOrExt(ICmpInst &Cmp, const SimplifyQuery &Q)
Fold icmp (trunc nuw/nsw X), (trunc nuw/nsw Y).
Definition InstCombineCompares.cpp:1529

llvm::InstCombinerImpl::foldSignBitTest
Instruction * foldSignBitTest(ICmpInst &I)
Fold equality-comparison between zero and any (maybe truncated) right-shift by one-less-than-bitwidth...
Definition InstCombineCompares.cpp:1166

llvm::InstCombinerImpl::foldOpIntoPhi
Instruction * foldOpIntoPhi(Instruction &I, PHINode *PN, bool AllowMultipleUses=false)
Given a binary operator, cast instruction, or select which has a PHI node as operand #0,...
Definition InstructionCombining.cpp:1860

llvm::InstCombinerImpl::insertRangeTest
Value * insertRangeTest(Value *V, const APInt &Lo, const APInt &Hi, bool isSigned, bool Inside)
Emit a computation of: (V >= Lo && V < Hi) if Inside is true, otherwise (V < Lo || V >= Hi).
Definition InstCombineAndOrXor.cpp:56

llvm::InstCombinerImpl::foldICmpBinOp
Instruction * foldICmpBinOp(ICmpInst &Cmp, const SimplifyQuery &SQ)
Try to fold icmp (binop), X or icmp X, (binop).
Definition InstCombineCompares.cpp:5126

llvm::InstCombinerImpl::foldCmpLoadFromIndexedGlobal
Instruction * foldCmpLoadFromIndexedGlobal(LoadInst *LI, GetElementPtrInst *GEP, CmpInst &ICI, ConstantInt *AndCst=nullptr)
This is called when we see this pattern: cmp pred (load (gep GV, ...)), cmpcst where GV is a global v...
Definition InstCombineCompares.cpp:113

llvm::InstCombinerImpl::foldICmpSubConstant
Instruction * foldICmpSubConstant(ICmpInst &Cmp, BinaryOperator *Sub, const APInt &C)
Fold icmp (sub X, Y), C.
Definition InstCombineCompares.cpp:2960

llvm::InstCombinerImpl::foldICmpInstWithConstantNotInt
Instruction * foldICmpInstWithConstantNotInt(ICmpInst &Cmp)
Handle icmp with constant (but not simple integer constant) RHS.
Definition InstCombineCompares.cpp:4292

llvm::InstCombinerImpl::SimplifyDemandedBits
bool SimplifyDemandedBits(Instruction *I, unsigned Op, const APInt &DemandedMask, KnownBits &Known, const SimplifyQuery &Q, unsigned Depth=0) override
This form of SimplifyDemandedBits simplifies the specified instruction operand if possible,...
Definition InstCombineSimplifyDemanded.cpp:95

llvm::InstCombinerImpl::foldICmpShlConstConst
Instruction * foldICmpShlConstConst(ICmpInst &I, Value *ShAmt, const APInt &C1, const APInt &C2)
Handle "(icmp eq/ne (shl AP2, A), AP1)" -> (icmp eq/ne A, TrailingZeros(AP1) - TrailingZeros(AP2)).
Definition InstCombineCompares.cpp:1016

llvm::InstCombinerImpl::reassociateShiftAmtsOfTwoSameDirectionShifts
Value * reassociateShiftAmtsOfTwoSameDirectionShifts(BinaryOperator *Sh0, const SimplifyQuery &SQ, bool AnalyzeForSignBitExtraction=false)
Definition InstCombineShifts.cpp:58

llvm::InstCombinerImpl::foldICmpEqIntrinsicWithConstant
Instruction * foldICmpEqIntrinsicWithConstant(ICmpInst &ICI, IntrinsicInst *II, const APInt &C)
Fold an equality icmp with LLVM intrinsic and constant operand.
Definition InstCombineCompares.cpp:3793

llvm::InstCombinerImpl::foldMultiplicationOverflowCheck
Value * foldMultiplicationOverflowCheck(ICmpInst &Cmp)
Fold (-1 u/ x) u< y ((x * y) ?
Definition InstCombineCompares.cpp:4869

llvm::InstCombinerImpl::foldICmpWithConstant
Instruction * foldICmpWithConstant(ICmpInst &Cmp)
Fold icmp Pred X, C.
Definition InstCombineCompares.cpp:1316

llvm::InstCombinerImpl::canonicalizeICmpPredicate
CmpInst * canonicalizeICmpPredicate(CmpInst &I)
If we have a comparison with a non-canonical predicate, if we can update all the users,...
Definition InstCombineCompares.cpp:7149

llvm::InstCombinerImpl::eraseInstFromFunction
Instruction * eraseInstFromFunction(Instruction &I) override
Combiner aware instruction erasure.
Definition InstCombineInternal.h:488

llvm::InstCombinerImpl::foldICmpWithZero
Instruction * foldICmpWithZero(ICmpInst &Cmp)
Definition InstCombineCompares.cpp:1197

llvm::InstCombinerImpl::foldICmpCommutative
Instruction * foldICmpCommutative(CmpPredicate Pred, Value *Op0, Value *Op1, ICmpInst &CxtI)
Definition InstCombineCompares.cpp:7458

llvm::InstCombinerImpl::foldICmpBinOpEqualityWithConstant
Instruction * foldICmpBinOpEqualityWithConstant(ICmpInst &Cmp, BinaryOperator *BO, const APInt &C)
Fold an icmp equality instruction with binary operator LHS and constant RHS: icmp eq/ne BO,...
Definition InstCombineCompares.cpp:3600

llvm::InstCombinerImpl::foldICmpUsingBoolRange
Instruction * foldICmpUsingBoolRange(ICmpInst &I)
If one operand of an icmp is effectively a bool (value range of {0,1}), then try to reduce patterns b...
Definition InstCombineCompares.cpp:7039

llvm::InstCombinerImpl::foldICmpWithTrunc
Instruction * foldICmpWithTrunc(ICmpInst &Cmp)
Definition InstCombineCompares.cpp:6212

llvm::InstCombinerImpl::foldICmpIntrinsicWithConstant
Instruction * foldICmpIntrinsicWithConstant(ICmpInst &ICI, IntrinsicInst *II, const APInt &C)
Fold an icmp with LLVM intrinsic and constant operand: icmp Pred II, C.
Definition InstCombineCompares.cpp:4184

llvm::InstCombinerImpl::matchThreeWayIntCompare
bool matchThreeWayIntCompare(SelectInst *SI, Value *&LHS, Value *&RHS, ConstantInt *&Less, ConstantInt *&Equal, ConstantInt *&Greater)
Match a select chain which produces one of three values based on whether the LHS is less than,...
Definition InstCombineCompares.cpp:3298

llvm::InstCombinerImpl::visitFCmpInst
Instruction * visitFCmpInst(FCmpInst &I)
Definition InstCombineCompares.cpp:8607

llvm::InstCombinerImpl::foldICmpUsingKnownBits
Instruction * foldICmpUsingKnownBits(ICmpInst &Cmp)
Try to fold the comparison based on range information we can get by checking whether bits are known t...
Definition InstCombineCompares.cpp:6826

llvm::InstCombinerImpl::foldICmpDivConstant
Instruction * foldICmpDivConstant(ICmpInst &Cmp, BinaryOperator *Div, const APInt &C)
Fold icmp ({su}div X, Y), C.
Definition InstCombineCompares.cpp:2778

llvm::InstCombinerImpl::foldIRemByPowerOfTwoToBitTest
Instruction * foldIRemByPowerOfTwoToBitTest(ICmpInst &I)
If we have: icmp eq/ne (urem/srem x, y), 0 iff y is a power-of-two, we can replace this with a bit te...
Definition InstCombineCompares.cpp:1147

llvm::InstCombinerImpl::foldFCmpIntToFPConst
Instruction * foldFCmpIntToFPConst(FCmpInst &I, Instruction *LHSI, Constant *RHSC)
Fold fcmp ([us]itofp x, cst) if possible.
Definition InstCombineCompares.cpp:7934

llvm::InstCombinerImpl::foldICmpUDivConstant
Instruction * foldICmpUDivConstant(ICmpInst &Cmp, BinaryOperator *UDiv, const APInt &C)
Fold icmp (udiv X, Y), C.
Definition InstCombineCompares.cpp:2745

llvm::InstCombinerImpl::foldICmpAddOpConst
Instruction * foldICmpAddOpConst(Value *X, const APInt &C, CmpPredicate Pred)
Fold "icmp pred (X+C), X".
Definition InstCombineCompares.cpp:907

llvm::InstCombinerImpl::foldICmpWithCastOp
Instruction * foldICmpWithCastOp(ICmpInst &ICmp)
Handle icmp (cast x), (cast or constant).
Definition InstCombineCompares.cpp:6368

llvm::InstCombinerImpl::foldICmpTruncConstant
Instruction * foldICmpTruncConstant(ICmpInst &Cmp, TruncInst *Trunc, const APInt &C)
Fold icmp (trunc X), C.
Definition InstCombineCompares.cpp:1442

llvm::InstCombinerImpl::foldICmpAddConstant
Instruction * foldICmpAddConstant(ICmpInst &Cmp, BinaryOperator *Add, const APInt &C)
Fold icmp (add X, Y), C.
Definition InstCombineCompares.cpp:3133

llvm::InstCombinerImpl::foldICmpMulConstant
Instruction * foldICmpMulConstant(ICmpInst &Cmp, BinaryOperator *Mul, const APInt &C)
Fold icmp (mul X, Y), C.
Definition InstCombineCompares.cpp:2178

llvm::InstCombinerImpl::tryFoldInstWithCtpopWithNot
Instruction * tryFoldInstWithCtpopWithNot(Instruction *I)
Definition InstructionCombining.cpp:846

llvm::InstCombinerImpl::foldICmpXorConstant
Instruction * foldICmpXorConstant(ICmpInst &Cmp, BinaryOperator *Xor, const APInt &C)
Fold icmp (xor X, Y), C.
Definition InstCombineCompares.cpp:1588

llvm::InstCombinerImpl::foldSelectICmp
Instruction * foldSelectICmp(CmpPredicate Pred, SelectInst *SI, Value *RHS, const ICmpInst &I)
Definition InstCombineCompares.cpp:4322

llvm::InstCombinerImpl::foldICmpInstWithConstantAllowPoison
Instruction * foldICmpInstWithConstantAllowPoison(ICmpInst &Cmp, const APInt &C)
Try to fold integer comparisons with a constant operand: icmp Pred X, C where X is some kind of instr...
Definition InstCombineCompares.cpp:3957

llvm::InstCombinerImpl::foldIsMultipleOfAPowerOfTwo
Instruction * foldIsMultipleOfAPowerOfTwo(ICmpInst &Cmp)
Fold icmp eq (num + mask) & ~mask, num to icmp eq (and num, mask), 0 Where mask is a low bit mask.
Definition InstCombineCompares.cpp:1286

llvm::InstCombinerImpl::foldICmpAndShift
Instruction * foldICmpAndShift(ICmpInst &Cmp, BinaryOperator *And, const APInt &C1, const APInt &C2)
Fold icmp (and (sh X, Y), C2), C1.
Definition InstCombineCompares.cpp:1689

llvm::InstCombinerImpl::foldICmpBinOpWithConstantViaTruthTable
Instruction * foldICmpBinOpWithConstantViaTruthTable(ICmpInst &Cmp, BinaryOperator *BO, const APInt &C)
Definition InstCombineCompares.cpp:3094

llvm::InstCombinerImpl::foldICmpInstWithConstant
Instruction * foldICmpInstWithConstant(ICmpInst &Cmp)
Try to fold integer comparisons with a constant operand: icmp Pred X, C where X is some kind of instr...
Definition InstCombineCompares.cpp:3553

llvm::InstCombinerImpl::foldICmpXorShiftConst
Instruction * foldICmpXorShiftConst(ICmpInst &Cmp, BinaryOperator *Xor, const APInt &C)
For power-of-2 C: ((X s>> ShiftC) ^ X) u< C --> (X + C) u< (C << 1) ((X s>> ShiftC) ^ X) u> (C - 1) -...
Definition InstCombineCompares.cpp:1660

llvm::InstCombinerImpl::foldICmpShlConstant
Instruction * foldICmpShlConstant(ICmpInst &Cmp, BinaryOperator *Shl, const APInt &C)
Fold icmp (shl X, Y), C.
Definition InstCombineCompares.cpp:2319

llvm::InstCombinerImpl::foldICmpAndConstant
Instruction * foldICmpAndConstant(ICmpInst &Cmp, BinaryOperator *And, const APInt &C)
Fold icmp (and X, Y), C.
Definition InstCombineCompares.cpp:1923

llvm::InstCombinerImpl::foldICmpEquality
Instruction * foldICmpEquality(ICmpInst &Cmp)
Definition InstCombineCompares.cpp:5959

llvm::InstCombinerImpl::foldICmpWithMinMax
Instruction * foldICmpWithMinMax(Instruction &I, MinMaxIntrinsic *MinMax, Value *Z, CmpPredicate Pred)
Fold icmp Pred min|max(X, Y), Z.
Definition InstCombineCompares.cpp:5638

llvm::InstCombinerImpl::dominatesAllUses
bool dominatesAllUses(const Instruction *DI, const Instruction *UI, const BasicBlock *DB) const
True when DB dominates all uses of DI except UI.
Definition InstCombineCompares.cpp:6723

llvm::InstCombinerImpl::foldAllocaCmp
bool foldAllocaCmp(AllocaInst *Alloca)
Definition InstCombineCompares.cpp:829

llvm::InstCombinerImpl::visitICmpInst
Instruction * visitICmpInst(ICmpInst &I)
Definition InstCombineCompares.cpp:7570

llvm::InstCombinerImpl::computeOverflow
OverflowResult computeOverflow(Instruction::BinaryOps BinaryOp, bool IsSigned, Value *LHS, Value *RHS, Instruction *CxtI) const
Definition InstCombineCompares.cpp:6450

llvm::InstCombinerImpl::foldICmpWithDominatingICmp
Instruction * foldICmpWithDominatingICmp(ICmpInst &Cmp)
Canonicalize icmp instructions based on dominating conditions.
Definition InstCombineCompares.cpp:1366

llvm::InstCombinerImpl::replacedSelectWithOperand
bool replacedSelectWithOperand(SelectInst *SI, const ICmpInst *Icmp, const unsigned SIOpd)
Try to replace select with select operand SIOpd in SI-ICmp sequence.
Definition InstCombineCompares.cpp:6798

llvm::InstCombinerImpl::foldICmpShrConstConst
Instruction * foldICmpShrConstConst(ICmpInst &I, Value *ShAmt, const APInt &C1, const APInt &C2)
Handle "(icmp eq/ne (ashr/lshr AP2, A), AP1)" -> (icmp eq/ne A, Log2(AP2/AP1)) -> (icmp eq/ne A,...
Definition InstCombineCompares.cpp:957

llvm::InstCombinerImpl::freelyInvertAllUsersOf
void freelyInvertAllUsersOf(Value *V, Value *IgnoredUser=nullptr)
Freely adapt every user of V as-if V was changed to !V.
Definition InstructionCombining.cpp:1435

llvm::InstCombinerImpl::foldICmpAndConstConst
Instruction * foldICmpAndConstConst(ICmpInst &Cmp, BinaryOperator *And, const APInt &C1)
Fold icmp (and X, C2), C1.
Definition InstCombineCompares.cpp:1776

llvm::InstCombinerImpl::foldICmpBitCast
Instruction * foldICmpBitCast(ICmpInst &Cmp)
Definition InstCombineCompares.cpp:3399

llvm::InstCombinerImpl::foldGEPICmp
Instruction * foldGEPICmp(GEPOperator *GEPLHS, Value *RHS, CmpPredicate Cond, Instruction &I)
Fold comparisons between a GEP instruction and something else.
Definition InstCombineCompares.cpp:645

llvm::InstCombiner
The core instruction combiner logic.
Definition InstCombiner.h:48

llvm::InstCombiner::computeOverflowForSignedSub
OverflowResult computeOverflowForSignedSub(const Value *LHS, const Value *RHS, const Instruction *CxtI) const
Definition InstCombiner.h:505

llvm::InstCombiner::SQ
SimplifyQuery SQ
Definition InstCombiner.h:77

llvm::InstCombiner::ComputeMaxSignificantBits
unsigned ComputeMaxSignificantBits(const Value *Op, const Instruction *CxtI=nullptr, unsigned Depth=0) const
Definition InstCombiner.h:462

llvm::InstCombiner::BuilderTy
IRBuilder< TargetFolder, IRBuilderCallbackInserter > BuilderTy
An IRBuilder that automatically inserts new instructions into the worklist.
Definition InstCombiner.h:60

llvm::InstCombiner::isFreeToInvert
bool isFreeToInvert(Value *V, bool WillInvertAllUses, bool &DoesConsume)
Return true if the specified value is free to invert (apply ~ to).
Definition InstCombiner.h:228

llvm::InstCombiner::computeOverflowForUnsignedMul
OverflowResult computeOverflowForUnsignedMul(const Value *LHS, const Value *RHS, const Instruction *CxtI, bool IsNSW=false) const
Definition InstCombiner.h:468

llvm::InstCombiner::getComplexity
static unsigned getComplexity(Value *V)
Assign a complexity or rank value to LLVM Values.
Definition InstCombiner.h:143

llvm::InstCombiner::TLI
TargetLibraryInfo & TLI
Definition InstCombiner.h:74

llvm::InstCombiner::replaceInstUsesWith
Instruction * replaceInstUsesWith(Instruction &I, Value *V)
A combiner-aware RAUW-like routine.
Definition InstCombiner.h:388

llvm::InstCombiner::MaxArraySizeForCombine
uint64_t MaxArraySizeForCombine
Maximum size of array considered when transforming.
Definition InstCombiner.h:56

llvm::InstCombiner::computeOverflowForSignedAdd
OverflowResult computeOverflowForSignedAdd(const WithCache< const Value * > &LHS, const WithCache< const Value * > &RHS, const Instruction *CxtI) const
Definition InstCombiner.h:491

llvm::InstCombiner::SubOne
static Constant * SubOne(Constant *C)
Subtract one from a Constant.
Definition InstCombiner.h:183

llvm::InstCombiner::computeOverflowForUnsignedSub
OverflowResult computeOverflowForUnsignedSub(const Value *LHS, const Value *RHS, const Instruction *CxtI) const
Definition InstCombiner.h:498

llvm::InstCombiner::isCanonicalPredicate
static bool isCanonicalPredicate(CmpPredicate Pred)
Predicate canonicalization reduces the number of patterns that need to be matched by other transforms...
Definition InstCombiner.h:160

llvm::InstCombiner::DL
const DataLayout & DL
Definition InstCombiner.h:76

llvm::InstCombiner::DC
DomConditionCache DC
Definition InstCombiner.h:82

llvm::InstCombiner::computeKnownBits
void computeKnownBits(const Value *V, KnownBits &Known, const Instruction *CxtI, unsigned Depth=0) const
Definition InstCombiner.h:433

llvm::InstCombiner::canFreelyInvertAllUsersOf
bool canFreelyInvertAllUsersOf(Instruction *V, Value *IgnoredUser)
Given i1 V, can every user of V be freely adapted if V is changed to !V ?
Definition InstCombiner.h:244

llvm::InstCombiner::addToWorklist
void addToWorklist(Instruction *I)
Definition InstCombiner.h:332

llvm::InstCombiner::replaceOperand
Instruction * replaceOperand(Instruction &I, unsigned OpNum, Value *V)
Replace operand of instruction and add old operand to the worklist.
Definition InstCombiner.h:412

llvm::InstCombiner::DT
DominatorTree & DT
Definition InstCombiner.h:75

llvm::InstCombiner::computeOverflowForSignedMul
OverflowResult computeOverflowForSignedMul(const Value *LHS, const Value *RHS, const Instruction *CxtI) const
Definition InstCombiner.h:476

llvm::InstCombiner::Builder
BuilderTy & Builder
Definition InstCombiner.h:61

llvm::InstCombiner::computeOverflowForUnsignedAdd
OverflowResult computeOverflowForUnsignedAdd(const WithCache< const Value * > &LHS, const WithCache< const Value * > &RHS, const Instruction *CxtI) const
Definition InstCombiner.h:483

llvm::InstCombiner::getFreelyInverted
Value * getFreelyInverted(Value *V, bool WillInvertAllUses, BuilderTy *Builder, bool &DoesConsume)
Definition InstCombiner.h:209

llvm::InstCombiner::getSimplifyQuery
const SimplifyQuery & getSimplifyQuery() const
Definition InstCombiner.h:338

llvm::InstCombiner::isKnownToBeAPowerOfTwo
bool isKnownToBeAPowerOfTwo(const Value *V, bool OrZero=false, const Instruction *CxtI=nullptr, unsigned Depth=0)
Definition InstCombiner.h:443

llvm::Instruction
Definition Instruction.h:69

llvm::Instruction::hasNoNaNs
LLVM_ABI bool hasNoNaNs() const LLVM_READONLY
Determine whether the no-NaNs flag is set.
Definition Instruction.cpp:648

llvm::Instruction::hasNoUnsignedWrap
LLVM_ABI bool hasNoUnsignedWrap() const LLVM_READONLY
Determine whether the no unsigned wrap flag is set.
Definition Instruction.cpp:411

llvm::Instruction::hasNoInfs
LLVM_ABI bool hasNoInfs() const LLVM_READONLY
Determine whether the no-infs flag is set.
Definition Instruction.cpp:653

llvm::Instruction::isArithmeticShift
bool isArithmeticShift() const
Return true if this is an arithmetic shift right.
Definition Instruction.h:361

llvm::Instruction::hasNoSignedWrap
LLVM_ABI bool hasNoSignedWrap() const LLVM_READONLY
Determine whether the no signed wrap flag is set.
Definition Instruction.cpp:418

llvm::Instruction::isCommutative
LLVM_ABI bool isCommutative() const LLVM_READONLY
Return true if the instruction is commutative:
Definition Instruction.cpp:1273

llvm::Instruction::isExact
LLVM_ABI bool isExact() const LLVM_READONLY
Determine whether the exact flag is set.
Definition Instruction.cpp:584

llvm::Instruction::getOpcode
unsigned getOpcode() const
Returns a member of one of the enums like Instruction::Add.
Definition Instruction.h:312

llvm::Instruction::BinaryOps
BinaryOps
Definition Instruction.h:998

llvm::Instruction::isShift
bool isShift() const
Definition Instruction.h:320

llvm::Instruction::CastOps
CastOps
Definition Instruction.h:1012

llvm::IntegerType::get
static LLVM_ABI IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition Type.cpp:319

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition IntrinsicInst.h:49

llvm::IntrinsicInst::getIntrinsicID
Intrinsic::ID getIntrinsicID() const
Return the intrinsic ID of this intrinsic.
Definition IntrinsicInst.h:56

llvm::LoadInst
An instruction for reading from memory.
Definition Instructions.h:180

llvm::LoadInst::isVolatile
bool isVolatile() const
Return true if this is a load from a volatile memory location.
Definition Instructions.h:209

llvm::MinMaxIntrinsic
This class represents min/max intrinsics.
Definition IntrinsicInst.h:764

llvm::Module
A Module instance is used to store all the information related to an LLVM module.
Definition Module.h:67

llvm::PHINode
Definition Instructions.h:2638

llvm::PHINode::addIncoming
void addIncoming(Value *V, BasicBlock *BB)
Add an incoming value to the end of the PHI list.
Definition Instructions.h:2773

llvm::PHINode::Create
static PHINode * Create(Type *Ty, unsigned NumReservedValues, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Constructors - NumReservedValues is a hint for the number of incoming edges that this phi node will h...
Definition Instructions.h:2673

llvm::SaturatingInst
Represents a saturating add/sub intrinsic.
Definition IntrinsicInst.h:951

llvm::SelectInst
This class represents the LLVM 'select' instruction.
Definition Instructions.h:1689

llvm::SelectInst::Create
static SelectInst * Create(Value *C, Value *S1, Value *S2, const Twine &NameStr="", InsertPosition InsertBefore=nullptr, Instruction *MDFrom=nullptr)
Definition Instructions.h:1714

llvm::SetVector
A vector that has set insertion semantics.
Definition SetVector.h:59

llvm::SetVector::size
size_type size() const
Determine the number of elements in the SetVector.
Definition SetVector.h:104

llvm::SetVector::insert
bool insert(const value_type &X)
Insert a new element into the SetVector.
Definition SetVector.h:168

llvm::SetVector::contains
bool contains(const key_type &key) const
Check if the SetVector contains the given key.
Definition SetVector.h:269

llvm::ShuffleVectorInst
This instruction constructs a fixed permutation of two input vectors.
Definition Instructions.h:1934

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition SmallVector.h:574

llvm::SmallVectorImpl::pop_back_val
T pop_back_val()
Definition SmallVector.h:674

llvm::SmallVectorImpl::emplace_back
reference emplace_back(ArgTypes &&... Args)
Definition SmallVector.h:938

llvm::SmallVectorTemplateBase::pop_back
void pop_back()
Definition SmallVector.h:426

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition SmallVector.h:414

llvm::SmallVectorTemplateCommon::rbegin
reverse_iterator rbegin()
Definition SmallVector.h:274

llvm::SmallVectorTemplateCommon::back
reference back()
Definition SmallVector.h:309

llvm::SmallVectorTemplateCommon::rend
reverse_iterator rend()
Definition SmallVector.h:276

llvm::SmallVectorTemplateCommon::empty
bool empty() const
Definition SmallVector.h:82

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition SmallVector.h:1197

llvm::TruncInst
This class represents a truncation of integer types.
Definition Instructions.h:4555

llvm::TruncInst::hasNoSignedWrap
bool hasNoSignedWrap() const
Test whether this operation is known to never undergo signed overflow, aka the nsw property.
Definition Instructions.h:4600

llvm::TruncInst::NoUnsignedWrap
@ NoUnsignedWrap
Definition Instructions.h:4564

llvm::TruncInst::NoSignedWrap
@ NoSignedWrap
Definition Instructions.h:4564

llvm::TruncInst::hasNoUnsignedWrap
bool hasNoUnsignedWrap() const
Test whether this operation is known to never undergo unsigned overflow, aka the nuw property.
Definition Instructions.h:4594

llvm::TypeSize
Definition TypeSize.h:332

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45

llvm::Type::isVectorTy
bool isVectorTy() const
True if this is an instance of VectorType.
Definition Type.h:273

llvm::Type::isIntOrIntVectorTy
bool isIntOrIntVectorTy() const
Return true if this is an integer type or a vector of integer types.
Definition Type.h:246

llvm::Type::isPointerTy
bool isPointerTy() const
True if this is an instance of PointerType.
Definition Type.h:267

llvm::Type::isPPC_FP128Ty
bool isPPC_FP128Ty() const
Return true if this is powerpc long double.
Definition Type.h:165

llvm::Type::getScalarType
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
Definition Type.h:352

llvm::Type::getPrimitiveSizeInBits
LLVM_ABI TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.
Definition Type.cpp:198

llvm::Type::getWithNewBitWidth
LLVM_ABI Type * getWithNewBitWidth(unsigned NewBitWidth) const
Given an integer or vector type, change the lane bitwidth to NewBitwidth, whilst keeping the old numb...
Definition DerivedTypes.h:764

llvm::Type::getContext
LLVMContext & getContext() const
Return the LLVMContext in which this type was uniqued.
Definition Type.h:128

llvm::Type::getScalarSizeInBits
LLVM_ABI unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.
Definition Type.cpp:231

llvm::Type::getInt1Ty
static LLVM_ABI IntegerType * getInt1Ty(LLVMContext &C)
Definition Type.cpp:294

llvm::Type::getFPMantissaWidth
LLVM_ABI int getFPMantissaWidth() const
Return the width of the mantissa of this type.
Definition Type.cpp:236

llvm::Type::getFltSemantics
LLVM_ABI const fltSemantics & getFltSemantics() const
Definition Type.cpp:107

llvm::Use
A Use represents the edge between a Value definition and its users.
Definition Use.h:35

llvm::User
Definition User.h:44

llvm::User::setOperand
void setOperand(unsigned i, Value *Val)
Definition User.h:237

llvm::User::getOperand
Value * getOperand(unsigned i) const
Definition User.h:232

llvm::User::getNumOperands
unsigned getNumOperands() const
Definition User.h:254

llvm::Value
LLVM Value Representation.
Definition Value.h:75

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:256

llvm::Value::hasOneUse
bool hasOneUse() const
Return true if there is exactly one use of this value.
Definition Value.h:439

llvm::Value::users
iterator_range< user_iterator > users()
Definition Value.h:426

llvm::Value::hasNUsesOrMore
LLVM_ABI bool hasNUsesOrMore(unsigned N) const
Return true if this value has N uses or more.
Definition Value.cpp:158

llvm::Value::stripAndAccumulateConstantOffsets
LLVM_ABI const Value * stripAndAccumulateConstantOffsets(const DataLayout &DL, APInt &Offset, bool AllowNonInbounds, bool AllowInvariantGroup=false, function_ref< bool(Value &Value, APInt &Offset)> ExternalAnalysis=nullptr, bool LookThroughIntToPtr=false) const
Accumulate the constant offset this value has compared to a base pointer.

llvm::Value::stripPointerCasts
LLVM_ABI const Value * stripPointerCasts() const
Strip off pointer casts, all-zero GEPs and address space casts.
Definition Value.cpp:701

llvm::Value::getContext
LLVM_ABI LLVMContext & getContext() const
All values hold a context through their type.
Definition Value.cpp:1101

llvm::Value::uses
iterator_range< use_iterator > uses()
Definition Value.h:380

llvm::Value::getName
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
Definition Value.cpp:322

llvm::Value::takeName
LLVM_ABI void takeName(Value *V)
Transfer the name from V to this value.
Definition Value.cpp:396

llvm::VectorType::get
static LLVM_ABI VectorType * get(Type *ElementType, ElementCount EC)
This static method is the primary way to construct an VectorType.

llvm::details::FixedOrScalableQuantity::getFixedValue
constexpr ScalarTy getFixedValue() const
Definition TypeSize.h:200

llvm::details::FixedOrScalableQuantity::isScalable
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
Definition TypeSize.h:169

llvm::ilist_detail::node_parent_access::getParent
const ParentTy * getParent() const
Definition ilist_node.h:34

uint32_t

uint64_t

unsigned

Call
CallInst * Call
Definition ObjCARCOpts.cpp:2360

Changed
Changed
Definition ObjCARCOpts.cpp:2370

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition ErrorHandling.h:164

llvm::APIntOps::RoundingUDiv
LLVM_ABI APInt RoundingUDiv(const APInt &A, const APInt &B, APInt::Rounding RM)
Return A unsign-divided by B, rounded by the given rounding mode.
Definition APInt.cpp:2763

llvm::APIntOps::RoundingSDiv
LLVM_ABI APInt RoundingSDiv(const APInt &A, const APInt &B, APInt::Rounding RM)
Return A sign-divided by B, rounded by the given rounding mode.
Definition APInt.cpp:2781

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34

llvm::Intrinsic::getOrInsertDeclaration
LLVM_ABI Function * getOrInsertDeclaration(Module *M, ID id, ArrayRef< Type * > Tys={})
Look up the Function declaration of the intrinsic id in the Module M.
Definition Intrinsics.cpp:751

llvm::MIPatternMatch::m_ZeroInt
SpecificConstantMatch m_ZeroInt()
Convenience matchers for specific integer values.
Definition MIPatternMatch.h:277

llvm::MIPatternMatch::m_Neg
BinaryOp_match< SpecificConstantMatch, SrcTy, TargetOpcode::G_SUB > m_Neg(const SrcTy &&Src)
Matches a register negated by a G_SUB.
Definition MIPatternMatch.h:928

llvm::MIPatternMatch::m_Not
BinaryOp_match< SrcTy, SpecificConstantMatch, TargetOpcode::G_XOR, true > m_Not(const SrcTy &&Src)
Matches a register not-ed by a G_XOR.
Definition MIPatternMatch.h:936

llvm::MIPatternMatch::m_OneUse
OneUse_match< SubPat > m_OneUse(const SubPat &SP)
Definition MIPatternMatch.h:56

llvm::PatternMatch
Definition PatternMatch.h:47

llvm::PatternMatch::m_AllOnes
cst_pred_ty< is_all_ones > m_AllOnes()
Match an integer or vector with all bits set.
Definition PatternMatch.h:524

llvm::PatternMatch::m_LowBitMask
cst_pred_ty< is_lowbit_mask > m_LowBitMask()
Match an integer or vector with only the low bit(s) set.
Definition PatternMatch.h:673

llvm::PatternMatch::m_And
BinaryOp_match< LHS, RHS, Instruction::And > m_And(const LHS &L, const RHS &R)
Definition PatternMatch.h:1296

llvm::PatternMatch::m_Negative
cst_pred_ty< is_negative > m_Negative()
Match an integer or vector of negative values.
Definition PatternMatch.h:550

llvm::PatternMatch::m_Add
BinaryOp_match< LHS, RHS, Instruction::Add > m_Add(const LHS &L, const RHS &R)
Definition PatternMatch.h:1182

llvm::PatternMatch::m_BinOp
class_match< BinaryOperator > m_BinOp()
Match an arbitrary binary operation and ignore it.
Definition PatternMatch.h:100

llvm::PatternMatch::m_SignMask
cst_pred_ty< is_sign_mask > m_SignMask()
Match an integer or vector with only the sign bit(s) set.
Definition PatternMatch.h:664

llvm::PatternMatch::m_NUWAdd
OverflowingBinaryOp_match< LHS, RHS, Instruction::Add, OverflowingBinaryOperator::NoUnsignedWrap > m_NUWAdd(const LHS &L, const RHS &R)
Definition PatternMatch.h:1441

llvm::PatternMatch::m_AShr
BinaryOp_match< LHS, RHS, Instruction::AShr > m_AShr(const LHS &L, const RHS &R)
Definition PatternMatch.h:1326

llvm::PatternMatch::m_Power2
cst_pred_ty< is_power2 > m_Power2()
Match an integer or vector power-of-2.
Definition PatternMatch.h:619

llvm::PatternMatch::m_URem
BinaryOp_match< LHS, RHS, Instruction::URem > m_URem(const LHS &L, const RHS &R)
Definition PatternMatch.h:1278

llvm::PatternMatch::m_TruncOrSelf
match_combine_or< CastInst_match< OpTy, TruncInst >, OpTy > m_TruncOrSelf(const OpTy &Op)
Definition PatternMatch.h:2231

llvm::PatternMatch::m_Constant
class_match< Constant > m_Constant()
Match an arbitrary Constant and ignore it.
Definition PatternMatch.h:165

llvm::PatternMatch::m_c_And
BinaryOp_match< LHS, RHS, Instruction::And, true > m_c_And(const LHS &L, const RHS &R)
Matches an And with LHS and RHS in either order.
Definition PatternMatch.h:2966

llvm::PatternMatch::m_Trunc
CastInst_match< OpTy, TruncInst > m_Trunc(const OpTy &Op)
Matches Trunc.
Definition PatternMatch.h:2211

llvm::PatternMatch::m_Xor
BinaryOp_match< LHS, RHS, Instruction::Xor > m_Xor(const LHS &L, const RHS &R)
Definition PatternMatch.h:1308

llvm::PatternMatch::m_SpecificInt
specific_intval< false > m_SpecificInt(const APInt &V)
Match a specific integer value or vector with all elements equal to the value.
Definition PatternMatch.h:1060

llvm::PatternMatch::m_ZExtOrSelf
match_combine_or< CastInst_match< OpTy, ZExtInst >, OpTy > m_ZExtOrSelf(const OpTy &Op)
Definition PatternMatch.h:2254

llvm::PatternMatch::match
bool match(Val *V, const Pattern &P)
Definition PatternMatch.h:49

llvm::PatternMatch::m_IDiv
BinOpPred_match< LHS, RHS, is_idiv_op > m_IDiv(const LHS &L, const RHS &R)
Matches integer division operations.
Definition PatternMatch.h:1680

llvm::PatternMatch::m_Instruction
bind_ty< Instruction > m_Instruction(Instruction *&I)
Match an instruction, capturing it if we match.
Definition PatternMatch.h:862

llvm::PatternMatch::m_AnyZeroFP
cstfp_pred_ty< is_any_zero_fp > m_AnyZeroFP()
Match a floating-point negative zero or positive zero.
Definition PatternMatch.h:766

llvm::PatternMatch::m_Specific
specificval_ty m_Specific(const Value *V)
Match if we have a specific specified value.
Definition PatternMatch.h:962

llvm::PatternMatch::m_Shr
BinOpPred_match< LHS, RHS, is_right_shift_op > m_Shr(const LHS &L, const RHS &R)
Matches logical shift operations.
Definition PatternMatch.h:1652

llvm::PatternMatch::m_SpecificIntAllowPoison
specific_intval< true > m_SpecificIntAllowPoison(const APInt &V)
Definition PatternMatch.h:1068

llvm::PatternMatch::m_c_ICmp
CmpClass_match< LHS, RHS, ICmpInst, true > m_c_ICmp(CmpPredicate &Pred, const LHS &L, const RHS &R)
Matches an ICmp with a predicate over LHS and RHS in either order.
Definition PatternMatch.h:2933

llvm::PatternMatch::m_NSWNeg
OverflowingBinaryOp_match< cst_pred_ty< is_zero_int >, ValTy, Instruction::Sub, OverflowingBinaryOperator::NoSignedWrap > m_NSWNeg(const ValTy &V)
Matches a 'Neg' as 'sub nsw 0, V'.
Definition PatternMatch.h:2997

llvm::PatternMatch::m_NonNegative
cst_pred_ty< is_nonnegative > m_NonNegative()
Match an integer or vector of non-negative values.
Definition PatternMatch.h:560

llvm::PatternMatch::m_ConstantInt
class_match< ConstantInt > m_ConstantInt()
Match an arbitrary ConstantInt and ignore it.
Definition PatternMatch.h:168

llvm::PatternMatch::m_One
cst_pred_ty< is_one > m_One()
Match an integer 1 or a vector with all elements equal to 1.
Definition PatternMatch.h:592

llvm::PatternMatch::m_Intrinsic
IntrinsicID_match m_Intrinsic()
Match intrinsic calls like this: m_Intrinsic<Intrinsic::fabs>(m_Value(X))
Definition PatternMatch.h:2772

llvm::PatternMatch::m_Select
ThreeOps_match< Cond, LHS, RHS, Instruction::Select > m_Select(const Cond &C, const LHS &L, const RHS &R)
Matches SelectInst.
Definition PatternMatch.h:1928

llvm::PatternMatch::m_ExtractValue
ExtractValue_match< Ind, Val_t > m_ExtractValue(const Val_t &V)
Match a single index ExtractValue instruction.
Definition PatternMatch.h:3118

llvm::PatternMatch::m_LogicalShift
BinOpPred_match< LHS, RHS, is_logical_shift_op > m_LogicalShift(const LHS &L, const RHS &R)
Matches logical shift operations.
Definition PatternMatch.h:1660

llvm::PatternMatch::m_CombineAnd
match_combine_and< LTy, RTy > m_CombineAnd(const LTy &L, const RTy &R)
Combine two pattern matchers matching L && R.
Definition PatternMatch.h:245

llvm::PatternMatch::m_SMin
MaxMin_match< ICmpInst, LHS, RHS, smin_pred_ty > m_SMin(const LHS &L, const RHS &R)
Definition PatternMatch.h:2492

llvm::PatternMatch::m_Sqrt
m_Intrinsic_Ty< Opnd0 >::Ty m_Sqrt(const Opnd0 &Op0)
Definition PatternMatch.h:2904

llvm::PatternMatch::m_c_Xor
BinaryOp_match< LHS, RHS, Instruction::Xor, true > m_c_Xor(const LHS &L, const RHS &R)
Matches an Xor with LHS and RHS in either order.
Definition PatternMatch.h:2980

llvm::PatternMatch::m_FAdd
BinaryOp_match< LHS, RHS, Instruction::FAdd > m_FAdd(const LHS &L, const RHS &R)
Definition PatternMatch.h:1188

llvm::PatternMatch::m_Mul
BinaryOp_match< LHS, RHS, Instruction::Mul > m_Mul(const LHS &L, const RHS &R)
Definition PatternMatch.h:1248

llvm::PatternMatch::m_Deferred
deferredval_ty< Value > m_Deferred(Value *const &V)
Like m_Specific(), but works if the specific value to match is determined as part of the same match()...
Definition PatternMatch.h:980

llvm::PatternMatch::m_APIntAllowPoison
apint_match m_APIntAllowPoison(const APInt *&Res)
Match APInt while allowing poison in splat vector constants.
Definition PatternMatch.h:305

llvm::PatternMatch::m_NSWTrunc
NoWrapTrunc_match< OpTy, TruncInst::NoSignedWrap > m_NSWTrunc(const OpTy &Op)
Matches trunc nsw.
Definition PatternMatch.h:2225

llvm::PatternMatch::m_Shuffle
TwoOps_match< V1_t, V2_t, Instruction::ShuffleVector > m_Shuffle(const V1_t &v1, const V2_t &v2)
Matches ShuffleVectorInst independently of mask value.
Definition PatternMatch.h:2040

llvm::PatternMatch::m_c_Select
ThreeOps_match< decltype(m_Value()), LHS, RHS, Instruction::Select, true > m_c_Select(const LHS &L, const RHS &R)
Match Select(C, LHS, RHS) or Select(C, RHS, LHS)
Definition PatternMatch.h:1944

llvm::PatternMatch::m_FPExt
CastInst_match< OpTy, FPExtInst > m_FPExt(const OpTy &Op)
Definition PatternMatch.h:2320

llvm::PatternMatch::m_ZExt
CastInst_match< OpTy, ZExtInst > m_ZExt(const OpTy &Op)
Matches ZExt.
Definition PatternMatch.h:2243

llvm::PatternMatch::m_NUWShl
OverflowingBinaryOp_match< LHS, RHS, Instruction::Shl, OverflowingBinaryOperator::NoUnsignedWrap > m_NUWShl(const LHS &L, const RHS &R)
Definition PatternMatch.h:1475

llvm::PatternMatch::m_NUWMul
OverflowingBinaryOp_match< LHS, RHS, Instruction::Mul, OverflowingBinaryOperator::NoUnsignedWrap > m_NUWMul(const LHS &L, const RHS &R)
Definition PatternMatch.h:1467

llvm::PatternMatch::m_UDiv
BinaryOp_match< LHS, RHS, Instruction::UDiv > m_UDiv(const LHS &L, const RHS &R)
Definition PatternMatch.h:1260

llvm::PatternMatch::m_ImmConstant
match_immconstant_ty m_ImmConstant()
Match an arbitrary immediate Constant and ignore it.
Definition PatternMatch.h:931

llvm::PatternMatch::m_NegatedPower2OrZero
cst_pred_ty< is_negated_power2_or_zero > m_NegatedPower2OrZero()
Match a integer or vector negated power-of-2.
Definition PatternMatch.h:639

llvm::PatternMatch::m_NUWTrunc
NoWrapTrunc_match< OpTy, TruncInst::NoUnsignedWrap > m_NUWTrunc(const OpTy &Op)
Matches trunc nuw.
Definition PatternMatch.h:2218

llvm::PatternMatch::m_CheckedInt
cst_pred_ty< custom_checkfn< APInt > > m_CheckedInt(function_ref< bool(const APInt &)> CheckFn)
Match an integer or vector where CheckFn(ele) for each element is true.
Definition PatternMatch.h:481

llvm::PatternMatch::m_LowBitMaskOrZero
cst_pred_ty< is_lowbit_mask_or_zero > m_LowBitMaskOrZero()
Match an integer or vector with only the low bit(s) set.
Definition PatternMatch.h:683

llvm::PatternMatch::m_c_Add
BinaryOp_match< LHS, RHS, Instruction::Add, true > m_c_Add(const LHS &L, const RHS &R)
Matches a Add with LHS and RHS in either order.
Definition PatternMatch.h:2952

llvm::PatternMatch::m_AddLike
match_combine_or< BinaryOp_match< LHS, RHS, Instruction::Add >, DisjointOr_match< LHS, RHS > > m_AddLike(const LHS &L, const RHS &R)
Match either "add" or "or disjoint".
Definition PatternMatch.h:1536

llvm::PatternMatch::m_UIToFP
CastInst_match< OpTy, UIToFPInst > m_UIToFP(const OpTy &Op)
Definition PatternMatch.h:2295

llvm::PatternMatch::m_BitCast
CastOperator_match< OpTy, Instruction::BitCast > m_BitCast(const OpTy &Op)
Matches BitCast.
Definition PatternMatch.h:2150

llvm::PatternMatch::m_SDiv
BinaryOp_match< LHS, RHS, Instruction::SDiv > m_SDiv(const LHS &L, const RHS &R)
Definition PatternMatch.h:1266

llvm::PatternMatch::m_APInt
apint_match m_APInt(const APInt *&Res)
Match a ConstantInt or splatted ConstantVector, binding the specified pointer to the contained APInt.
Definition PatternMatch.h:299

llvm::PatternMatch::m_Value
class_match< Value > m_Value()
Match an arbitrary value and ignore it.
Definition PatternMatch.h:92

llvm::PatternMatch::m_Signum
Signum_match< Val_t > m_Signum(const Val_t &V)
Matches a signum pattern.
Definition PatternMatch.h:3095

llvm::PatternMatch::m_SIToFP
CastInst_match< OpTy, SIToFPInst > m_SIToFP(const OpTy &Op)
Definition PatternMatch.h:2300

llvm::PatternMatch::m_LShr
BinaryOp_match< LHS, RHS, Instruction::LShr > m_LShr(const LHS &L, const RHS &R)
Definition PatternMatch.h:1320

llvm::PatternMatch::m_ICmp
CmpClass_match< LHS, RHS, ICmpInst > m_ICmp(CmpPredicate &Pred, const LHS &L, const RHS &R)
Definition PatternMatch.h:1754

llvm::PatternMatch::m_ZExtOrSExt
match_combine_or< CastInst_match< OpTy, ZExtInst >, CastInst_match< OpTy, SExtInst > > m_ZExtOrSExt(const OpTy &Op)
Definition PatternMatch.h:2274

llvm::PatternMatch::m_FNeg
FNeg_match< OpTy > m_FNeg(const OpTy &X)
Match 'fneg X' as 'fsub -0.0, X'.
Definition PatternMatch.h:1236

llvm::PatternMatch::m_PosZeroFP
cstfp_pred_ty< is_pos_zero_fp > m_PosZeroFP()
Match a floating-point positive zero.
Definition PatternMatch.h:775

llvm::PatternMatch::m_Shl
BinaryOp_match< LHS, RHS, Instruction::Shl > m_Shl(const LHS &L, const RHS &R)
Definition PatternMatch.h:1314

llvm::PatternMatch::m_UAddWithOverflow
UAddWithOverflow_match< LHS_t, RHS_t, Sum_t > m_UAddWithOverflow(const LHS_t &L, const RHS_t &R, const Sum_t &S)
Match an icmp instruction checking for unsigned overflow on addition.
Definition PatternMatch.h:2692

llvm::PatternMatch::m_VecReverse
m_Intrinsic_Ty< Opnd0 >::Ty m_VecReverse(const Opnd0 &Op0)
Definition PatternMatch.h:2915

llvm::PatternMatch::m_IRem
BinOpPred_match< LHS, RHS, is_irem_op > m_IRem(const LHS &L, const RHS &R)
Matches integer remainder operations.
Definition PatternMatch.h:1687

llvm::PatternMatch::m_APFloat
apfloat_match m_APFloat(const APFloat *&Res)
Match a ConstantFP or splatted ConstantVector, binding the specified pointer to the contained APFloat...
Definition PatternMatch.h:316

llvm::PatternMatch::m_MaxOrMin
match_combine_or< match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, smax_pred_ty >, MaxMin_match< ICmpInst, LHS, RHS, smin_pred_ty > >, match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, umax_pred_ty >, MaxMin_match< ICmpInst, LHS, RHS, umin_pred_ty > > > m_MaxOrMin(const LHS &L, const RHS &R)
Definition PatternMatch.h:2515

llvm::PatternMatch::m_FPTrunc
CastInst_match< OpTy, FPTruncInst > m_FPTrunc(const OpTy &Op)
Definition PatternMatch.h:2315

llvm::PatternMatch::m_Undef
auto m_Undef()
Match an arbitrary undef constant.
Definition PatternMatch.h:152

llvm::PatternMatch::m_Or
BinaryOp_match< LHS, RHS, Instruction::Or > m_Or(const LHS &L, const RHS &R)
Definition PatternMatch.h:1302

llvm::PatternMatch::m_SExt
CastInst_match< OpTy, SExtInst > m_SExt(const OpTy &Op)
Matches SExt.
Definition PatternMatch.h:2237

llvm::PatternMatch::m_Zero
is_zero m_Zero()
Match any null constant or a vector with all elements equal to 0.
Definition PatternMatch.h:612

llvm::PatternMatch::m_c_Or
BinaryOp_match< LHS, RHS, Instruction::Or, true > m_c_Or(const LHS &L, const RHS &R)
Matches an Or with LHS and RHS in either order.
Definition PatternMatch.h:2973

llvm::PatternMatch::m_ElementWiseBitCast
ElementWiseBitCast_match< OpTy > m_ElementWiseBitCast(const OpTy &Op)
Definition PatternMatch.h:2178

llvm::PatternMatch::m_FAbs
m_Intrinsic_Ty< Opnd0 >::Ty m_FAbs(const Opnd0 &Op0)
Definition PatternMatch.h:2846

llvm::PatternMatch::m_c_Mul
BinaryOp_match< LHS, RHS, Instruction::Mul, true > m_c_Mul(const LHS &L, const RHS &R)
Matches a Mul with LHS and RHS in either order.
Definition PatternMatch.h:2959

llvm::PatternMatch::m_PtrToInt
CastOperator_match< OpTy, Instruction::PtrToInt > m_PtrToInt(const OpTy &Op)
Matches PtrToInt.
Definition PatternMatch.h:2185

llvm::PatternMatch::m_Sub
BinaryOp_match< LHS, RHS, Instruction::Sub > m_Sub(const LHS &L, const RHS &R)
Definition PatternMatch.h:1194

llvm::PatternMatch::m_Unless
match_unless< Ty > m_Unless(const Ty &M)
Match if the inner matcher does NOT match.
Definition PatternMatch.h:203

llvm::PatternMatch::m_CombineOr
match_combine_or< LTy, RTy > m_CombineOr(const LTy &L, const RTy &R)
Combine two pattern matchers matching L || R.
Definition PatternMatch.h:239

llvm::PatternMatch::m_SpecificInt_ICMP
cst_pred_ty< icmp_pred_with_threshold > m_SpecificInt_ICMP(ICmpInst::Predicate Predicate, const APInt &Threshold)
Match an integer or vector with every element comparing 'pred' (eg/ne/...) to Threshold.
Definition PatternMatch.h:700

llvm::SI
Definition SIInstrInfo.h:1716

llvm::sampleprof::Base
@ Base
Definition Discriminator.h:58

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition AddressRanges.h:18

llvm::Offset
@ Offset
Definition DWP.cpp:477

llvm::zip
detail::zippy< detail::zip_shortest, T, U, Args... > zip(T &&t, U &&u, Args &&...args)
zip iterator for two or more iteratable types.
Definition STLExtras.h:843

llvm::OverflowResult
OverflowResult
Definition ValueTracking.h:616

llvm::OverflowResult::NeverOverflows
@ NeverOverflows
Never overflows.
Definition ValueTracking.h:624

llvm::OverflowResult::AlwaysOverflowsHigh
@ AlwaysOverflowsHigh
Always overflows in the direction of signed/unsigned max value.
Definition ValueTracking.h:620

llvm::OverflowResult::AlwaysOverflowsLow
@ AlwaysOverflowsLow
Always overflows in the direction of signed/unsigned min value.
Definition ValueTracking.h:618

llvm::OverflowResult::MayOverflow
@ MayOverflow
May or may not overflow.
Definition ValueTracking.h:622

llvm::all_of
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1727

llvm::isKnownNeverInfinity
LLVM_ABI bool isKnownNeverInfinity(const Value *V, const SimplifyQuery &SQ, unsigned Depth=0)
Return true if the floating-point scalar value is not an infinity or if the floating-point vector val...
Definition ValueTracking.cpp:5960

llvm::isSignBitCheck
LLVM_ABI bool isSignBitCheck(ICmpInst::Predicate Pred, const APInt &RHS, bool &TrueIfSigned)
Given an exploded icmp instruction, return true if the comparison only checks the sign bit.
Definition ValueTracking.cpp:4556

llvm::Depth
@ Depth
Definition SIMachineScheduler.h:36

llvm::LoopIdiomVectorizeStyle::Masked
@ Masked
Definition LoopIdiomVectorize.h:16

llvm::dyn_cast
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:649

llvm::stripNullTest
LLVM_ABI Value * stripNullTest(Value *V)
Returns the inner value X if the expression has the form f(X) where f(X) == 0 if and only if X == 0,...
Definition ValueTracking.cpp:10271

llvm::ConstantFoldCompareInstOperands
LLVM_ABI Constant * ConstantFoldCompareInstOperands(unsigned Predicate, Constant *LHS, Constant *RHS, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, const Instruction *I=nullptr)
Attempt to constant fold a compare instruction (icmp/fcmp) with the specified operands.
Definition ConstantFolding.cpp:1198

llvm::make_early_inc_range
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
Definition STLExtras.h:646

llvm::simplifyFCmpInst
LLVM_ABI Value * simplifyFCmpInst(CmpPredicate Predicate, Value *LHS, Value *RHS, FastMathFlags FMF, const SimplifyQuery &Q)
Given operands for an FCmpInst, fold the result or return null.
Definition InstructionSimplify.cpp:4289

llvm::ilogb
int ilogb(const APFloat &Arg)
Returns the exponent of the internal representation of the APFloat.
Definition APFloat.h:1534

llvm::computeConstantRange
LLVM_ABI ConstantRange computeConstantRange(const Value *V, bool ForSigned, bool UseInstrInfo=true, AssumptionCache *AC=nullptr, const Instruction *CtxI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Determine the possible constant range of an integer or vector of integer value.
Definition ValueTracking.cpp:10032

llvm::MaskedValueIsZero
LLVM_ABI bool MaskedValueIsZero(const Value *V, const APInt &Mask, const SimplifyQuery &SQ, unsigned Depth=0)
Return true if 'V & Mask' is known to be zero.
Definition ValueTracking.cpp:315

llvm::simplifyAddInst
LLVM_ABI Value * simplifyAddInst(Value *LHS, Value *RHS, bool IsNSW, bool IsNUW, const SimplifyQuery &Q)
Given operands for an Add, fold the result or return null.
Definition InstructionSimplify.cpp:659

llvm::ConstantFoldConstant
LLVM_ABI Constant * ConstantFoldConstant(const Constant *C, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr)
ConstantFoldConstant - Fold the constant using the specified DataLayout.
Definition ConstantFolding.cpp:1183

llvm::dyn_cast_or_null
auto dyn_cast_or_null(const Y &Val)
Definition Casting.h:759

llvm::isSplatValue
LLVM_ABI bool isSplatValue(const Value *V, int Index=-1, unsigned Depth=0)
Return true if each element of the vector value V is poisoned or equal to every other non-poisoned el...
Definition VectorUtils.cpp:406

llvm::Log2_32
unsigned Log2_32(uint32_t Value)
Return the floor log base 2 of the specified value, -1 if the value is zero.
Definition MathExtras.h:336

llvm::countl_zero
int countl_zero(T Val)
Count number of 0's from the most significant bit to the least stopping at the first 1.
Definition bit.h:203

llvm::emitGEPOffset
LLVM_ABI Value * emitGEPOffset(IRBuilderBase *Builder, const DataLayout &DL, User *GEP, bool NoAssumptions=false)
Given a getelementptr instruction/constantexpr, emit the code necessary to compute the offset from th...
Definition Local.cpp:22

llvm::MaxAnalysisRecursionDepth
constexpr unsigned MaxAnalysisRecursionDepth
Definition ValueTracking.h:47

llvm::ConstantFoldUnaryOpOperand
LLVM_ABI Constant * ConstantFoldUnaryOpOperand(unsigned Opcode, Constant *Op, const DataLayout &DL)
Attempt to constant fold a unary operation with the specified operand.
Definition ConstantFolding.cpp:1310

llvm::HexPrintStyle::Upper
@ Upper
Definition NativeFormatting.h:23

llvm::HexPrintStyle::Lower
@ Lower
Definition NativeFormatting.h:23

llvm::isKnownNegative
LLVM_ABI bool isKnownNegative(const Value *V, const SimplifyQuery &SQ, unsigned Depth=0)
Returns true if the given value is known be negative (i.e.
Definition ValueTracking.cpp:295

llvm::SelectPatternFlavor
SelectPatternFlavor
Specific patterns of select instructions we can match.
Definition ValueTracking.h:828

llvm::SPF_UNKNOWN
@ SPF_UNKNOWN
Definition ValueTracking.h:829

llvm::impliesPoison
LLVM_ABI bool impliesPoison(const Value *ValAssumedPoison, const Value *V)
Return true if V is poison given that ValAssumedPoison is already poison.
Definition ValueTracking.cpp:7577

llvm::decomposeLinearExpression
LLVM_ABI LinearExpression decomposeLinearExpression(const DataLayout &DL, Value *Ptr)
Decompose a pointer into a linear expression.
Definition Loads.cpp:881

llvm::isFinite
LLVM_ABI bool isFinite(const Loop *L)
Return true if this loop can be assumed to run for a finite number of iterations.
Definition LoopInfo.cpp:1164

llvm::FPClassTest
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
Definition FloatingPointMode.h:240

llvm::fcInf
@ fcInf
Definition FloatingPointMode.h:255

llvm::fcSubnormal
@ fcSubnormal
Definition FloatingPointMode.h:257

llvm::fcZero
@ fcZero
Definition FloatingPointMode.h:258

llvm::fcAllFlags
@ fcAllFlags
Definition FloatingPointMode.h:265

llvm::fcNan
@ fcNan
Definition FloatingPointMode.h:254

llvm::scalbn
APFloat scalbn(APFloat X, int Exp, APFloat::roundingMode RM)
Returns: X * 2^Exp for integral exponents.
Definition APFloat.h:1543

llvm::computeKnownBits
LLVM_ABI void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOn...
Definition ValueTracking.cpp:148

llvm::matchSelectPattern
LLVM_ABI SelectPatternResult matchSelectPattern(Value *V, Value *&LHS, Value *&RHS, Instruction::CastOps *CastOp=nullptr, unsigned Depth=0)
Pattern match integer [SU]MIN, [SU]MAX and ABS idioms, returning the kind and providing the out param...
Definition ValueTracking.cpp:8966

llvm::NullPointerIsDefined
LLVM_ABI bool NullPointerIsDefined(const Function *F, unsigned AS=0)
Check whether null pointer dereferencing is considered undefined behavior for a given function or an ...
Definition Function.cpp:1172

llvm::none_of
bool none_of(R &&Range, UnaryPredicate P)
Provide wrappers to std::none_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1741

llvm::simplifyICmpInst
LLVM_ABI Value * simplifyICmpInst(CmpPredicate Pred, Value *LHS, Value *RHS, const SimplifyQuery &Q)
Given operands for an ICmpInst, fold the result or return null.
Definition InstructionSimplify.cpp:4057

llvm::ConstantFoldCastOperand
LLVM_ABI Constant * ConstantFoldCastOperand(unsigned Opcode, Constant *C, Type *DestTy, const DataLayout &DL)
Attempt to constant fold a cast with the specified operand.
Definition ConstantFolding.cpp:1482

llvm::CodeGenOptLevel::Less
@ Less
-O1
Definition CodeGen.h:84

llvm::ConstantFoldLoadFromConst
LLVM_ABI Constant * ConstantFoldLoadFromConst(Constant *C, Type *Ty, const APInt &Offset, const DataLayout &DL)
Extract value of C at the given Offset reinterpreted as Ty.
Definition ConstantFolding.cpp:713

llvm::isa
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:548

llvm::ConstantFoldBinaryOpOperands
LLVM_ABI Constant * ConstantFoldBinaryOpOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL)
Attempt to constant fold a binary operation with the specified operands.
Definition ConstantFolding.cpp:1317

llvm::isKnownNonZero
LLVM_ABI bool isKnownNonZero(const Value *V, const SimplifyQuery &Q, unsigned Depth=0)
Return true if the given value is known to be non-zero when defined.
Definition ValueTracking.cpp:3563

llvm::divideCeil
constexpr T divideCeil(U Numerator, V Denominator)
Returns the integer ceil(Numerator / Denominator).
Definition MathExtras.h:399

llvm::IRMemLocation::Other
@ Other
Any other memory.
Definition ModRef.h:68

llvm::IRMemLocation::First
@ First
Helpers to iterate all locations in the MemoryEffectsBase class.
Definition ModRef.h:71

llvm::simplifyBinOp
LLVM_ABI Value * simplifyBinOp(unsigned Opcode, Value *LHS, Value *RHS, const SimplifyQuery &Q)
Given operands for a BinaryOperator, fold the result or return null.
Definition InstructionSimplify.cpp:6132

llvm::RecurKind::UMin
@ UMin
Unsigned integer min implemented in terms of select(cmp()).
Definition IVDescriptors.h:46

llvm::RecurKind::Mul
@ Mul
Product of integers.
Definition IVDescriptors.h:40

llvm::RecurKind::Xor
@ Xor
Bitwise or logical XOR of integers.
Definition IVDescriptors.h:43

llvm::RecurKind::SMax
@ SMax
Signed integer max implemented in terms of select(cmp()).
Definition IVDescriptors.h:45

llvm::RecurKind::SMin
@ SMin
Signed integer min implemented in terms of select(cmp()).
Definition IVDescriptors.h:44

llvm::RecurKind::Sub
@ Sub
Subtraction of integers.
Definition IVDescriptors.h:38

llvm::RecurKind::Add
@ Add
Sum of integers.
Definition IVDescriptors.h:37

llvm::RecurKind::UMax
@ UMax
Unsigned integer max implemented in terms of select(cmp()).
Definition IVDescriptors.h:47

llvm::isKnownNonEqual
LLVM_ABI bool isKnownNonEqual(const Value *V1, const Value *V2, const SimplifyQuery &SQ, unsigned Depth=0)
Return true if the given values are known to be non-equal when defined.
Definition ValueTracking.cpp:304

llvm::Op
DWARFExpression::Operation Op
Definition DWARFExpressionPrinter.cpp:22

llvm::PointerMayBeCaptured
LLVM_ABI bool PointerMayBeCaptured(const Value *V, bool ReturnCaptures, unsigned MaxUsesToExplore=0)
PointerMayBeCaptured - Return true if this pointer value may be captured by the enclosing function (w...
Definition CaptureTracking.cpp:213

llvm::BitWidth
constexpr unsigned BitWidth
Definition BitmaskEnum.h:223

llvm::getLosslessInvCast
LLVM_ABI Constant * getLosslessInvCast(Constant *C, Type *InvCastTo, unsigned CastOp, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
Try to cast C to InvC losslessly, satisfying CastOp(InvC) equals C, or CastOp(InvC) is a refined valu...
Definition ConstantFolding.cpp:4611

llvm::count_if
auto count_if(R &&Range, UnaryPredicate P)
Wrapper function around std::count_if to count the number of times an element satisfying a given pred...
Definition STLExtras.h:1963

llvm::cast
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:565

llvm::isKnownNeverNaN
LLVM_ABI bool isKnownNeverNaN(const Value *V, const SimplifyQuery &SQ, unsigned Depth=0)
Return true if the floating-point scalar value is not a NaN or if the floating-point vector value has...
Definition ValueTracking.cpp:5976

llvm::getFlippedStrictnessPredicateAndConstant
LLVM_ABI std::optional< std::pair< CmpPredicate, Constant * > > getFlippedStrictnessPredicateAndConstant(CmpPredicate Pred, Constant *C)
Convert an integer comparison with a constant RHS into an equivalent form with the strictness flipped...
Definition ValueTracking.cpp:8583

llvm::all_equal
bool all_equal(std::initializer_list< T > Values)
Returns true if all Values in the initializer lists are equal or the list.
Definition STLExtras.h:2110

llvm::isKnownToBeAPowerOfTwo
LLVM_ABI bool isKnownToBeAPowerOfTwo(const Value *V, const DataLayout &DL, bool OrZero=false, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Return true if the given value is known to have exactly one bit set when defined.
Definition ValueTracking.cpp:265

llvm::Continue
@ Continue
Definition DWP.h:22

llvm::getUnderlyingObject
LLVM_ABI const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=MaxLookupSearchDepth)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
Definition ValueTracking.cpp:6658

llvm::isKnownPositive
LLVM_ABI bool isKnownPositive(const Value *V, const SimplifyQuery &SQ, unsigned Depth=0)
Returns true if the given value is known be positive (i.e.
Definition ValueTracking.cpp:283

llvm::isKnownNonNegative
LLVM_ABI bool isKnownNonNegative(const Value *V, const SimplifyQuery &SQ, unsigned Depth=0)
Returns true if the give value is known to be non-negative.
Definition ValueTracking.cpp:278

llvm::fltNanEncoding::AllOnes
@ AllOnes
Definition APFloat.cpp:92

llvm::Invalid
@ Invalid
Definition PGOCtxProfWriter.h:24

llvm::isImpliedCondition
LLVM_ABI std::optional< bool > isImpliedCondition(const Value *LHS, const Value *RHS, const DataLayout &DL, bool LHSIsTrue=true, unsigned Depth=0)
Return true if RHS is known to be implied true by LHS.
Definition ValueTracking.cpp:9515

llvm::decomposeBitTestICmp
std::optional< DecomposedBitTest > decomposeBitTestICmp(Value *LHS, Value *RHS, CmpInst::Predicate Pred, bool LookThroughTrunc=true, bool AllowNonZeroC=false, bool DecomposeAnd=false)
Decompose an icmp into the form ((X & Mask) pred C) if possible.
Definition CmpInstAnalysis.cpp:77

std::swap
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition BitVector.h:853

NC
#define NC
Definition regutils.h:42

OffsetResult
Definition InstCombineCompares.cpp:5869

OffsetResult::Kind
OffsetKind Kind
Definition InstCombineCompares.cpp:5870

OffsetResult::V2
Value * V2
Definition InstCombineCompares.cpp:5871

OffsetResult::V1
Value * V1
Definition InstCombineCompares.cpp:5871

OffsetResult::materialize
Value * materialize(InstCombiner::BuilderTy &Builder) const
Definition InstCombineCompares.cpp:5883

OffsetResult::isValid
bool isValid() const
Definition InstCombineCompares.cpp:5882

OffsetResult::value
static OffsetResult value(Value *V)
Definition InstCombineCompares.cpp:5876

OffsetResult::select
static OffsetResult select(Value *Cond, Value *TrueV, Value *FalseV)
Definition InstCombineCompares.cpp:5879

OffsetResult::V0
Value * V0
Definition InstCombineCompares.cpp:5871

OffsetResult::invalid
static OffsetResult invalid()
Definition InstCombineCompares.cpp:5873

llvm::APFloatBase::rmNearestTiesToEven
static constexpr roundingMode rmNearestTiesToEven
Definition APFloat.h:304

llvm::APFloatBase::rmTowardZero
static constexpr roundingMode rmTowardZero
Definition APFloat.h:308

llvm::APFloatBase::IEK_Inf
@ IEK_Inf
Definition APFloat.h:346

llvm::CaptureTracker
This callback is used in conjunction with PointerMayBeCaptured.
Definition CaptureTracking.h:139

llvm::CommonPointerBase
Definition InstCombineInternal.h:884

llvm::CommonPointerBase::compute
static CommonPointerBase compute(Value *LHS, Value *RHS)
Definition InstCombineAddSub.cpp:2100

llvm::DenormalMode
Represent subnormal handling kind for floating point instruction inputs and outputs.
Definition FloatingPointMode.h:71

llvm::DenormalMode::PreserveSign
@ PreserveSign
The sign of a flushed-to-zero number is preserved in the sign of 0.
Definition FloatingPointMode.h:81

llvm::DenormalMode::PositiveZero
@ PositiveZero
Denormals are flushed to positive zero.
Definition FloatingPointMode.h:84

llvm::DenormalMode::getIEEE
static constexpr DenormalMode getIEEE()
Definition FloatingPointMode.h:115

llvm::KnownBits
Definition KnownBits.h:24

llvm::KnownBits::isNonNegative
bool isNonNegative() const
Returns true if this value is known to be non-negative.
Definition KnownBits.h:101

llvm::KnownBits::isZero
bool isZero() const
Returns true if value is all zero.
Definition KnownBits.h:80

llvm::KnownBits::countMinTrailingZeros
unsigned countMinTrailingZeros() const
Returns the minimum number of trailing zero bits.
Definition KnownBits.h:235

llvm::KnownBits::countMaxTrailingZeros
unsigned countMaxTrailingZeros() const
Returns the maximum number of trailing zero bits possible.
Definition KnownBits.h:267

llvm::KnownBits::getSignedMaxValue
APInt getSignedMaxValue() const
Return the maximal signed value possible given these KnownBits.
Definition KnownBits.h:144

llvm::KnownBits::countMaxPopulation
unsigned countMaxPopulation() const
Returns the maximum number of bits that could be one.
Definition KnownBits.h:282

llvm::KnownBits::getBitWidth
unsigned getBitWidth() const
Get the bit width of this value.
Definition KnownBits.h:44

llvm::KnownBits::isConstant
bool isConstant() const
Returns true if we know the value of all bits.
Definition KnownBits.h:54

llvm::KnownBits::countMinLeadingZeros
unsigned countMinLeadingZeros() const
Returns the minimum number of leading zero bits.
Definition KnownBits.h:241

llvm::KnownBits::getMaxValue
APInt getMaxValue() const
Return the maximal unsigned value possible given these KnownBits.
Definition KnownBits.h:138

llvm::KnownBits::getMinValue
APInt getMinValue() const
Return the minimal unsigned value possible given these KnownBits.
Definition KnownBits.h:122

llvm::KnownBits::isStrictlyPositive
bool isStrictlyPositive() const
Returns true if this value is known to be positive.
Definition KnownBits.h:107

llvm::KnownBits::isNegative
bool isNegative() const
Returns true if this value is known to be negative.
Definition KnownBits.h:98

llvm::KnownBits::One
APInt One
Definition KnownBits.h:26

llvm::KnownBits::Zero
APInt Zero
Definition KnownBits.h:25

llvm::KnownBits::countMinPopulation
unsigned countMinPopulation() const
Returns the number of bits known to be one.
Definition KnownBits.h:279

llvm::KnownBits::getSignedMinValue
APInt getSignedMinValue() const
Return the minimal signed value possible given these KnownBits.
Definition KnownBits.h:128

llvm::KnownBits::getConstant
const APInt & getConstant() const
Returns the value when all bits have a known value.
Definition KnownBits.h:60

llvm::LinearExpression
Linear expression BasePtr + Index * Scale + Offset.
Definition Loads.h:203

llvm::LinearExpression::Offset
APInt Offset
Definition Loads.h:207

llvm::LinearExpression::Index
Value * Index
Definition Loads.h:205

llvm::LinearExpression::Scale
APInt Scale
Definition Loads.h:206

llvm::LinearExpression::BasePtr
Value * BasePtr
Definition Loads.h:204

llvm::LinearExpression::Flags
GEPNoWrapFlags Flags
Definition Loads.h:208

llvm::MIPatternMatch::And
Matching combinators.
Definition MIPatternMatch.h:313

llvm::MIPatternMatch::Or
Definition MIPatternMatch.h:332

llvm::MinMax
Definition AssumeBundleQueries.h:72

llvm::PatternMatch::m_Mask
Definition PatternMatch.h:1988

llvm::PatternMatch::m_SpecificMask
Definition PatternMatch.h:2003

llvm::PatternMatch::m_SplatOrPoisonMask
Definition PatternMatch.h:2009

llvm::SelectPatternResult
Definition ValueTracking.h:851

llvm::SelectPatternResult::Flavor
SelectPatternFlavor Flavor
Definition ValueTracking.h:852

llvm::SelectPatternResult::isMinOrMax
static bool isMinOrMax(SelectPatternFlavor SPF)
When implementing this min/max pattern as fcmp; select, does the fcmp have to be ordered?
Definition ValueTracking.h:860

llvm::SimplifyQuery
Definition SimplifyQuery.h:71

llvm::SimplifyQuery::DL
const DataLayout & DL
Definition SimplifyQuery.h:72

llvm::SimplifyQuery::CxtI
const Instruction * CxtI
Definition SimplifyQuery.h:76

llvm::SimplifyQuery::DT
const DominatorTree * DT
Definition SimplifyQuery.h:74

llvm::SimplifyQuery::getWithInstruction
SimplifyQuery getWithInstruction(const Instruction *I) const
Definition SimplifyQuery.h:108

llvm::SimplifyQuery::AC
AssumptionCache * AC
Definition SimplifyQuery.h:75

llvm::SmallMapVector
A MapVector that performs no allocations if smaller than a certain size.
Definition MapVector.h:249

llvm::UseCaptureInfo
Capture information for a specific Use.
Definition CaptureTracking.h:115

llvm::fltSemantics
Definition APFloat.cpp:103