LLVM 22.0.0git
InstCombineCompares.cpp
Go to the documentation of this file.
1//===- InstCombineCompares.cpp --------------------------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file implements the visitICmp and visitFCmp functions.
10//
11//===----------------------------------------------------------------------===//
12
13#include "InstCombineInternal.h"
14#include "llvm/ADT/APFloat.h"
15#include "llvm/ADT/APSInt.h"
16#include "llvm/ADT/SetVector.h"
17#include "llvm/ADT/Statistic.h"
25#include "llvm/IR/Constants.h"
26#include "llvm/IR/DataLayout.h"
27#include "llvm/IR/InstrTypes.h"
33#include <bitset>
34
35using namespace llvm;
36using namespace PatternMatch;
37
38#define DEBUG_TYPE "instcombine"
39
40// How many times is a select replaced by one of its operands?
41STATISTIC(NumSel, "Number of select opts");
42
43/// Compute Result = In1+In2, returning true if the result overflowed for this
44/// type.
45static bool addWithOverflow(APInt &Result, const APInt &In1, const APInt &In2,
46 bool IsSigned = false) {
47 bool Overflow;
48 if (IsSigned)
49 Result = In1.sadd_ov(In2, Overflow);
50 else
51 Result = In1.uadd_ov(In2, Overflow);
52
53 return Overflow;
54}
55
56/// Compute Result = In1-In2, returning true if the result overflowed for this
57/// type.
58static bool subWithOverflow(APInt &Result, const APInt &In1, const APInt &In2,
59 bool IsSigned = false) {
60 bool Overflow;
61 if (IsSigned)
62 Result = In1.ssub_ov(In2, Overflow);
63 else
64 Result = In1.usub_ov(In2, Overflow);
65
66 return Overflow;
67}
68
69/// Given an icmp instruction, return true if any use of this comparison is a
70/// branch on sign bit comparison.
71static bool hasBranchUse(ICmpInst &I) {
72 for (auto *U : I.users())
73 if (isa<BranchInst>(U))
74 return true;
75 return false;
76}
77
78/// Returns true if the exploded icmp can be expressed as a signed comparison
79/// to zero and updates the predicate accordingly.
80/// The signedness of the comparison is preserved.
81/// TODO: Refactor with decomposeBitTestICmp()?
82static bool isSignTest(ICmpInst::Predicate &Pred, const APInt &C) {
83 if (!ICmpInst::isSigned(Pred))
84 return false;
85
86 if (C.isZero())
87 return ICmpInst::isRelational(Pred);
88
89 if (C.isOne()) {
90 if (Pred == ICmpInst::ICMP_SLT) {
91 Pred = ICmpInst::ICMP_SLE;
92 return true;
93 }
94 } else if (C.isAllOnes()) {
95 if (Pred == ICmpInst::ICMP_SGT) {
96 Pred = ICmpInst::ICMP_SGE;
97 return true;
98 }
99 }
100
101 return false;
102}
103
104/// This is called when we see this pattern:
105/// cmp pred (load (gep GV, ...)), cmpcst
106/// where GV is a global variable with a constant initializer. Try to simplify
107/// this into some simple computation that does not need the load. For example
108/// we can optimize "icmp eq (load (gep "foo", 0, i)), 0" into "icmp eq i, 3".
109///
110/// If AndCst is non-null, then the loaded value is masked with that constant
111/// before doing the comparison. This handles cases like "A[i]&4 == 0".
114 ConstantInt *AndCst) {
115 if (LI->isVolatile() || LI->getType() != GEP->getResultElementType() ||
116 !GV->getValueType()->isArrayTy() || !GV->isConstant() ||
118 return nullptr;
119
120 Type *GEPSrcEltTy = GEP->getSourceElementType();
121 if (GEPSrcEltTy->isArrayTy())
122 GEPSrcEltTy = GEPSrcEltTy->getArrayElementType();
123 if (GV->getValueType()->getArrayElementType() != GEPSrcEltTy)
124 return nullptr;
125
127 if (!isa<ConstantArray>(Init) && !isa<ConstantDataArray>(Init))
128 return nullptr;
129
130 uint64_t ArrayElementCount = Init->getType()->getArrayNumElements();
131 // Don't blow up on huge arrays.
132 if (ArrayElementCount > MaxArraySizeForCombine)
133 return nullptr;
134
135 // There are many forms of this optimization we can handle, for now, just do
136 // the simple index into a single-dimensional array or elements of equal size.
137 //
138 // Require: GEP [n x i8] GV, 0, Idx {{, constant indices}}
139 // Or: GEP i8 GV, Idx
140
141 unsigned GEPIdxOp = 1;
142 if (GEP->getSourceElementType()->isArrayTy()) {
143 GEPIdxOp = 2;
144 if (!match(GEP->getOperand(1), m_ZeroInt()))
145 return nullptr;
146 }
147 if (GEP->getNumOperands() < GEPIdxOp + 1 ||
148 isa<Constant>(GEP->getOperand(GEPIdxOp)))
149 return nullptr;
150
151 // Check that indices after the variable are constants and in-range for the
152 // type they index. Collect the indices. This is typically for arrays of
153 // structs.
154 SmallVector<unsigned, 4> LaterIndices;
155
156 Type *EltTy = Init->getType()->getArrayElementType();
157 for (unsigned i = GEPIdxOp + 1, e = GEP->getNumOperands(); i != e; ++i) {
158 ConstantInt *Idx = dyn_cast<ConstantInt>(GEP->getOperand(i));
159 if (!Idx)
160 return nullptr; // Variable index.
161
162 uint64_t IdxVal = Idx->getZExtValue();
163 if ((unsigned)IdxVal != IdxVal)
164 return nullptr; // Too large array index.
165
166 if (StructType *STy = dyn_cast<StructType>(EltTy))
167 EltTy = STy->getElementType(IdxVal);
168 else if (ArrayType *ATy = dyn_cast<ArrayType>(EltTy)) {
169 if (IdxVal >= ATy->getNumElements())
170 return nullptr;
171 EltTy = ATy->getElementType();
172 } else {
173 return nullptr; // Unknown type.
174 }
175
176 LaterIndices.push_back(IdxVal);
177 }
178
179 Value *Idx = GEP->getOperand(GEPIdxOp);
180 // If the index type is non-canonical, wait for it to be canonicalized.
181 if (Idx->getType() != DL.getIndexType(GEP->getType()))
182 return nullptr;
183
184 enum { Overdefined = -3, Undefined = -2 };
185
186 // Variables for our state machines.
187
188 // FirstTrueElement/SecondTrueElement - Used to emit a comparison of the form
189 // "i == 47 | i == 87", where 47 is the first index the condition is true for,
190 // and 87 is the second (and last) index. FirstTrueElement is -2 when
191 // undefined, otherwise set to the first true element. SecondTrueElement is
192 // -2 when undefined, -3 when overdefined and >= 0 when that index is true.
193 int FirstTrueElement = Undefined, SecondTrueElement = Undefined;
194
195 // FirstFalseElement/SecondFalseElement - Used to emit a comparison of the
196 // form "i != 47 & i != 87". Same state transitions as for true elements.
197 int FirstFalseElement = Undefined, SecondFalseElement = Undefined;
198
199 /// TrueRangeEnd/FalseRangeEnd - In conjunction with First*Element, these
200 /// define a state machine that triggers for ranges of values that the index
201 /// is true or false for. This triggers on things like "abbbbc"[i] == 'b'.
202 /// This is -2 when undefined, -3 when overdefined, and otherwise the last
203 /// index in the range (inclusive). We use -2 for undefined here because we
204 /// use relative comparisons and don't want 0-1 to match -1.
205 int TrueRangeEnd = Undefined, FalseRangeEnd = Undefined;
206
207 // MagicBitvector - This is a magic bitvector where we set a bit if the
208 // comparison is true for element 'i'. If there are 64 elements or less in
209 // the array, this will fully represent all the comparison results.
210 uint64_t MagicBitvector = 0;
211
212 // Scan the array and see if one of our patterns matches.
213 Constant *CompareRHS = cast<Constant>(ICI.getOperand(1));
214 for (unsigned i = 0, e = ArrayElementCount; i != e; ++i) {
215 Constant *Elt = Init->getAggregateElement(i);
216 if (!Elt)
217 return nullptr;
218
219 // If this is indexing an array of structures, get the structure element.
220 if (!LaterIndices.empty()) {
221 Elt = ConstantFoldExtractValueInstruction(Elt, LaterIndices);
222 if (!Elt)
223 return nullptr;
224 }
225
226 // If the element is masked, handle it.
227 if (AndCst) {
228 Elt = ConstantFoldBinaryOpOperands(Instruction::And, Elt, AndCst, DL);
229 if (!Elt)
230 return nullptr;
231 }
232
233 // Find out if the comparison would be true or false for the i'th element.
235 CompareRHS, DL, &TLI);
236 if (!C)
237 return nullptr;
238
239 // If the result is undef for this element, ignore it.
240 if (isa<UndefValue>(C)) {
241 // Extend range state machines to cover this element in case there is an
242 // undef in the middle of the range.
243 if (TrueRangeEnd == (int)i - 1)
244 TrueRangeEnd = i;
245 if (FalseRangeEnd == (int)i - 1)
246 FalseRangeEnd = i;
247 continue;
248 }
249
250 // If we can't compute the result for any of the elements, we have to give
251 // up evaluating the entire conditional.
252 if (!isa<ConstantInt>(C))
253 return nullptr;
254
255 // Otherwise, we know if the comparison is true or false for this element,
256 // update our state machines.
257 bool IsTrueForElt = !cast<ConstantInt>(C)->isZero();
258
259 // State machine for single/double/range index comparison.
260 if (IsTrueForElt) {
261 // Update the TrueElement state machine.
262 if (FirstTrueElement == Undefined)
263 FirstTrueElement = TrueRangeEnd = i; // First true element.
264 else {
265 // Update double-compare state machine.
266 if (SecondTrueElement == Undefined)
267 SecondTrueElement = i;
268 else
269 SecondTrueElement = Overdefined;
270
271 // Update range state machine.
272 if (TrueRangeEnd == (int)i - 1)
273 TrueRangeEnd = i;
274 else
275 TrueRangeEnd = Overdefined;
276 }
277 } else {
278 // Update the FalseElement state machine.
279 if (FirstFalseElement == Undefined)
280 FirstFalseElement = FalseRangeEnd = i; // First false element.
281 else {
282 // Update double-compare state machine.
283 if (SecondFalseElement == Undefined)
284 SecondFalseElement = i;
285 else
286 SecondFalseElement = Overdefined;
287
288 // Update range state machine.
289 if (FalseRangeEnd == (int)i - 1)
290 FalseRangeEnd = i;
291 else
292 FalseRangeEnd = Overdefined;
293 }
294 }
295
296 // If this element is in range, update our magic bitvector.
297 if (i < 64 && IsTrueForElt)
298 MagicBitvector |= 1ULL << i;
299
300 // If all of our states become overdefined, bail out early. Since the
301 // predicate is expensive, only check it every 8 elements. This is only
302 // really useful for really huge arrays.
303 if ((i & 8) == 0 && i >= 64 && SecondTrueElement == Overdefined &&
304 SecondFalseElement == Overdefined && TrueRangeEnd == Overdefined &&
305 FalseRangeEnd == Overdefined)
306 return nullptr;
307 }
308
309 // Now that we've scanned the entire array, emit our new comparison(s). We
310 // order the state machines in complexity of the generated code.
311
312 // If inbounds keyword is not present, Idx * ElementSize can overflow.
313 // Let's assume that ElementSize is 2 and the wanted value is at offset 0.
314 // Then, there are two possible values for Idx to match offset 0:
315 // 0x00..00, 0x80..00.
316 // Emitting 'icmp eq Idx, 0' isn't correct in this case because the
317 // comparison is false if Idx was 0x80..00.
318 // We need to erase the highest countTrailingZeros(ElementSize) bits of Idx.
319 unsigned ElementSize =
320 DL.getTypeAllocSize(Init->getType()->getArrayElementType());
321 auto MaskIdx = [&](Value *Idx) {
322 if (!GEP->isInBounds() && llvm::countr_zero(ElementSize) != 0) {
323 Value *Mask = Constant::getAllOnesValue(Idx->getType());
324 Mask = Builder.CreateLShr(Mask, llvm::countr_zero(ElementSize));
325 Idx = Builder.CreateAnd(Idx, Mask);
326 }
327 return Idx;
328 };
329
330 // If the comparison is only true for one or two elements, emit direct
331 // comparisons.
332 if (SecondTrueElement != Overdefined) {
333 Idx = MaskIdx(Idx);
334 // None true -> false.
335 if (FirstTrueElement == Undefined)
336 return replaceInstUsesWith(ICI, Builder.getFalse());
337
338 Value *FirstTrueIdx = ConstantInt::get(Idx->getType(), FirstTrueElement);
339
340 // True for one element -> 'i == 47'.
341 if (SecondTrueElement == Undefined)
342 return new ICmpInst(ICmpInst::ICMP_EQ, Idx, FirstTrueIdx);
343
344 // True for two elements -> 'i == 47 | i == 72'.
345 Value *C1 = Builder.CreateICmpEQ(Idx, FirstTrueIdx);
346 Value *SecondTrueIdx = ConstantInt::get(Idx->getType(), SecondTrueElement);
347 Value *C2 = Builder.CreateICmpEQ(Idx, SecondTrueIdx);
348 return BinaryOperator::CreateOr(C1, C2);
349 }
350
351 // If the comparison is only false for one or two elements, emit direct
352 // comparisons.
353 if (SecondFalseElement != Overdefined) {
354 Idx = MaskIdx(Idx);
355 // None false -> true.
356 if (FirstFalseElement == Undefined)
357 return replaceInstUsesWith(ICI, Builder.getTrue());
358
359 Value *FirstFalseIdx = ConstantInt::get(Idx->getType(), FirstFalseElement);
360
361 // False for one element -> 'i != 47'.
362 if (SecondFalseElement == Undefined)
363 return new ICmpInst(ICmpInst::ICMP_NE, Idx, FirstFalseIdx);
364
365 // False for two elements -> 'i != 47 & i != 72'.
366 Value *C1 = Builder.CreateICmpNE(Idx, FirstFalseIdx);
367 Value *SecondFalseIdx =
368 ConstantInt::get(Idx->getType(), SecondFalseElement);
369 Value *C2 = Builder.CreateICmpNE(Idx, SecondFalseIdx);
370 return BinaryOperator::CreateAnd(C1, C2);
371 }
372
373 // If the comparison can be replaced with a range comparison for the elements
374 // where it is true, emit the range check.
375 if (TrueRangeEnd != Overdefined) {
376 assert(TrueRangeEnd != FirstTrueElement && "Should emit single compare");
377 Idx = MaskIdx(Idx);
378
379 // Generate (i-FirstTrue) <u (TrueRangeEnd-FirstTrue+1).
380 if (FirstTrueElement) {
381 Value *Offs = ConstantInt::get(Idx->getType(), -FirstTrueElement);
382 Idx = Builder.CreateAdd(Idx, Offs);
383 }
384
385 Value *End =
386 ConstantInt::get(Idx->getType(), TrueRangeEnd - FirstTrueElement + 1);
387 return new ICmpInst(ICmpInst::ICMP_ULT, Idx, End);
388 }
389
390 // False range check.
391 if (FalseRangeEnd != Overdefined) {
392 assert(FalseRangeEnd != FirstFalseElement && "Should emit single compare");
393 Idx = MaskIdx(Idx);
394 // Generate (i-FirstFalse) >u (FalseRangeEnd-FirstFalse).
395 if (FirstFalseElement) {
396 Value *Offs = ConstantInt::get(Idx->getType(), -FirstFalseElement);
397 Idx = Builder.CreateAdd(Idx, Offs);
398 }
399
400 Value *End =
401 ConstantInt::get(Idx->getType(), FalseRangeEnd - FirstFalseElement);
402 return new ICmpInst(ICmpInst::ICMP_UGT, Idx, End);
403 }
404
405 // If a magic bitvector captures the entire comparison state
406 // of this load, replace it with computation that does:
407 // ((magic_cst >> i) & 1) != 0
408 {
409 Type *Ty = nullptr;
410
411 // Look for an appropriate type:
412 // - The type of Idx if the magic fits
413 // - The smallest fitting legal type
414 if (ArrayElementCount <= Idx->getType()->getIntegerBitWidth())
415 Ty = Idx->getType();
416 else
417 Ty = DL.getSmallestLegalIntType(Init->getContext(), ArrayElementCount);
418
419 if (Ty) {
420 Idx = MaskIdx(Idx);
421 Value *V = Builder.CreateIntCast(Idx, Ty, false);
422 V = Builder.CreateLShr(ConstantInt::get(Ty, MagicBitvector), V);
423 V = Builder.CreateAnd(ConstantInt::get(Ty, 1), V);
424 return new ICmpInst(ICmpInst::ICMP_NE, V, ConstantInt::get(Ty, 0));
425 }
426 }
427
428 return nullptr;
429}
430
431/// Returns true if we can rewrite Start as a GEP with pointer Base
432/// and some integer offset. The nodes that need to be re-written
433/// for this transformation will be added to Explored.
435 const DataLayout &DL,
436 SetVector<Value *> &Explored) {
437 SmallVector<Value *, 16> WorkList(1, Start);
438 Explored.insert(Base);
439
440 // The following traversal gives us an order which can be used
441 // when doing the final transformation. Since in the final
442 // transformation we create the PHI replacement instructions first,
443 // we don't have to get them in any particular order.
444 //
445 // However, for other instructions we will have to traverse the
446 // operands of an instruction first, which means that we have to
447 // do a post-order traversal.
448 while (!WorkList.empty()) {
450
451 while (!WorkList.empty()) {
452 if (Explored.size() >= 100)
453 return false;
454
455 Value *V = WorkList.back();
456
457 if (Explored.contains(V)) {
458 WorkList.pop_back();
459 continue;
460 }
461
462 if (!isa<GetElementPtrInst>(V) && !isa<PHINode>(V))
463 // We've found some value that we can't explore which is different from
464 // the base. Therefore we can't do this transformation.
465 return false;
466
467 if (auto *GEP = dyn_cast<GEPOperator>(V)) {
468 // Only allow inbounds GEPs with at most one variable offset.
469 auto IsNonConst = [](Value *V) { return !isa<ConstantInt>(V); };
470 if (!GEP->isInBounds() || count_if(GEP->indices(), IsNonConst) > 1)
471 return false;
472
473 NW = NW.intersectForOffsetAdd(GEP->getNoWrapFlags());
474 if (!Explored.contains(GEP->getOperand(0)))
475 WorkList.push_back(GEP->getOperand(0));
476 }
477
478 if (WorkList.back() == V) {
479 WorkList.pop_back();
480 // We've finished visiting this node, mark it as such.
481 Explored.insert(V);
482 }
483
484 if (auto *PN = dyn_cast<PHINode>(V)) {
485 // We cannot transform PHIs on unsplittable basic blocks.
486 if (isa<CatchSwitchInst>(PN->getParent()->getTerminator()))
487 return false;
488 Explored.insert(PN);
489 PHIs.insert(PN);
490 }
491 }
492
493 // Explore the PHI nodes further.
494 for (auto *PN : PHIs)
495 for (Value *Op : PN->incoming_values())
496 if (!Explored.contains(Op))
497 WorkList.push_back(Op);
498 }
499
500 // Make sure that we can do this. Since we can't insert GEPs in a basic
501 // block before a PHI node, we can't easily do this transformation if
502 // we have PHI node users of transformed instructions.
503 for (Value *Val : Explored) {
504 for (Value *Use : Val->uses()) {
505
506 auto *PHI = dyn_cast<PHINode>(Use);
507 auto *Inst = dyn_cast<Instruction>(Val);
508
509 if (Inst == Base || Inst == PHI || !Inst || !PHI ||
510 !Explored.contains(PHI))
511 continue;
512
513 if (PHI->getParent() == Inst->getParent())
514 return false;
515 }
516 }
517 return true;
518}
519
520// Sets the appropriate insert point on Builder where we can add
521// a replacement Instruction for V (if that is possible).
522static void setInsertionPoint(IRBuilder<> &Builder, Value *V,
523 bool Before = true) {
524 if (auto *PHI = dyn_cast<PHINode>(V)) {
525 BasicBlock *Parent = PHI->getParent();
526 Builder.SetInsertPoint(Parent, Parent->getFirstInsertionPt());
527 return;
528 }
529 if (auto *I = dyn_cast<Instruction>(V)) {
530 if (!Before)
531 I = &*std::next(I->getIterator());
532 Builder.SetInsertPoint(I);
533 return;
534 }
535 if (auto *A = dyn_cast<Argument>(V)) {
536 // Set the insertion point in the entry block.
537 BasicBlock &Entry = A->getParent()->getEntryBlock();
538 Builder.SetInsertPoint(&Entry, Entry.getFirstInsertionPt());
539 return;
540 }
541 // Otherwise, this is a constant and we don't need to set a new
542 // insertion point.
543 assert(isa<Constant>(V) && "Setting insertion point for unknown value!");
544}
545
546/// Returns a re-written value of Start as an indexed GEP using Base as a
547/// pointer.
549 const DataLayout &DL,
550 SetVector<Value *> &Explored,
551 InstCombiner &IC) {
552 // Perform all the substitutions. This is a bit tricky because we can
553 // have cycles in our use-def chains.
554 // 1. Create the PHI nodes without any incoming values.
555 // 2. Create all the other values.
556 // 3. Add the edges for the PHI nodes.
557 // 4. Emit GEPs to get the original pointers.
558 // 5. Remove the original instructions.
559 Type *IndexType = IntegerType::get(
560 Base->getContext(), DL.getIndexTypeSizeInBits(Start->getType()));
561
563 NewInsts[Base] = ConstantInt::getNullValue(IndexType);
564
565 // Create the new PHI nodes, without adding any incoming values.
566 for (Value *Val : Explored) {
567 if (Val == Base)
568 continue;
569 // Create empty phi nodes. This avoids cyclic dependencies when creating
570 // the remaining instructions.
571 if (auto *PHI = dyn_cast<PHINode>(Val))
572 NewInsts[PHI] =
573 PHINode::Create(IndexType, PHI->getNumIncomingValues(),
574 PHI->getName() + ".idx", PHI->getIterator());
575 }
576 IRBuilder<> Builder(Base->getContext());
577
578 // Create all the other instructions.
579 for (Value *Val : Explored) {
580 if (NewInsts.contains(Val))
581 continue;
582
583 if (auto *GEP = dyn_cast<GEPOperator>(Val)) {
584 setInsertionPoint(Builder, GEP);
585 Value *Op = NewInsts[GEP->getOperand(0)];
586 Value *OffsetV = emitGEPOffset(&Builder, DL, GEP);
587 if (isa<ConstantInt>(Op) && cast<ConstantInt>(Op)->isZero())
588 NewInsts[GEP] = OffsetV;
589 else
590 NewInsts[GEP] = Builder.CreateAdd(
591 Op, OffsetV, GEP->getOperand(0)->getName() + ".add",
592 /*NUW=*/NW.hasNoUnsignedWrap(),
593 /*NSW=*/NW.hasNoUnsignedSignedWrap());
594 continue;
595 }
596 if (isa<PHINode>(Val))
597 continue;
598
599 llvm_unreachable("Unexpected instruction type");
600 }
601
602 // Add the incoming values to the PHI nodes.
603 for (Value *Val : Explored) {
604 if (Val == Base)
605 continue;
606 // All the instructions have been created, we can now add edges to the
607 // phi nodes.
608 if (auto *PHI = dyn_cast<PHINode>(Val)) {
609 PHINode *NewPhi = static_cast<PHINode *>(NewInsts[PHI]);
610 for (unsigned I = 0, E = PHI->getNumIncomingValues(); I < E; ++I) {
611 Value *NewIncoming = PHI->getIncomingValue(I);
612
613 auto It = NewInsts.find(NewIncoming);
614 if (It != NewInsts.end())
615 NewIncoming = It->second;
616
617 NewPhi->addIncoming(NewIncoming, PHI->getIncomingBlock(I));
618 }
619 }
620 }
621
622 for (Value *Val : Explored) {
623 if (Val == Base)
624 continue;
625
626 setInsertionPoint(Builder, Val, false);
627 // Create GEP for external users.
628 Value *NewVal = Builder.CreateGEP(Builder.getInt8Ty(), Base, NewInsts[Val],
629 Val->getName() + ".ptr", NW);
630 IC.replaceInstUsesWith(*cast<Instruction>(Val), NewVal);
631 // Add old instruction to worklist for DCE. We don't directly remove it
632 // here because the original compare is one of the users.
633 IC.addToWorklist(cast<Instruction>(Val));
634 }
635
636 return NewInsts[Start];
637}
638
639/// Converts (CMP GEPLHS, RHS) if this change would make RHS a constant.
640/// We can look through PHIs, GEPs and casts in order to determine a common base
641/// between GEPLHS and RHS.
644 const DataLayout &DL,
645 InstCombiner &IC) {
646 // FIXME: Support vector of pointers.
647 if (GEPLHS->getType()->isVectorTy())
648 return nullptr;
649
650 if (!GEPLHS->hasAllConstantIndices())
651 return nullptr;
652
653 APInt Offset(DL.getIndexTypeSizeInBits(GEPLHS->getType()), 0);
654 Value *PtrBase =
656 /*AllowNonInbounds*/ false);
657
658 // Bail if we looked through addrspacecast.
659 if (PtrBase->getType() != GEPLHS->getType())
660 return nullptr;
661
662 // The set of nodes that will take part in this transformation.
663 SetVector<Value *> Nodes;
664 GEPNoWrapFlags NW = GEPLHS->getNoWrapFlags();
665 if (!canRewriteGEPAsOffset(RHS, PtrBase, NW, DL, Nodes))
666 return nullptr;
667
668 // We know we can re-write this as
669 // ((gep Ptr, OFFSET1) cmp (gep Ptr, OFFSET2)
670 // Since we've only looked through inbouds GEPs we know that we
671 // can't have overflow on either side. We can therefore re-write
672 // this as:
673 // OFFSET1 cmp OFFSET2
674 Value *NewRHS = rewriteGEPAsOffset(RHS, PtrBase, NW, DL, Nodes, IC);
675
676 // RewriteGEPAsOffset has replaced RHS and all of its uses with a re-written
677 // GEP having PtrBase as the pointer base, and has returned in NewRHS the
678 // offset. Since Index is the offset of LHS to the base pointer, we will now
679 // compare the offsets instead of comparing the pointers.
681 IC.Builder.getInt(Offset), NewRHS);
682}
683
684/// Fold comparisons between a GEP instruction and something else. At this point
685/// we know that the GEP is on the LHS of the comparison.
688 // Don't transform signed compares of GEPs into index compares. Even if the
689 // GEP is inbounds, the final add of the base pointer can have signed overflow
690 // and would change the result of the icmp.
691 // e.g. "&foo[0] <s &foo[1]" can't be folded to "true" because "foo" could be
692 // the maximum signed value for the pointer type.
694 return nullptr;
695
696 // Look through bitcasts and addrspacecasts. We do not however want to remove
697 // 0 GEPs.
698 if (!isa<GetElementPtrInst>(RHS))
700
701 auto CanFold = [Cond](GEPNoWrapFlags NW) {
703 return true;
704
705 // Unsigned predicates can be folded if the GEPs have *any* nowrap flags.
707 return NW != GEPNoWrapFlags::none();
708 };
709
710 auto NewICmp = [Cond](GEPNoWrapFlags NW, Value *Op1, Value *Op2) {
711 if (!NW.hasNoUnsignedWrap()) {
712 // Convert signed to unsigned comparison.
713 return new ICmpInst(ICmpInst::getSignedPredicate(Cond), Op1, Op2);
714 }
715
716 auto *I = new ICmpInst(Cond, Op1, Op2);
717 I->setSameSign(NW.hasNoUnsignedSignedWrap());
718 return I;
719 };
720
722 if (Base.Ptr == RHS && CanFold(Base.LHSNW) && !Base.isExpensive()) {
723 // ((gep Ptr, OFFSET) cmp Ptr) ---> (OFFSET cmp 0).
724 Type *IdxTy = DL.getIndexType(GEPLHS->getType());
725 Value *Offset =
726 EmitGEPOffsets(Base.LHSGEPs, Base.LHSNW, IdxTy, /*RewriteGEPs=*/true);
727 return NewICmp(Base.LHSNW, Offset,
728 Constant::getNullValue(Offset->getType()));
729 }
730
731 if (GEPLHS->isInBounds() && ICmpInst::isEquality(Cond) &&
732 isa<Constant>(RHS) && cast<Constant>(RHS)->isNullValue() &&
733 !NullPointerIsDefined(I.getFunction(),
735 // For most address spaces, an allocation can't be placed at null, but null
736 // itself is treated as a 0 size allocation in the in bounds rules. Thus,
737 // the only valid inbounds address derived from null, is null itself.
738 // Thus, we have four cases to consider:
739 // 1) Base == nullptr, Offset == 0 -> inbounds, null
740 // 2) Base == nullptr, Offset != 0 -> poison as the result is out of bounds
741 // 3) Base != nullptr, Offset == (-base) -> poison (crossing allocations)
742 // 4) Base != nullptr, Offset != (-base) -> nonnull (and possibly poison)
743 //
744 // (Note if we're indexing a type of size 0, that simply collapses into one
745 // of the buckets above.)
746 //
747 // In general, we're allowed to make values less poison (i.e. remove
748 // sources of full UB), so in this case, we just select between the two
749 // non-poison cases (1 and 4 above).
750 //
751 // For vectors, we apply the same reasoning on a per-lane basis.
752 auto *Base = GEPLHS->getPointerOperand();
753 if (GEPLHS->getType()->isVectorTy() && Base->getType()->isPointerTy()) {
754 auto EC = cast<VectorType>(GEPLHS->getType())->getElementCount();
756 }
757 return new ICmpInst(Cond, Base,
759 cast<Constant>(RHS), Base->getType()));
760 } else if (GEPOperator *GEPRHS = dyn_cast<GEPOperator>(RHS)) {
761 GEPNoWrapFlags NW = GEPLHS->getNoWrapFlags() & GEPRHS->getNoWrapFlags();
762
763 // If the base pointers are different, but the indices are the same, just
764 // compare the base pointer.
765 if (GEPLHS->getOperand(0) != GEPRHS->getOperand(0)) {
766 bool IndicesTheSame =
767 GEPLHS->getNumOperands() == GEPRHS->getNumOperands() &&
768 GEPLHS->getPointerOperand()->getType() ==
769 GEPRHS->getPointerOperand()->getType() &&
770 GEPLHS->getSourceElementType() == GEPRHS->getSourceElementType();
771 if (IndicesTheSame)
772 for (unsigned i = 1, e = GEPLHS->getNumOperands(); i != e; ++i)
773 if (GEPLHS->getOperand(i) != GEPRHS->getOperand(i)) {
774 IndicesTheSame = false;
775 break;
776 }
777
778 // If all indices are the same, just compare the base pointers.
779 Type *BaseType = GEPLHS->getOperand(0)->getType();
780 if (IndicesTheSame &&
781 CmpInst::makeCmpResultType(BaseType) == I.getType() && CanFold(NW))
782 return new ICmpInst(Cond, GEPLHS->getOperand(0), GEPRHS->getOperand(0));
783
784 // If we're comparing GEPs with two base pointers that only differ in type
785 // and both GEPs have only constant indices or just one use, then fold
786 // the compare with the adjusted indices.
787 // FIXME: Support vector of pointers.
788 if (GEPLHS->isInBounds() && GEPRHS->isInBounds() &&
789 (GEPLHS->hasAllConstantIndices() || GEPLHS->hasOneUse()) &&
790 (GEPRHS->hasAllConstantIndices() || GEPRHS->hasOneUse()) &&
791 GEPLHS->getOperand(0)->stripPointerCasts() ==
792 GEPRHS->getOperand(0)->stripPointerCasts() &&
793 !GEPLHS->getType()->isVectorTy()) {
794 Value *LOffset = EmitGEPOffset(GEPLHS);
795 Value *ROffset = EmitGEPOffset(GEPRHS);
796
797 // If we looked through an addrspacecast between different sized address
798 // spaces, the LHS and RHS pointers are different sized
799 // integers. Truncate to the smaller one.
800 Type *LHSIndexTy = LOffset->getType();
801 Type *RHSIndexTy = ROffset->getType();
802 if (LHSIndexTy != RHSIndexTy) {
803 if (LHSIndexTy->getPrimitiveSizeInBits().getFixedValue() <
804 RHSIndexTy->getPrimitiveSizeInBits().getFixedValue()) {
805 ROffset = Builder.CreateTrunc(ROffset, LHSIndexTy);
806 } else
807 LOffset = Builder.CreateTrunc(LOffset, RHSIndexTy);
808 }
809
811 LOffset, ROffset);
812 return replaceInstUsesWith(I, Cmp);
813 }
814 }
815
816 if (GEPLHS->getOperand(0) == GEPRHS->getOperand(0) &&
817 GEPLHS->getNumOperands() == GEPRHS->getNumOperands() &&
818 GEPLHS->getSourceElementType() == GEPRHS->getSourceElementType()) {
819 // If the GEPs only differ by one index, compare it.
820 unsigned NumDifferences = 0; // Keep track of # differences.
821 unsigned DiffOperand = 0; // The operand that differs.
822 for (unsigned i = 1, e = GEPRHS->getNumOperands(); i != e; ++i)
823 if (GEPLHS->getOperand(i) != GEPRHS->getOperand(i)) {
824 Type *LHSType = GEPLHS->getOperand(i)->getType();
825 Type *RHSType = GEPRHS->getOperand(i)->getType();
826 // FIXME: Better support for vector of pointers.
827 if (LHSType->getPrimitiveSizeInBits() !=
828 RHSType->getPrimitiveSizeInBits() ||
829 (GEPLHS->getType()->isVectorTy() &&
830 (!LHSType->isVectorTy() || !RHSType->isVectorTy()))) {
831 // Irreconcilable differences.
832 NumDifferences = 2;
833 break;
834 }
835
836 if (NumDifferences++)
837 break;
838 DiffOperand = i;
839 }
840
841 if (NumDifferences == 0) // SAME GEP?
842 return replaceInstUsesWith(
843 I, // No comparison is needed here.
844 ConstantInt::get(I.getType(), ICmpInst::isTrueWhenEqual(Cond)));
845 // If two GEPs only differ by an index, compare them.
846 // Note that nowrap flags are always needed when comparing two indices.
847 else if (NumDifferences == 1 && NW != GEPNoWrapFlags::none()) {
848 Value *LHSV = GEPLHS->getOperand(DiffOperand);
849 Value *RHSV = GEPRHS->getOperand(DiffOperand);
850 return NewICmp(NW, LHSV, RHSV);
851 }
852 }
853
854 if (Base.Ptr && CanFold(Base.LHSNW & Base.RHSNW) && !Base.isExpensive()) {
855 // ((gep Ptr, OFFSET1) cmp (gep Ptr, OFFSET2) ---> (OFFSET1 cmp OFFSET2)
856 Type *IdxTy = DL.getIndexType(GEPLHS->getType());
857 Value *L =
858 EmitGEPOffsets(Base.LHSGEPs, Base.LHSNW, IdxTy, /*RewriteGEP=*/true);
859 Value *R =
860 EmitGEPOffsets(Base.RHSGEPs, Base.RHSNW, IdxTy, /*RewriteGEP=*/true);
861 return NewICmp(Base.LHSNW & Base.RHSNW, L, R);
862 }
863 }
864
865 // Try convert this to an indexed compare by looking through PHIs/casts as a
866 // last resort.
867 return transformToIndexedCompare(GEPLHS, RHS, Cond, DL, *this);
868}
869
871 // It would be tempting to fold away comparisons between allocas and any
872 // pointer not based on that alloca (e.g. an argument). However, even
873 // though such pointers cannot alias, they can still compare equal.
874 //
875 // But LLVM doesn't specify where allocas get their memory, so if the alloca
876 // doesn't escape we can argue that it's impossible to guess its value, and we
877 // can therefore act as if any such guesses are wrong.
878 //
879 // However, we need to ensure that this folding is consistent: We can't fold
880 // one comparison to false, and then leave a different comparison against the
881 // same value alone (as it might evaluate to true at runtime, leading to a
882 // contradiction). As such, this code ensures that all comparisons are folded
883 // at the same time, and there are no other escapes.
884
885 struct CmpCaptureTracker : public CaptureTracker {
886 AllocaInst *Alloca;
887 bool Captured = false;
888 /// The value of the map is a bit mask of which icmp operands the alloca is
889 /// used in.
891
892 CmpCaptureTracker(AllocaInst *Alloca) : Alloca(Alloca) {}
893
894 void tooManyUses() override { Captured = true; }
895
896 Action captured(const Use *U, UseCaptureInfo CI) override {
897 // TODO(captures): Use UseCaptureInfo.
898 auto *ICmp = dyn_cast<ICmpInst>(U->getUser());
899 // We need to check that U is based *only* on the alloca, and doesn't
900 // have other contributions from a select/phi operand.
901 // TODO: We could check whether getUnderlyingObjects() reduces to one
902 // object, which would allow looking through phi nodes.
903 if (ICmp && ICmp->isEquality() && getUnderlyingObject(*U) == Alloca) {
904 // Collect equality icmps of the alloca, and don't treat them as
905 // captures.
906 ICmps[ICmp] |= 1u << U->getOperandNo();
907 return Continue;
908 }
909
910 Captured = true;
911 return Stop;
912 }
913 };
914
915 CmpCaptureTracker Tracker(Alloca);
916 PointerMayBeCaptured(Alloca, &Tracker);
917 if (Tracker.Captured)
918 return false;
919
920 bool Changed = false;
921 for (auto [ICmp, Operands] : Tracker.ICmps) {
922 switch (Operands) {
923 case 1:
924 case 2: {
925 // The alloca is only used in one icmp operand. Assume that the
926 // equality is false.
927 auto *Res = ConstantInt::get(ICmp->getType(),
928 ICmp->getPredicate() == ICmpInst::ICMP_NE);
929 replaceInstUsesWith(*ICmp, Res);
931 Changed = true;
932 break;
933 }
934 case 3:
935 // Both icmp operands are based on the alloca, so this is comparing
936 // pointer offsets, without leaking any information about the address
937 // of the alloca. Ignore such comparisons.
938 break;
939 default:
940 llvm_unreachable("Cannot happen");
941 }
942 }
943
944 return Changed;
945}
946
947/// Fold "icmp pred (X+C), X".
949 CmpPredicate Pred) {
950 // From this point on, we know that (X+C <= X) --> (X+C < X) because C != 0,
951 // so the values can never be equal. Similarly for all other "or equals"
952 // operators.
953 assert(!!C && "C should not be zero!");
954
955 // (X+1) <u X --> X >u (MAXUINT-1) --> X == 255
956 // (X+2) <u X --> X >u (MAXUINT-2) --> X > 253
957 // (X+MAXUINT) <u X --> X >u (MAXUINT-MAXUINT) --> X != 0
958 if (Pred == ICmpInst::ICMP_ULT || Pred == ICmpInst::ICMP_ULE) {
959 Constant *R =
960 ConstantInt::get(X->getType(), APInt::getMaxValue(C.getBitWidth()) - C);
961 return new ICmpInst(ICmpInst::ICMP_UGT, X, R);
962 }
963
964 // (X+1) >u X --> X <u (0-1) --> X != 255
965 // (X+2) >u X --> X <u (0-2) --> X <u 254
966 // (X+MAXUINT) >u X --> X <u (0-MAXUINT) --> X <u 1 --> X == 0
967 if (Pred == ICmpInst::ICMP_UGT || Pred == ICmpInst::ICMP_UGE)
968 return new ICmpInst(ICmpInst::ICMP_ULT, X,
969 ConstantInt::get(X->getType(), -C));
970
971 APInt SMax = APInt::getSignedMaxValue(C.getBitWidth());
972
973 // (X+ 1) <s X --> X >s (MAXSINT-1) --> X == 127
974 // (X+ 2) <s X --> X >s (MAXSINT-2) --> X >s 125
975 // (X+MAXSINT) <s X --> X >s (MAXSINT-MAXSINT) --> X >s 0
976 // (X+MINSINT) <s X --> X >s (MAXSINT-MINSINT) --> X >s -1
977 // (X+ -2) <s X --> X >s (MAXSINT- -2) --> X >s 126
978 // (X+ -1) <s X --> X >s (MAXSINT- -1) --> X != 127
979 if (Pred == ICmpInst::ICMP_SLT || Pred == ICmpInst::ICMP_SLE)
980 return new ICmpInst(ICmpInst::ICMP_SGT, X,
981 ConstantInt::get(X->getType(), SMax - C));
982
983 // (X+ 1) >s X --> X <s (MAXSINT-(1-1)) --> X != 127
984 // (X+ 2) >s X --> X <s (MAXSINT-(2-1)) --> X <s 126
985 // (X+MAXSINT) >s X --> X <s (MAXSINT-(MAXSINT-1)) --> X <s 1
986 // (X+MINSINT) >s X --> X <s (MAXSINT-(MINSINT-1)) --> X <s -2
987 // (X+ -2) >s X --> X <s (MAXSINT-(-2-1)) --> X <s -126
988 // (X+ -1) >s X --> X <s (MAXSINT-(-1-1)) --> X == -128
989
990 assert(Pred == ICmpInst::ICMP_SGT || Pred == ICmpInst::ICMP_SGE);
991 return new ICmpInst(ICmpInst::ICMP_SLT, X,
992 ConstantInt::get(X->getType(), SMax - (C - 1)));
993}
994
995/// Handle "(icmp eq/ne (ashr/lshr AP2, A), AP1)" ->
996/// (icmp eq/ne A, Log2(AP2/AP1)) ->
997/// (icmp eq/ne A, Log2(AP2) - Log2(AP1)).
999 const APInt &AP1,
1000 const APInt &AP2) {
1001 assert(I.isEquality() && "Cannot fold icmp gt/lt");
1002
1003 auto getICmp = [&I](CmpInst::Predicate Pred, Value *LHS, Value *RHS) {
1004 if (I.getPredicate() == I.ICMP_NE)
1005 Pred = CmpInst::getInversePredicate(Pred);
1006 return new ICmpInst(Pred, LHS, RHS);
1007 };
1008
1009 // Don't bother doing any work for cases which InstSimplify handles.
1010 if (AP2.isZero())
1011 return nullptr;
1012
1013 bool IsAShr = isa<AShrOperator>(I.getOperand(0));
1014 if (IsAShr) {
1015 if (AP2.isAllOnes())
1016 return nullptr;
1017 if (AP2.isNegative() != AP1.isNegative())
1018 return nullptr;
1019 if (AP2.sgt(AP1))
1020 return nullptr;
1021 }
1022
1023 if (!AP1)
1024 // 'A' must be large enough to shift out the highest set bit.
1025 return getICmp(I.ICMP_UGT, A,
1026 ConstantInt::get(A->getType(), AP2.logBase2()));
1027
1028 if (AP1 == AP2)
1029 return getICmp(I.ICMP_EQ, A, ConstantInt::getNullValue(A->getType()));
1030
1031 int Shift;
1032 if (IsAShr && AP1.isNegative())
1033 Shift = AP1.countl_one() - AP2.countl_one();
1034 else
1035 Shift = AP1.countl_zero() - AP2.countl_zero();
1036
1037 if (Shift > 0) {
1038 if (IsAShr && AP1 == AP2.ashr(Shift)) {
1039 // There are multiple solutions if we are comparing against -1 and the LHS
1040 // of the ashr is not a power of two.
1041 if (AP1.isAllOnes() && !AP2.isPowerOf2())
1042 return getICmp(I.ICMP_UGE, A, ConstantInt::get(A->getType(), Shift));
1043 return getICmp(I.ICMP_EQ, A, ConstantInt::get(A->getType(), Shift));
1044 } else if (AP1 == AP2.lshr(Shift)) {
1045 return getICmp(I.ICMP_EQ, A, ConstantInt::get(A->getType(), Shift));
1046 }
1047 }
1048
1049 // Shifting const2 will never be equal to const1.
1050 // FIXME: This should always be handled by InstSimplify?
1051 auto *TorF = ConstantInt::get(I.getType(), I.getPredicate() == I.ICMP_NE);
1052 return replaceInstUsesWith(I, TorF);
1053}
1054
1055/// Handle "(icmp eq/ne (shl AP2, A), AP1)" ->
1056/// (icmp eq/ne A, TrailingZeros(AP1) - TrailingZeros(AP2)).
1058 const APInt &AP1,
1059 const APInt &AP2) {
1060 assert(I.isEquality() && "Cannot fold icmp gt/lt");
1061
1062 auto getICmp = [&I](CmpInst::Predicate Pred, Value *LHS, Value *RHS) {
1063 if (I.getPredicate() == I.ICMP_NE)
1064 Pred = CmpInst::getInversePredicate(Pred);
1065 return new ICmpInst(Pred, LHS, RHS);
1066 };
1067
1068 // Don't bother doing any work for cases which InstSimplify handles.
1069 if (AP2.isZero())
1070 return nullptr;
1071
1072 unsigned AP2TrailingZeros = AP2.countr_zero();
1073
1074 if (!AP1 && AP2TrailingZeros != 0)
1075 return getICmp(
1076 I.ICMP_UGE, A,
1077 ConstantInt::get(A->getType(), AP2.getBitWidth() - AP2TrailingZeros));
1078
1079 if (AP1 == AP2)
1080 return getICmp(I.ICMP_EQ, A, ConstantInt::getNullValue(A->getType()));
1081
1082 // Get the distance between the lowest bits that are set.
1083 int Shift = AP1.countr_zero() - AP2TrailingZeros;
1084
1085 if (Shift > 0 && AP2.shl(Shift) == AP1)
1086 return getICmp(I.ICMP_EQ, A, ConstantInt::get(A->getType(), Shift));
1087
1088 // Shifting const2 will never be equal to const1.
1089 // FIXME: This should always be handled by InstSimplify?
1090 auto *TorF = ConstantInt::get(I.getType(), I.getPredicate() == I.ICMP_NE);
1091 return replaceInstUsesWith(I, TorF);
1092}
1093
1094/// The caller has matched a pattern of the form:
1095/// I = icmp ugt (add (add A, B), CI2), CI1
1096/// If this is of the form:
1097/// sum = a + b
1098/// if (sum+128 >u 255)
1099/// Then replace it with llvm.sadd.with.overflow.i8.
1100///
1102 ConstantInt *CI2, ConstantInt *CI1,
1103 InstCombinerImpl &IC) {
1104 // The transformation we're trying to do here is to transform this into an
1105 // llvm.sadd.with.overflow. To do this, we have to replace the original add
1106 // with a narrower add, and discard the add-with-constant that is part of the
1107 // range check (if we can't eliminate it, this isn't profitable).
1108
1109 // In order to eliminate the add-with-constant, the compare can be its only
1110 // use.
1111 Instruction *AddWithCst = cast<Instruction>(I.getOperand(0));
1112 if (!AddWithCst->hasOneUse())
1113 return nullptr;
1114
1115 // If CI2 is 2^7, 2^15, 2^31, then it might be an sadd.with.overflow.
1116 if (!CI2->getValue().isPowerOf2())
1117 return nullptr;
1118 unsigned NewWidth = CI2->getValue().countr_zero();
1119 if (NewWidth != 7 && NewWidth != 15 && NewWidth != 31)
1120 return nullptr;
1121
1122 // The width of the new add formed is 1 more than the bias.
1123 ++NewWidth;
1124
1125 // Check to see that CI1 is an all-ones value with NewWidth bits.
1126 if (CI1->getBitWidth() == NewWidth ||
1127 CI1->getValue() != APInt::getLowBitsSet(CI1->getBitWidth(), NewWidth))
1128 return nullptr;
1129
1130 // This is only really a signed overflow check if the inputs have been
1131 // sign-extended; check for that condition. For example, if CI2 is 2^31 and
1132 // the operands of the add are 64 bits wide, we need at least 33 sign bits.
1133 if (IC.ComputeMaxSignificantBits(A, &I) > NewWidth ||
1134 IC.ComputeMaxSignificantBits(B, &I) > NewWidth)
1135 return nullptr;
1136
1137 // In order to replace the original add with a narrower
1138 // llvm.sadd.with.overflow, the only uses allowed are the add-with-constant
1139 // and truncates that discard the high bits of the add. Verify that this is
1140 // the case.
1141 Instruction *OrigAdd = cast<Instruction>(AddWithCst->getOperand(0));
1142 for (User *U : OrigAdd->users()) {
1143 if (U == AddWithCst)
1144 continue;
1145
1146 // Only accept truncates for now. We would really like a nice recursive
1147 // predicate like SimplifyDemandedBits, but which goes downwards the use-def
1148 // chain to see which bits of a value are actually demanded. If the
1149 // original add had another add which was then immediately truncated, we
1150 // could still do the transformation.
1151 TruncInst *TI = dyn_cast<TruncInst>(U);
1152 if (!TI || TI->getType()->getPrimitiveSizeInBits() > NewWidth)
1153 return nullptr;
1154 }
1155
1156 // If the pattern matches, truncate the inputs to the narrower type and
1157 // use the sadd_with_overflow intrinsic to efficiently compute both the
1158 // result and the overflow bit.
1159 Type *NewType = IntegerType::get(OrigAdd->getContext(), NewWidth);
1161 I.getModule(), Intrinsic::sadd_with_overflow, NewType);
1162
1163 InstCombiner::BuilderTy &Builder = IC.Builder;
1164
1165 // Put the new code above the original add, in case there are any uses of the
1166 // add between the add and the compare.
1167 Builder.SetInsertPoint(OrigAdd);
1168
1169 Value *TruncA = Builder.CreateTrunc(A, NewType, A->getName() + ".trunc");
1170 Value *TruncB = Builder.CreateTrunc(B, NewType, B->getName() + ".trunc");
1171 CallInst *Call = Builder.CreateCall(F, {TruncA, TruncB}, "sadd");
1172 Value *Add = Builder.CreateExtractValue(Call, 0, "sadd.result");
1173 Value *ZExt = Builder.CreateZExt(Add, OrigAdd->getType());
1174
1175 // The inner add was the result of the narrow add, zero extended to the
1176 // wider type. Replace it with the result computed by the intrinsic.
1177 IC.replaceInstUsesWith(*OrigAdd, ZExt);
1178 IC.eraseInstFromFunction(*OrigAdd);
1179
1180 // The original icmp gets replaced with the overflow value.
1181 return ExtractValueInst::Create(Call, 1, "sadd.overflow");
1182}
1183
1184/// If we have:
1185/// icmp eq/ne (urem/srem %x, %y), 0
1186/// iff %y is a power-of-two, we can replace this with a bit test:
1187/// icmp eq/ne (and %x, (add %y, -1)), 0
1189 // This fold is only valid for equality predicates.
1190 if (!I.isEquality())
1191 return nullptr;
1192 CmpPredicate Pred;
1193 Value *X, *Y, *Zero;
1194 if (!match(&I, m_ICmp(Pred, m_OneUse(m_IRem(m_Value(X), m_Value(Y))),
1195 m_CombineAnd(m_Zero(), m_Value(Zero)))))
1196 return nullptr;
1197 if (!isKnownToBeAPowerOfTwo(Y, /*OrZero*/ true, &I))
1198 return nullptr;
1199 // This may increase instruction count, we don't enforce that Y is a constant.
1200 Value *Mask = Builder.CreateAdd(Y, Constant::getAllOnesValue(Y->getType()));
1201 Value *Masked = Builder.CreateAnd(X, Mask);
1202 return ICmpInst::Create(Instruction::ICmp, Pred, Masked, Zero);
1203}
1204
1205/// Fold equality-comparison between zero and any (maybe truncated) right-shift
1206/// by one-less-than-bitwidth into a sign test on the original value.
1208 Instruction *Val;
1209 CmpPredicate Pred;
1210 if (!I.isEquality() || !match(&I, m_ICmp(Pred, m_Instruction(Val), m_Zero())))
1211 return nullptr;
1212
1213 Value *X;
1214 Type *XTy;
1215
1216 Constant *C;
1217 if (match(Val, m_TruncOrSelf(m_Shr(m_Value(X), m_Constant(C))))) {
1218 XTy = X->getType();
1219 unsigned XBitWidth = XTy->getScalarSizeInBits();
1221 APInt(XBitWidth, XBitWidth - 1))))
1222 return nullptr;
1223 } else if (isa<BinaryOperator>(Val) &&
1225 cast<BinaryOperator>(Val), SQ.getWithInstruction(Val),
1226 /*AnalyzeForSignBitExtraction=*/true))) {
1227 XTy = X->getType();
1228 } else
1229 return nullptr;
1230
1231 return ICmpInst::Create(Instruction::ICmp,
1235}
1236
1237// Handle icmp pred X, 0
1239 CmpInst::Predicate Pred = Cmp.getPredicate();
1240 if (!match(Cmp.getOperand(1), m_Zero()))
1241 return nullptr;
1242
1243 // (icmp sgt smin(PosA, B) 0) -> (icmp sgt B 0)
1244 if (Pred == ICmpInst::ICMP_SGT) {
1245 Value *A, *B;
1246 if (match(Cmp.getOperand(0), m_SMin(m_Value(A), m_Value(B)))) {
1248 return new ICmpInst(Pred, B, Cmp.getOperand(1));
1250 return new ICmpInst(Pred, A, Cmp.getOperand(1));
1251 }
1252 }
1253
1255 return New;
1256
1257 // Given:
1258 // icmp eq/ne (urem %x, %y), 0
1259 // Iff %x has 0 or 1 bits set, and %y has at least 2 bits set, omit 'urem':
1260 // icmp eq/ne %x, 0
1261 Value *X, *Y;
1262 if (match(Cmp.getOperand(0), m_URem(m_Value(X), m_Value(Y))) &&
1263 ICmpInst::isEquality(Pred)) {
1264 KnownBits XKnown = computeKnownBits(X, &Cmp);
1265 KnownBits YKnown = computeKnownBits(Y, &Cmp);
1266 if (XKnown.countMaxPopulation() == 1 && YKnown.countMinPopulation() >= 2)
1267 return new ICmpInst(Pred, X, Cmp.getOperand(1));
1268 }
1269
1270 // (icmp eq/ne (mul X Y)) -> (icmp eq/ne X/Y) if we know about whether X/Y are
1271 // odd/non-zero/there is no overflow.
1272 if (match(Cmp.getOperand(0), m_Mul(m_Value(X), m_Value(Y))) &&
1273 ICmpInst::isEquality(Pred)) {
1274
1275 KnownBits XKnown = computeKnownBits(X, &Cmp);
1276 // if X % 2 != 0
1277 // (icmp eq/ne Y)
1278 if (XKnown.countMaxTrailingZeros() == 0)
1279 return new ICmpInst(Pred, Y, Cmp.getOperand(1));
1280
1281 KnownBits YKnown = computeKnownBits(Y, &Cmp);
1282 // if Y % 2 != 0
1283 // (icmp eq/ne X)
1284 if (YKnown.countMaxTrailingZeros() == 0)
1285 return new ICmpInst(Pred, X, Cmp.getOperand(1));
1286
1287 auto *BO0 = cast<OverflowingBinaryOperator>(Cmp.getOperand(0));
1288 if (BO0->hasNoUnsignedWrap() || BO0->hasNoSignedWrap()) {
1289 const SimplifyQuery Q = SQ.getWithInstruction(&Cmp);
1290 // `isKnownNonZero` does more analysis than just `!KnownBits.One.isZero()`
1291 // but to avoid unnecessary work, first just if this is an obvious case.
1292
1293 // if X non-zero and NoOverflow(X * Y)
1294 // (icmp eq/ne Y)
1295 if (!XKnown.One.isZero() || isKnownNonZero(X, Q))
1296 return new ICmpInst(Pred, Y, Cmp.getOperand(1));
1297
1298 // if Y non-zero and NoOverflow(X * Y)
1299 // (icmp eq/ne X)
1300 if (!YKnown.One.isZero() || isKnownNonZero(Y, Q))
1301 return new ICmpInst(Pred, X, Cmp.getOperand(1));
1302 }
1303 // Note, we are skipping cases:
1304 // if Y % 2 != 0 AND X % 2 != 0
1305 // (false/true)
1306 // if X non-zero and Y non-zero and NoOverflow(X * Y)
1307 // (false/true)
1308 // Those can be simplified later as we would have already replaced the (icmp
1309 // eq/ne (mul X, Y)) with (icmp eq/ne X/Y) and if X/Y is known non-zero that
1310 // will fold to a constant elsewhere.
1311 }
1312
1313 // (icmp eq/ne f(X), 0) -> (icmp eq/ne X, 0)
1314 // where f(X) == 0 if and only if X == 0
1315 if (ICmpInst::isEquality(Pred))
1316 if (Value *Stripped = stripNullTest(Cmp.getOperand(0)))
1317 return new ICmpInst(Pred, Stripped,
1318 Constant::getNullValue(Stripped->getType()));
1319
1320 return nullptr;
1321}
1322
1323/// Fold icmp eq (num + mask) & ~mask, num
1324/// to
1325/// icmp eq (and num, mask), 0
1326/// Where mask is a low bit mask.
1328 Value *Num;
1329 CmpPredicate Pred;
1330 const APInt *Mask, *Neg;
1331
1332 if (!match(&Cmp,
1333 m_c_ICmp(Pred, m_Value(Num),
1335 m_LowBitMask(Mask))),
1336 m_APInt(Neg))))))
1337 return nullptr;
1338
1339 if (*Neg != ~*Mask)
1340 return nullptr;
1341
1342 if (!ICmpInst::isEquality(Pred))
1343 return nullptr;
1344
1345 // Create new icmp eq (num & mask), 0
1346 auto *NewAnd = Builder.CreateAnd(Num, *Mask);
1347 auto *Zero = Constant::getNullValue(Num->getType());
1348
1349 return new ICmpInst(Pred, NewAnd, Zero);
1350}
1351
1352/// Fold icmp Pred X, C.
1353/// TODO: This code structure does not make sense. The saturating add fold
1354/// should be moved to some other helper and extended as noted below (it is also
1355/// possible that code has been made unnecessary - do we canonicalize IR to
1356/// overflow/saturating intrinsics or not?).
1358 // Match the following pattern, which is a common idiom when writing
1359 // overflow-safe integer arithmetic functions. The source performs an addition
1360 // in wider type and explicitly checks for overflow using comparisons against
1361 // INT_MIN and INT_MAX. Simplify by using the sadd_with_overflow intrinsic.
1362 //
1363 // TODO: This could probably be generalized to handle other overflow-safe
1364 // operations if we worked out the formulas to compute the appropriate magic
1365 // constants.
1366 //
1367 // sum = a + b
1368 // if (sum+128 >u 255) ... -> llvm.sadd.with.overflow.i8
1369 CmpInst::Predicate Pred = Cmp.getPredicate();
1370 Value *Op0 = Cmp.getOperand(0), *Op1 = Cmp.getOperand(1);
1371 Value *A, *B;
1372 ConstantInt *CI, *CI2; // I = icmp ugt (add (add A, B), CI2), CI
1373 if (Pred == ICmpInst::ICMP_UGT && match(Op1, m_ConstantInt(CI)) &&
1374 match(Op0, m_Add(m_Add(m_Value(A), m_Value(B)), m_ConstantInt(CI2))))
1375 if (Instruction *Res = processUGT_ADDCST_ADD(Cmp, A, B, CI2, CI, *this))
1376 return Res;
1377
1378 // icmp(phi(C1, C2, ...), C) -> phi(icmp(C1, C), icmp(C2, C), ...).
1379 Constant *C = dyn_cast<Constant>(Op1);
1380 if (!C)
1381 return nullptr;
1382
1383 if (auto *Phi = dyn_cast<PHINode>(Op0))
1384 if (all_of(Phi->operands(), [](Value *V) { return isa<Constant>(V); })) {
1386 for (Value *V : Phi->incoming_values()) {
1387 Constant *Res =
1388 ConstantFoldCompareInstOperands(Pred, cast<Constant>(V), C, DL);
1389 if (!Res)
1390 return nullptr;
1391 Ops.push_back(Res);
1392 }
1394 PHINode *NewPhi = Builder.CreatePHI(Cmp.getType(), Phi->getNumOperands());
1395 for (auto [V, Pred] : zip(Ops, Phi->blocks()))
1396 NewPhi->addIncoming(V, Pred);
1397 return replaceInstUsesWith(Cmp, NewPhi);
1398 }
1399
1401 return R;
1402
1403 return nullptr;
1404}
1405
1406/// Canonicalize icmp instructions based on dominating conditions.
1408 // We already checked simple implication in InstSimplify, only handle complex
1409 // cases here.
1410 Value *X = Cmp.getOperand(0), *Y = Cmp.getOperand(1);
1411 const APInt *C;
1412 if (!match(Y, m_APInt(C)))
1413 return nullptr;
1414
1415 CmpInst::Predicate Pred = Cmp.getPredicate();
1417
1418 auto handleDomCond = [&](ICmpInst::Predicate DomPred,
1419 const APInt *DomC) -> Instruction * {
1420 // We have 2 compares of a variable with constants. Calculate the constant
1421 // ranges of those compares to see if we can transform the 2nd compare:
1422 // DomBB:
1423 // DomCond = icmp DomPred X, DomC
1424 // br DomCond, CmpBB, FalseBB
1425 // CmpBB:
1426 // Cmp = icmp Pred X, C
1427 ConstantRange DominatingCR =
1428 ConstantRange::makeExactICmpRegion(DomPred, *DomC);
1429 ConstantRange Intersection = DominatingCR.intersectWith(CR);
1430 ConstantRange Difference = DominatingCR.difference(CR);
1431 if (Intersection.isEmptySet())
1432 return replaceInstUsesWith(Cmp, Builder.getFalse());
1433 if (Difference.isEmptySet())
1434 return replaceInstUsesWith(Cmp, Builder.getTrue());
1435
1436 // Canonicalizing a sign bit comparison that gets used in a branch,
1437 // pessimizes codegen by generating branch on zero instruction instead
1438 // of a test and branch. So we avoid canonicalizing in such situations
1439 // because test and branch instruction has better branch displacement
1440 // than compare and branch instruction.
1441 bool UnusedBit;
1442 bool IsSignBit = isSignBitCheck(Pred, *C, UnusedBit);
1443 if (Cmp.isEquality() || (IsSignBit && hasBranchUse(Cmp)))
1444 return nullptr;
1445
1446 // Avoid an infinite loop with min/max canonicalization.
1447 // TODO: This will be unnecessary if we canonicalize to min/max intrinsics.
1448 if (Cmp.hasOneUse() &&
1449 match(Cmp.user_back(), m_MaxOrMin(m_Value(), m_Value())))
1450 return nullptr;
1451
1452 if (const APInt *EqC = Intersection.getSingleElement())
1453 return new ICmpInst(ICmpInst::ICMP_EQ, X, Builder.getInt(*EqC));
1454 if (const APInt *NeC = Difference.getSingleElement())
1455 return new ICmpInst(ICmpInst::ICMP_NE, X, Builder.getInt(*NeC));
1456 return nullptr;
1457 };
1458
1459 for (BranchInst *BI : DC.conditionsFor(X)) {
1460 CmpPredicate DomPred;
1461 const APInt *DomC;
1462 if (!match(BI->getCondition(),
1463 m_ICmp(DomPred, m_Specific(X), m_APInt(DomC))))
1464 continue;
1465
1466 BasicBlockEdge Edge0(BI->getParent(), BI->getSuccessor(0));
1467 if (DT.dominates(Edge0, Cmp.getParent())) {
1468 if (auto *V = handleDomCond(DomPred, DomC))
1469 return V;
1470 } else {
1471 BasicBlockEdge Edge1(BI->getParent(), BI->getSuccessor(1));
1472 if (DT.dominates(Edge1, Cmp.getParent()))
1473 if (auto *V =
1474 handleDomCond(CmpInst::getInversePredicate(DomPred), DomC))
1475 return V;
1476 }
1477 }
1478
1479 return nullptr;
1480}
1481
1482/// Fold icmp (trunc X), C.
1484 TruncInst *Trunc,
1485 const APInt &C) {
1486 ICmpInst::Predicate Pred = Cmp.getPredicate();
1487 Value *X = Trunc->getOperand(0);
1488 Type *SrcTy = X->getType();
1489 unsigned DstBits = Trunc->getType()->getScalarSizeInBits(),
1490 SrcBits = SrcTy->getScalarSizeInBits();
1491
1492 // Match (icmp pred (trunc nuw/nsw X), C)
1493 // Which we can convert to (icmp pred X, (sext/zext C))
1494 if (shouldChangeType(Trunc->getType(), SrcTy)) {
1495 if (Trunc->hasNoSignedWrap())
1496 return new ICmpInst(Pred, X, ConstantInt::get(SrcTy, C.sext(SrcBits)));
1497 if (!Cmp.isSigned() && Trunc->hasNoUnsignedWrap())
1498 return new ICmpInst(Pred, X, ConstantInt::get(SrcTy, C.zext(SrcBits)));
1499 }
1500
1501 if (C.isOne() && C.getBitWidth() > 1) {
1502 // icmp slt trunc(signum(V)) 1 --> icmp slt V, 1
1503 Value *V = nullptr;
1504 if (Pred == ICmpInst::ICMP_SLT && match(X, m_Signum(m_Value(V))))
1505 return new ICmpInst(ICmpInst::ICMP_SLT, V,
1506 ConstantInt::get(V->getType(), 1));
1507 }
1508
1509 // TODO: Handle any shifted constant by subtracting trailing zeros.
1510 // TODO: Handle non-equality predicates.
1511 Value *Y;
1512 if (Cmp.isEquality() && match(X, m_Shl(m_One(), m_Value(Y)))) {
1513 // (trunc (1 << Y) to iN) == 0 --> Y u>= N
1514 // (trunc (1 << Y) to iN) != 0 --> Y u< N
1515 if (C.isZero()) {
1516 auto NewPred = (Pred == Cmp.ICMP_EQ) ? Cmp.ICMP_UGE : Cmp.ICMP_ULT;
1517 return new ICmpInst(NewPred, Y, ConstantInt::get(SrcTy, DstBits));
1518 }
1519 // (trunc (1 << Y) to iN) == 2**C --> Y == C
1520 // (trunc (1 << Y) to iN) != 2**C --> Y != C
1521 if (C.isPowerOf2())
1522 return new ICmpInst(Pred, Y, ConstantInt::get(SrcTy, C.logBase2()));
1523 }
1524
1525 if (Cmp.isEquality() && Trunc->hasOneUse()) {
1526 // Canonicalize to a mask and wider compare if the wide type is suitable:
1527 // (trunc X to i8) == C --> (X & 0xff) == (zext C)
1528 if (!SrcTy->isVectorTy() && shouldChangeType(DstBits, SrcBits)) {
1529 Constant *Mask =
1530 ConstantInt::get(SrcTy, APInt::getLowBitsSet(SrcBits, DstBits));
1531 Value *And = Builder.CreateAnd(X, Mask);
1532 Constant *WideC = ConstantInt::get(SrcTy, C.zext(SrcBits));
1533 return new ICmpInst(Pred, And, WideC);
1534 }
1535
1536 // Simplify icmp eq (trunc x to i8), 42 -> icmp eq x, 42|highbits if all
1537 // of the high bits truncated out of x are known.
1538 KnownBits Known = computeKnownBits(X, &Cmp);
1539
1540 // If all the high bits are known, we can do this xform.
1541 if ((Known.Zero | Known.One).countl_one() >= SrcBits - DstBits) {
1542 // Pull in the high bits from known-ones set.
1543 APInt NewRHS = C.zext(SrcBits);
1544 NewRHS |= Known.One & APInt::getHighBitsSet(SrcBits, SrcBits - DstBits);
1545 return new ICmpInst(Pred, X, ConstantInt::get(SrcTy, NewRHS));
1546 }
1547 }
1548
1549 // Look through truncated right-shift of the sign-bit for a sign-bit check:
1550 // trunc iN (ShOp >> ShAmtC) to i[N - ShAmtC] < 0 --> ShOp < 0
1551 // trunc iN (ShOp >> ShAmtC) to i[N - ShAmtC] > -1 --> ShOp > -1
1552 Value *ShOp;
1553 uint64_t ShAmt;
1554 bool TrueIfSigned;
1555 if (isSignBitCheck(Pred, C, TrueIfSigned) &&
1556 match(X, m_Shr(m_Value(ShOp), m_ConstantInt(ShAmt))) &&
1557 DstBits == SrcBits - ShAmt) {
1558 return TrueIfSigned ? new ICmpInst(ICmpInst::ICMP_SLT, ShOp,
1560 : new ICmpInst(ICmpInst::ICMP_SGT, ShOp,
1562 }
1563
1564 return nullptr;
1565}
1566
1567/// Fold icmp (trunc nuw/nsw X), (trunc nuw/nsw Y).
1568/// Fold icmp (trunc nuw/nsw X), (zext/sext Y).
1571 const SimplifyQuery &Q) {
1572 Value *X, *Y;
1573 CmpPredicate Pred;
1574 bool YIsSExt = false;
1575 // Try to match icmp (trunc X), (trunc Y)
1576 if (match(&Cmp, m_ICmp(Pred, m_Trunc(m_Value(X)), m_Trunc(m_Value(Y))))) {
1577 unsigned NoWrapFlags = cast<TruncInst>(Cmp.getOperand(0))->getNoWrapKind() &
1578 cast<TruncInst>(Cmp.getOperand(1))->getNoWrapKind();
1579 if (Cmp.isSigned()) {
1580 // For signed comparisons, both truncs must be nsw.
1581 if (!(NoWrapFlags & TruncInst::NoSignedWrap))
1582 return nullptr;
1583 } else {
1584 // For unsigned and equality comparisons, either both must be nuw or
1585 // both must be nsw, we don't care which.
1586 if (!NoWrapFlags)
1587 return nullptr;
1588 }
1589
1590 if (X->getType() != Y->getType() &&
1591 (!Cmp.getOperand(0)->hasOneUse() || !Cmp.getOperand(1)->hasOneUse()))
1592 return nullptr;
1593 if (!isDesirableIntType(X->getType()->getScalarSizeInBits()) &&
1594 isDesirableIntType(Y->getType()->getScalarSizeInBits())) {
1595 std::swap(X, Y);
1596 Pred = Cmp.getSwappedPredicate(Pred);
1597 }
1598 YIsSExt = !(NoWrapFlags & TruncInst::NoUnsignedWrap);
1599 }
1600 // Try to match icmp (trunc nuw X), (zext Y)
1601 else if (!Cmp.isSigned() &&
1602 match(&Cmp, m_c_ICmp(Pred, m_NUWTrunc(m_Value(X)),
1603 m_OneUse(m_ZExt(m_Value(Y)))))) {
1604 // Can fold trunc nuw + zext for unsigned and equality predicates.
1605 }
1606 // Try to match icmp (trunc nsw X), (sext Y)
1607 else if (match(&Cmp, m_c_ICmp(Pred, m_NSWTrunc(m_Value(X)),
1609 // Can fold trunc nsw + zext/sext for all predicates.
1610 YIsSExt =
1611 isa<SExtInst>(Cmp.getOperand(0)) || isa<SExtInst>(Cmp.getOperand(1));
1612 } else
1613 return nullptr;
1614
1615 Type *TruncTy = Cmp.getOperand(0)->getType();
1616 unsigned TruncBits = TruncTy->getScalarSizeInBits();
1617
1618 // If this transform will end up changing from desirable types -> undesirable
1619 // types skip it.
1620 if (isDesirableIntType(TruncBits) &&
1621 !isDesirableIntType(X->getType()->getScalarSizeInBits()))
1622 return nullptr;
1623
1624 Value *NewY = Builder.CreateIntCast(Y, X->getType(), YIsSExt);
1625 return new ICmpInst(Pred, X, NewY);
1626}
1627
1628/// Fold icmp (xor X, Y), C.
1631 const APInt &C) {
1632 if (Instruction *I = foldICmpXorShiftConst(Cmp, Xor, C))
1633 return I;
1634
1635 Value *X = Xor->getOperand(0);
1636 Value *Y = Xor->getOperand(1);
1637 const APInt *XorC;
1638 if (!match(Y, m_APInt(XorC)))
1639 return nullptr;
1640
1641 // If this is a comparison that tests the signbit (X < 0) or (x > -1),
1642 // fold the xor.
1643 ICmpInst::Predicate Pred = Cmp.getPredicate();
1644 bool TrueIfSigned = false;
1645 if (isSignBitCheck(Cmp.getPredicate(), C, TrueIfSigned)) {
1646
1647 // If the sign bit of the XorCst is not set, there is no change to
1648 // the operation, just stop using the Xor.
1649 if (!XorC->isNegative())
1650 return replaceOperand(Cmp, 0, X);
1651
1652 // Emit the opposite comparison.
1653 if (TrueIfSigned)
1654 return new ICmpInst(ICmpInst::ICMP_SGT, X,
1655 ConstantInt::getAllOnesValue(X->getType()));
1656 else
1657 return new ICmpInst(ICmpInst::ICMP_SLT, X,
1658 ConstantInt::getNullValue(X->getType()));
1659 }
1660
1661 if (Xor->hasOneUse()) {
1662 // (icmp u/s (xor X SignMask), C) -> (icmp s/u X, (xor C SignMask))
1663 if (!Cmp.isEquality() && XorC->isSignMask()) {
1664 Pred = Cmp.getFlippedSignednessPredicate();
1665 return new ICmpInst(Pred, X, ConstantInt::get(X->getType(), C ^ *XorC));
1666 }
1667
1668 // (icmp u/s (xor X ~SignMask), C) -> (icmp s/u X, (xor C ~SignMask))
1669 if (!Cmp.isEquality() && XorC->isMaxSignedValue()) {
1670 Pred = Cmp.getFlippedSignednessPredicate();
1671 Pred = Cmp.getSwappedPredicate(Pred);
1672 return new ICmpInst(Pred, X, ConstantInt::get(X->getType(), C ^ *XorC));
1673 }
1674 }
1675
1676 // Mask constant magic can eliminate an 'xor' with unsigned compares.
1677 if (Pred == ICmpInst::ICMP_UGT) {
1678 // (xor X, ~C) >u C --> X <u ~C (when C+1 is a power of 2)
1679 if (*XorC == ~C && (C + 1).isPowerOf2())
1680 return new ICmpInst(ICmpInst::ICMP_ULT, X, Y);
1681 // (xor X, C) >u C --> X >u C (when C+1 is a power of 2)
1682 if (*XorC == C && (C + 1).isPowerOf2())
1683 return new ICmpInst(ICmpInst::ICMP_UGT, X, Y);
1684 }
1685 if (Pred == ICmpInst::ICMP_ULT) {
1686 // (xor X, -C) <u C --> X >u ~C (when C is a power of 2)
1687 if (*XorC == -C && C.isPowerOf2())
1688 return new ICmpInst(ICmpInst::ICMP_UGT, X,
1689 ConstantInt::get(X->getType(), ~C));
1690 // (xor X, C) <u C --> X >u ~C (when -C is a power of 2)
1691 if (*XorC == C && (-C).isPowerOf2())
1692 return new ICmpInst(ICmpInst::ICMP_UGT, X,
1693 ConstantInt::get(X->getType(), ~C));
1694 }
1695 return nullptr;
1696}
1697
1698/// For power-of-2 C:
1699/// ((X s>> ShiftC) ^ X) u< C --> (X + C) u< (C << 1)
1700/// ((X s>> ShiftC) ^ X) u> (C - 1) --> (X + C) u> ((C << 1) - 1)
1703 const APInt &C) {
1704 CmpInst::Predicate Pred = Cmp.getPredicate();
1705 APInt PowerOf2;
1706 if (Pred == ICmpInst::ICMP_ULT)
1707 PowerOf2 = C;
1708 else if (Pred == ICmpInst::ICMP_UGT && !C.isMaxValue())
1709 PowerOf2 = C + 1;
1710 else
1711 return nullptr;
1712 if (!PowerOf2.isPowerOf2())
1713 return nullptr;
1714 Value *X;
1715 const APInt *ShiftC;
1717 m_AShr(m_Deferred(X), m_APInt(ShiftC))))))
1718 return nullptr;
1719 uint64_t Shift = ShiftC->getLimitedValue();
1720 Type *XType = X->getType();
1721 if (Shift == 0 || PowerOf2.isMinSignedValue())
1722 return nullptr;
1723 Value *Add = Builder.CreateAdd(X, ConstantInt::get(XType, PowerOf2));
1724 APInt Bound =
1725 Pred == ICmpInst::ICMP_ULT ? PowerOf2 << 1 : ((PowerOf2 << 1) - 1);
1726 return new ICmpInst(Pred, Add, ConstantInt::get(XType, Bound));
1727}
1728
1729/// Fold icmp (and (sh X, Y), C2), C1.
// NOTE(review): extraction gap — orig lines 1730-1731 (the
// `Instruction *InstCombinerImpl::foldICmpAndShift(...)` signature) are
// missing from this chunk; only the trailing parameter lines survive.
1732 const APInt &C1,
1733 const APInt &C2) {
1734 BinaryOperator *Shift = dyn_cast<BinaryOperator>(And->getOperand(0));
1735 if (!Shift || !Shift->isShift())
1736 return nullptr;
1737
1738 // If this is: (X >> C3) & C2 != C1 (where any shift and any compare could
1739 // exist), turn it into (X & (C2 << C3)) != (C1 << C3). This happens a LOT in
1740 // code produced by the clang front-end, for bitfield access.
1741 // This seemingly simple opportunity to fold away a shift turns out to be
1742 // rather complicated. See PR17827 for details.
1743 unsigned ShiftOpcode = Shift->getOpcode();
1744 bool IsShl = ShiftOpcode == Instruction::Shl;
1745 const APInt *C3;
1746 if (match(Shift->getOperand(1), m_APInt(C3))) {
1747 APInt NewAndCst, NewCmpCst;
1748 bool AnyCmpCstBitsShiftedOut;
1749 if (ShiftOpcode == Instruction::Shl) {
1750 // For a left shift, we can fold if the comparison is not signed. We can
1751 // also fold a signed comparison if the mask value and comparison value
1752 // are not negative. These constraints may not be obvious, but we can
1753 // prove that they are correct using an SMT solver.
1754 if (Cmp.isSigned() && (C2.isNegative() || C1.isNegative()))
1755 return nullptr;
1756
// Undo the shl on the constants by shifting them right; track whether any
// set bits of C1 are lost in the process.
1757 NewCmpCst = C1.lshr(*C3);
1758 NewAndCst = C2.lshr(*C3);
1759 AnyCmpCstBitsShiftedOut = NewCmpCst.shl(*C3) != C1;
1760 } else if (ShiftOpcode == Instruction::LShr) {
1761 // For a logical right shift, we can fold if the comparison is not signed.
1762 // We can also fold a signed comparison if the shifted mask value and the
1763 // shifted comparison value are not negative. These constraints may not be
1764 // obvious, but we can prove that they are correct using an SMT solver.
1765 NewCmpCst = C1.shl(*C3);
1766 NewAndCst = C2.shl(*C3);
1767 AnyCmpCstBitsShiftedOut = NewCmpCst.lshr(*C3) != C1;
1768 if (Cmp.isSigned() && (NewAndCst.isNegative() || NewCmpCst.isNegative()))
1769 return nullptr;
1770 } else {
1771 // For an arithmetic shift, check that both constants don't use (in a
1772 // signed sense) the top bits being shifted out.
1773 assert(ShiftOpcode == Instruction::AShr && "Unknown shift opcode");
1774 NewCmpCst = C1.shl(*C3);
1775 NewAndCst = C2.shl(*C3);
1776 AnyCmpCstBitsShiftedOut = NewCmpCst.ashr(*C3) != C1;
// Unlike the shl/lshr cases, losing bits of the mask C2 here is not
// compensated for, so give up if the round-trip changes it.
1777 if (NewAndCst.ashr(*C3) != C2)
1778 return nullptr;
1779 }
1780
1781 if (AnyCmpCstBitsShiftedOut) {
1782 // If we shifted bits out, the fold is not going to work out. As a
1783 // special case, check to see if this means that the result is always
1784 // true or false now.
1785 if (Cmp.getPredicate() == ICmpInst::ICMP_EQ)
1786 return replaceInstUsesWith(Cmp, ConstantInt::getFalse(Cmp.getType()));
1787 if (Cmp.getPredicate() == ICmpInst::ICMP_NE)
1788 return replaceInstUsesWith(Cmp, ConstantInt::getTrue(Cmp.getType()));
1789 } else {
1790 Value *NewAnd = Builder.CreateAnd(
1791 Shift->getOperand(0), ConstantInt::get(And->getType(), NewAndCst));
1792 return new ICmpInst(Cmp.getPredicate(), NewAnd,
1793 ConstantInt::get(And->getType(), NewCmpCst));
1794 }
1795 }
1796
1797 // Turn ((X >> Y) & C2) == 0 into (X & (C2 << Y)) == 0. The latter is
1798 // preferable because it allows the C2 << Y expression to be hoisted out of a
1799 // loop if Y is invariant and X is not.
1800 if (Shift->hasOneUse() && C1.isZero() && Cmp.isEquality() &&
1801 !Shift->isArithmeticShift() &&
1802 ((!IsShl && C2.isOne()) || !isa<Constant>(Shift->getOperand(0)))) {
1803 // Compute C2 << Y.
// The mask is shifted in the opposite direction of the original shift so
// the test is applied to the unshifted X.
1804 Value *NewShift =
1805 IsShl ? Builder.CreateLShr(And->getOperand(1), Shift->getOperand(1))
1806 : Builder.CreateShl(And->getOperand(1), Shift->getOperand(1));
1807
1808 // Compute X & (C2 << Y).
1809 Value *NewAnd = Builder.CreateAnd(Shift->getOperand(0), NewShift);
1810 return new ICmpInst(Cmp.getPredicate(), NewAnd, Cmp.getOperand(1));
1811 }
1812
1813 return nullptr;
1814}
1815
1816/// Fold icmp (and X, C2), C1.
// NOTE(review): extraction gap — orig lines 1817-1818 (the
// `Instruction *InstCombinerImpl::foldICmpAndConstConst(...)` signature) are
// missing from this chunk; only the trailing parameter line survives.
1819 const APInt &C1) {
1820 bool isICMP_NE = Cmp.getPredicate() == ICmpInst::ICMP_NE;
1821
1822 // For vectors: icmp ne (and X, 1), 0 --> trunc X to N x i1
1823 // TODO: We canonicalize to the longer form for scalars because we have
1824 // better analysis/folds for icmp, and codegen may be better with icmp.
1825 if (isICMP_NE && Cmp.getType()->isVectorTy() && C1.isZero() &&
1826 match(And->getOperand(1), m_One()))
1827 return new TruncInst(And->getOperand(0), Cmp.getType());
1828
1829 const APInt *C2;
1830 Value *X;
1831 if (!match(And, m_And(m_Value(X), m_APInt(C2))))
1832 return nullptr;
1833
1834 // (and X, highmask) s> [0, ~highmask] --> X s> ~highmask
1835 if (Cmp.getPredicate() == ICmpInst::ICMP_SGT && C1.ule(~*C2) &&
1836 C2->isNegatedPowerOf2())
1837 return new ICmpInst(ICmpInst::ICMP_SGT, X,
1838 ConstantInt::get(X->getType(), ~*C2));
1839 // (and X, highmask) s< [1, -highmask] --> X s< -highmask
1840 if (Cmp.getPredicate() == ICmpInst::ICMP_SLT && !C1.isSignMask() &&
1841 (C1 - 1).ule(~*C2) && C2->isNegatedPowerOf2() && !C2->isSignMask())
1842 return new ICmpInst(ICmpInst::ICMP_SLT, X,
1843 ConstantInt::get(X->getType(), -*C2));
1844
1845 // Don't perform the following transforms if the AND has multiple uses
1846 if (!And->hasOneUse())
1847 return nullptr;
1848
1849 if (Cmp.isEquality() && C1.isZero()) {
1850 // Restrict this fold to single-use 'and' (PR10267).
1851 // Replace (and X, (1 << size(X)-1) != 0) with X s< 0
1852 if (C2->isSignMask()) {
1853 Constant *Zero = Constant::getNullValue(X->getType());
1854 auto NewPred = isICMP_NE ? ICmpInst::ICMP_SLT : ICmpInst::ICMP_SGE;
1855 return new ICmpInst(NewPred, X, Zero);
1856 }
1857
1858 APInt NewC2 = *C2;
1859 KnownBits Know = computeKnownBits(And->getOperand(0), And);
1860 // Set high zeros of C2 to allow matching negated power-of-2.
1861 NewC2 = *C2 | APInt::getHighBitsSet(C2->getBitWidth(),
1862 Know.countMinLeadingZeros());
1863
1864 // Restrict this fold only for single-use 'and' (PR10267).
1865 // ((%x & C) == 0) --> %x u< (-C) iff (-C) is power of two.
1866 if (NewC2.isNegatedPowerOf2()) {
1867 Constant *NegBOC = ConstantInt::get(And->getType(), -NewC2);
1868 auto NewPred = isICMP_NE ? ICmpInst::ICMP_UGE : ICmpInst::ICMP_ULT;
1869 return new ICmpInst(NewPred, X, NegBOC);
1870 }
1871 }
1872
1873 // If the LHS is an 'and' of a truncate and we can widen the and/compare to
1874 // the input width without changing the value produced, eliminate the cast:
1875 //
1876 // icmp (and (trunc W), C2), C1 -> icmp (and W, C2'), C1'
1877 //
1878 // We can do this transformation if the constants do not have their sign bits
1879 // set or if it is an equality comparison. Extending a relational comparison
1880 // when we're checking the sign bit would not work.
1881 Value *W;
1882 if (match(And->getOperand(0), m_OneUse(m_Trunc(m_Value(W)))) &&
1883 (Cmp.isEquality() || (!C1.isNegative() && !C2->isNegative()))) {
1884 // TODO: Is this a good transform for vectors? Wider types may reduce
1885 // throughput. Should this transform be limited (even for scalars) by using
1886 // shouldChangeType()?
1887 if (!Cmp.getType()->isVectorTy()) {
1888 Type *WideType = W->getType();
1889 unsigned WideScalarBits = WideType->getScalarSizeInBits();
1890 Constant *ZextC1 = ConstantInt::get(WideType, C1.zext(WideScalarBits));
1891 Constant *ZextC2 = ConstantInt::get(WideType, C2->zext(WideScalarBits));
1892 Value *NewAnd = Builder.CreateAnd(W, ZextC2, And->getName());
1893 return new ICmpInst(Cmp.getPredicate(), NewAnd, ZextC1);
1894 }
1895 }
1896
1897 if (Instruction *I = foldICmpAndShift(Cmp, And, C1, *C2))
1898 return I;
1899
1900 // (icmp pred (and (or (lshr A, B), A), 1), 0) -->
1901 // (icmp pred (and A, (or (shl 1, B), 1), 0))
1902 //
1903 // iff pred isn't signed
1904 if (!Cmp.isSigned() && C1.isZero() && And->getOperand(0)->hasOneUse() &&
1905 match(And->getOperand(1), m_One())) {
1906 Constant *One = cast<Constant>(And->getOperand(1));
1907 Value *Or = And->getOperand(0);
1908 Value *A, *B, *LShr;
1909 if (match(Or, m_Or(m_Value(LShr), m_Value(A))) &&
1910 match(LShr, m_LShr(m_Specific(A), m_Value(B)))) {
1911 unsigned UsesRemoved = 0;
1912 if (And->hasOneUse())
1913 ++UsesRemoved;
1914 if (Or->hasOneUse())
1915 ++UsesRemoved;
1916 if (LShr->hasOneUse())
1917 ++UsesRemoved;
1918
1919 // Compute A & ((1 << B) | 1)
// A constant B makes the replacement shl free to materialize, so fewer
// removed uses are required for the transform to be profitable.
1920 unsigned RequireUsesRemoved = match(B, m_ImmConstant()) ? 1 : 3;
1921 if (UsesRemoved >= RequireUsesRemoved) {
1922 Value *NewOr =
1923 Builder.CreateOr(Builder.CreateShl(One, B, LShr->getName(),
1924 /*HasNUW=*/true),
1925 One, Or->getName());
1926 Value *NewAnd = Builder.CreateAnd(A, NewOr, And->getName());
1927 return new ICmpInst(Cmp.getPredicate(), NewAnd, Cmp.getOperand(1));
1928 }
1929 }
1930 }
1931
1932 // (icmp eq (and (bitcast X to int), ExponentMask), ExponentMask) -->
1933 // llvm.is.fpclass(X, fcInf|fcNan)
1934 // (icmp ne (and (bitcast X to int), ExponentMask), ExponentMask) -->
1935 // llvm.is.fpclass(X, ~(fcInf|fcNan))
1936 // (icmp eq (and (bitcast X to int), ExponentMask), 0) -->
1937 // llvm.is.fpclass(X, fcSubnormal|fcZero)
1938 // (icmp ne (and (bitcast X to int), ExponentMask), 0) -->
1939 // llvm.is.fpclass(X, ~(fcSubnormal|fcZero))
1940 Value *V;
1941 if (!Cmp.getParent()->getParent()->hasFnAttribute(
1942 Attribute::NoImplicitFloat) &&
1943 Cmp.isEquality() &&
// NOTE(review): extraction gap — orig line 1944 (the match() binding V to
// the bitcast source of And's first operand) is missing here.
1945 Type *FPType = V->getType()->getScalarType();
1946 if (FPType->isIEEELikeFPTy() && (C1.isZero() || C1 == *C2)) {
1947 APInt ExponentMask =
1948 APFloat::getInf(FPType->getFltSemantics()).bitcastToAPInt();
1949 if (*C2 == ExponentMask) {
1950 unsigned Mask = C1.isZero()
// NOTE(review): extraction gap — orig lines 1951-1952 (the two arms of
// this ternary selecting the fp-class mask) are missing here.
1953 if (isICMP_NE)
1954 Mask = ~Mask & fcAllFlags;
1955 return replaceInstUsesWith(Cmp, Builder.createIsFPClass(V, Mask));
1956 }
1957 }
1958 }
1959
1960 return nullptr;
1961}
1962
1963/// Fold icmp (and X, Y), C.
// NOTE(review): extraction gap — orig lines 1964-1965 (the
// `Instruction *InstCombinerImpl::foldICmpAndConstant(...)` signature) are
// missing from this chunk; only the trailing parameter line survives.
1966 const APInt &C) {
// Try the all-constant-operand folds first.
1967 if (Instruction *I = foldICmpAndConstConst(Cmp, And, C))
1968 return I;
1969
1970 const ICmpInst::Predicate Pred = Cmp.getPredicate();
1971 bool TrueIfNeg;
1972 if (isSignBitCheck(Pred, C, TrueIfNeg)) {
1973 // ((X - 1) & ~X) < 0 --> X == 0
1974 // ((X - 1) & ~X) >= 0 --> X != 0
1975 Value *X;
1976 if (match(And->getOperand(0), m_Add(m_Value(X), m_AllOnes())) &&
1977 match(And->getOperand(1), m_Not(m_Specific(X)))) {
1978 auto NewPred = TrueIfNeg ? CmpInst::ICMP_EQ : CmpInst::ICMP_NE;
1979 return new ICmpInst(NewPred, X, ConstantInt::getNullValue(X->getType()));
1980 }
1981 // (X & -X) < 0 --> X == MinSignedC
1982 // (X & -X) > -1 --> X != MinSignedC
1983 if (match(And, m_c_And(m_Neg(m_Value(X)), m_Deferred(X)))) {
1984 Constant *MinSignedC = ConstantInt::get(
1985 X->getType(),
1986 APInt::getSignedMinValue(X->getType()->getScalarSizeInBits()));
1987 auto NewPred = TrueIfNeg ? CmpInst::ICMP_EQ : CmpInst::ICMP_NE;
1988 return new ICmpInst(NewPred, X, MinSignedC);
1989 }
1990 }
1991
1992 // TODO: These all require that Y is constant too, so refactor with the above.
1993
1994 // Try to optimize things like "A[i] & 42 == 0" to index computations.
1995 Value *X = And->getOperand(0);
1996 Value *Y = And->getOperand(1);
1997 if (auto *C2 = dyn_cast<ConstantInt>(Y))
1998 if (auto *LI = dyn_cast<LoadInst>(X))
1999 if (auto *GEP = dyn_cast<GetElementPtrInst>(LI->getOperand(0)))
2000 if (auto *GV = dyn_cast<GlobalVariable>(GEP->getOperand(0)))
2001 if (Instruction *Res =
2002 foldCmpLoadFromIndexedGlobal(LI, GEP, GV, Cmp, C2))
2003 return Res;
2004
2005 if (!Cmp.isEquality())
2006 return nullptr;
2007
2008 // X & -C == -C -> X > u ~C
2009 // X & -C != -C -> X <= u ~C
2010 // iff C is a power of 2
2011 if (Cmp.getOperand(1) == Y && C.isNegatedPowerOf2()) {
2012 auto NewPred =
// NOTE(review): extraction gap — orig line 2013 (the ternary selecting the
// new unsigned predicate from eq/ne) is missing here.
2014 return new ICmpInst(NewPred, X, SubOne(cast<Constant>(Cmp.getOperand(1))));
2015 }
2016
2017 // ((zext i1 X) & Y) == 0 --> !((trunc Y) & X)
2018 // ((zext i1 X) & Y) != 0 --> ((trunc Y) & X)
2019 // ((zext i1 X) & Y) == 1 --> ((trunc Y) & X)
2020 // ((zext i1 X) & Y) != 1 --> !((trunc Y) & X)
// NOTE(review): extraction gap — orig line 2021 (the match() binding X/Y to
// the zext-i1 and-operands) is missing here.
2022 X->getType()->isIntOrIntVectorTy(1) && (C.isZero() || C.isOne())) {
2023 Value *TruncY = Builder.CreateTrunc(Y, X->getType());
2024 if (C.isZero() ^ (Pred == CmpInst::ICMP_NE)) {
2025 Value *And = Builder.CreateAnd(TruncY, X);
// NOTE(review): extraction gap — orig line 2026 (the return building the
// negated form of the and) is missing here.
2027 }
2028 return BinaryOperator::CreateAnd(TruncY, X);
2029 }
2030
2031 // (icmp eq/ne (and (shl -1, X), Y), 0)
2032 // -> (icmp eq/ne (lshr Y, X), 0)
2033 // We could technically handle any C == 0 or (C < 0 && isOdd(C)) but it seems
2034 // highly unlikely the non-zero case will ever show up in code.
2035 if (C.isZero() &&
// NOTE(review): extraction gap — orig line 2036 (the match() of the
// shl(-1, X) mask pattern) is missing here.
2037 m_Value(Y))))) {
2038 Value *LShr = Builder.CreateLShr(Y, X);
2039 return new ICmpInst(Pred, LShr, Constant::getNullValue(LShr->getType()));
2040 }
2041
2042 // (icmp eq/ne (and (add A, Addend), Msk), C)
2043 // -> (icmp eq/ne (and A, Msk), (and (sub C, Addend), Msk))
2044 {
2045 Value *A;
2046 const APInt *Addend, *Msk;
2047 if (match(And, m_And(m_OneUse(m_Add(m_Value(A), m_APInt(Addend))),
2048 m_LowBitMask(Msk))) &&
2049 C.ule(*Msk)) {
// Subtracting the addend modulo the mask keeps the equality test exact
// because the low-bit mask confines all carries that matter.
2050 APInt NewComperand = (C - *Addend) & *Msk;
2051 Value *MaskA = Builder.CreateAnd(A, ConstantInt::get(A->getType(), *Msk));
2052 return new ICmpInst(Pred, MaskA,
2053 ConstantInt::get(MaskA->getType(), NewComperand));
2054 }
2055 }
2056
2057 return nullptr;
2058}
2059
2060/// Fold icmp eq/ne (or (xor/sub (X1, X2), xor/sub (X3, X4))), 0.
// NOTE(review): extraction gap — orig line 2061 (the static function
// signature, presumably `static Value *foldICmpOrXorSubChain(...)`) is
// missing from this chunk; only the trailing parameter line survives.
2062 InstCombiner::BuilderTy &Builder) {
2063 // Are we using xors or subs to bitwise check for a pair or pairs of
2064 // (in)equalities? Convert to a shorter form that has more potential to be
2065 // folded even further.
2066 // ((X1 ^/- X2) || (X3 ^/- X4)) == 0 --> (X1 == X2) && (X3 == X4)
2067 // ((X1 ^/- X2) || (X3 ^/- X4)) != 0 --> (X1 != X2) || (X3 != X4)
2068 // ((X1 ^/- X2) || (X3 ^/- X4) || (X5 ^/- X6)) == 0 -->
2069 // (X1 == X2) && (X3 == X4) && (X5 == X6)
2070 // ((X1 ^/- X2) || (X3 ^/- X4) || (X5 ^/- X6)) != 0 -->
2071 // (X1 != X2) || (X3 != X4) || (X5 != X6)
// NOTE(review): extraction gap — orig line 2072 (the declaration of
// CmpValues, the vector of operand pairs used below) is missing here.
2073 SmallVector<Value *, 16> WorkList(1, Or);
2074
// Walk the or-tree; leaves must be one-use xor or sub, otherwise the whole
// chain is rejected (any non-or, non-xor/sub node returns nullptr).
2075 while (!WorkList.empty()) {
2076 auto MatchOrOperatorArgument = [&](Value *OrOperatorArgument) {
2077 Value *Lhs, *Rhs;
2078
2079 if (match(OrOperatorArgument,
2080 m_OneUse(m_Xor(m_Value(Lhs), m_Value(Rhs))))) {
2081 CmpValues.emplace_back(Lhs, Rhs);
2082 return;
2083 }
2084
2085 if (match(OrOperatorArgument,
2086 m_OneUse(m_Sub(m_Value(Lhs), m_Value(Rhs))))) {
2087 CmpValues.emplace_back(Lhs, Rhs);
2088 return;
2089 }
2090
// Not a leaf: revisit as a (possible) nested or.
2091 WorkList.push_back(OrOperatorArgument);
2092 };
2093
2094 Value *CurrentValue = WorkList.pop_back_val();
2095 Value *OrOperatorLhs, *OrOperatorRhs;
2096
2097 if (!match(CurrentValue,
2098 m_Or(m_Value(OrOperatorLhs), m_Value(OrOperatorRhs)))) {
2099 return nullptr;
2100 }
2101
2102 MatchOrOperatorArgument(OrOperatorRhs);
2103 MatchOrOperatorArgument(OrOperatorLhs);
2104 }
2105
2106 ICmpInst::Predicate Pred = Cmp.getPredicate();
// eq-of-zero becomes a conjunction of equalities; ne becomes a disjunction.
2107 auto BOpc = Pred == CmpInst::ICMP_EQ ? Instruction::And : Instruction::Or;
2108 Value *LhsCmp = Builder.CreateICmp(Pred, CmpValues.rbegin()->first,
2109 CmpValues.rbegin()->second);
2110
2111 for (auto It = CmpValues.rbegin() + 1; It != CmpValues.rend(); ++It) {
2112 Value *RhsCmp = Builder.CreateICmp(Pred, It->first, It->second);
2113 LhsCmp = Builder.CreateBinOp(BOpc, LhsCmp, RhsCmp);
2114 }
2115
2116 return LhsCmp;
2117}
2118
2119/// Fold icmp (or X, Y), C.
// NOTE(review): extraction gap — orig lines 2120-2121 (the
// `Instruction *InstCombinerImpl::foldICmpOrConstant(...)` signature) are
// missing from this chunk; only the trailing parameter line survives.
2122 const APInt &C) {
2123 ICmpInst::Predicate Pred = Cmp.getPredicate();
2124 if (C.isOne()) {
2125 // icmp slt signum(V) 1 --> icmp slt V, 1
2126 Value *V = nullptr;
2127 if (Pred == ICmpInst::ICMP_SLT && match(Or, m_Signum(m_Value(V))))
2128 return new ICmpInst(ICmpInst::ICMP_SLT, V,
2129 ConstantInt::get(V->getType(), 1));
2130 }
2131
2132 Value *OrOp0 = Or->getOperand(0), *OrOp1 = Or->getOperand(1);
2133
2134 // (icmp eq/ne (or disjoint x, C0), C1)
2135 // -> (icmp eq/ne x, C0^C1)
2136 if (Cmp.isEquality() && match(OrOp1, m_ImmConstant()) &&
2137 cast<PossiblyDisjointInst>(Or)->isDisjoint()) {
2138 Value *NewC =
2139 Builder.CreateXor(OrOp1, ConstantInt::get(OrOp1->getType(), C));
2140 return new ICmpInst(Pred, OrOp0, NewC);
2141 }
2142
2143 const APInt *MaskC;
2144 if (match(OrOp1, m_APInt(MaskC)) && Cmp.isEquality()) {
2145 if (*MaskC == C && (C + 1).isPowerOf2()) {
2146 // X | C == C --> X <=u C
2147 // X | C != C --> X >u C
2148 // iff C+1 is a power of 2 (C is a bitmask of the low bits)
// NOTE(review): extraction gap — orig line 2149 (the assignment remapping
// Pred from eq/ne to ule/ugt) is missing here.
2150 return new ICmpInst(Pred, OrOp0, OrOp1);
2151 }
2152
2153 // More general: canonicalize 'equality with set bits mask' to
2154 // 'equality with clear bits mask'.
2155 // (X | MaskC) == C --> (X & ~MaskC) == C ^ MaskC
2156 // (X | MaskC) != C --> (X & ~MaskC) != C ^ MaskC
2157 if (Or->hasOneUse()) {
2158 Value *And = Builder.CreateAnd(OrOp0, ~(*MaskC));
2159 Constant *NewC = ConstantInt::get(Or->getType(), C ^ (*MaskC));
2160 return new ICmpInst(Pred, And, NewC);
2161 }
2162 }
2163
2164 // (X | (X-1)) s< 0 --> X s< 1
2165 // (X | (X-1)) s> -1 --> X s> 0
2166 Value *X;
2167 bool TrueIfSigned;
2168 if (isSignBitCheck(Pred, C, TrueIfSigned) &&
// NOTE(review): extraction gap — orig line 2169 (the match() of the
// or(X, X-1) pattern binding X) is missing here.
2170 auto NewPred = TrueIfSigned ? ICmpInst::ICMP_SLT : ICmpInst::ICMP_SGT;
2171 Constant *NewC = ConstantInt::get(X->getType(), TrueIfSigned ? 1 : 0);
2172 return new ICmpInst(NewPred, X, NewC);
2173 }
2174
2175 const APInt *OrC;
2176 // icmp(X | OrC, C) --> icmp(X, 0)
2177 if (C.isNonNegative() && match(Or, m_Or(m_Value(X), m_APInt(OrC)))) {
2178 switch (Pred) {
2179 // X | OrC s< C --> X s< 0 iff OrC s>= C s>= 0
2180 case ICmpInst::ICMP_SLT:
2181 // X | OrC s>= C --> X s>= 0 iff OrC s>= C s>= 0
2182 case ICmpInst::ICMP_SGE:
2183 if (OrC->sge(C))
2184 return new ICmpInst(Pred, X, ConstantInt::getNullValue(X->getType()));
2185 break;
2186 // X | OrC s<= C --> X s< 0 iff OrC s> C s>= 0
2187 case ICmpInst::ICMP_SLE:
2188 // X | OrC s> C --> X s>= 0 iff OrC s> C s>= 0
2189 case ICmpInst::ICMP_SGT:
2190 if (OrC->sgt(C))
// NOTE(review): extraction gap — orig line 2191 (the return constructing
// the flipped-strictness compare against zero) is missing here.
2192 ConstantInt::getNullValue(X->getType()));
2193 break;
2194 default:
2195 break;
2196 }
2197 }
2198
2199 if (!Cmp.isEquality() || !C.isZero() || !Or->hasOneUse())
2200 return nullptr;
2201
2202 Value *P, *Q;
// NOTE(review): extraction gap — orig line 2203 (the match() of
// or(ptrtoint P, ptrtoint Q) opening this block) is missing here.
2204 // Simplify icmp eq (or (ptrtoint P), (ptrtoint Q)), 0
2205 // -> and (icmp eq P, null), (icmp eq Q, null).
2206 Value *CmpP =
2207 Builder.CreateICmp(Pred, P, ConstantInt::getNullValue(P->getType()));
2208 Value *CmpQ =
// NOTE(review): extraction gap — orig line 2209 (the CreateICmp of Q
// against null) is missing here.
2210 auto BOpc = Pred == CmpInst::ICMP_EQ ? Instruction::And : Instruction::Or;
2211 return BinaryOperator::Create(BOpc, CmpP, CmpQ);
2212 }
2213
2214 if (Value *V = foldICmpOrXorSubChain(Cmp, Or, Builder))
2215 return replaceInstUsesWith(Cmp, V);
2216
2217 return nullptr;
2218}
2219
2220/// Fold icmp (mul X, Y), C.
// NOTE(review): extraction gap — orig lines 2221-2222 (the
// `Instruction *InstCombinerImpl::foldICmpMulConstant(...)` signature) are
// missing from this chunk; only the trailing parameter line survives.
2223 const APInt &C) {
2224 ICmpInst::Predicate Pred = Cmp.getPredicate();
2225 Type *MulTy = Mul->getType();
2226 Value *X = Mul->getOperand(0);
2227
2228 // If there's no overflow:
2229 // X * X == 0 --> X == 0
2230 // X * X != 0 --> X != 0
2231 if (Cmp.isEquality() && C.isZero() && X == Mul->getOperand(1) &&
2232 (Mul->hasNoUnsignedWrap() || Mul->hasNoSignedWrap()))
2233 return new ICmpInst(Pred, X, ConstantInt::getNullValue(MulTy));
2234
2235 const APInt *MulC;
2236 if (!match(Mul->getOperand(1), m_APInt(MulC)))
2237 return nullptr;
2238
2239 // If this is a test of the sign bit and the multiply is sign-preserving with
2240 // a constant operand, use the multiply LHS operand instead:
2241 // (X * +MulC) < 0 --> X < 0
2242 // (X * -MulC) < 0 --> X > 0
2243 if (isSignTest(Pred, C) && Mul->hasNoSignedWrap()) {
2244 if (MulC->isNegative())
2245 Pred = ICmpInst::getSwappedPredicate(Pred);
2246 return new ICmpInst(Pred, X, ConstantInt::getNullValue(MulTy));
2247 }
2248
2249 if (MulC->isZero())
2250 return nullptr;
2251
2252 // If the multiply does not wrap or the constant is odd, try to divide the
2253 // compare constant by the multiplication factor.
2254 if (Cmp.isEquality()) {
2255 // (mul nsw X, MulC) eq/ne C --> X eq/ne C /s MulC
2256 if (Mul->hasNoSignedWrap() && C.srem(*MulC).isZero()) {
2257 Constant *NewC = ConstantInt::get(MulTy, C.sdiv(*MulC));
2258 return new ICmpInst(Pred, X, NewC);
2259 }
2260
2261 // C % MulC == 0 is weaker than we could use if MulC is odd because it
2262 // correct to transform if MulC * N == C including overflow. I.e with i8
2263 // (icmp eq (mul X, 5), 101) -> (icmp eq X, 225) but since 101 % 5 != 0, we
2264 // miss that case.
2265 if (C.urem(*MulC).isZero()) {
2266 // (mul nuw X, MulC) eq/ne C --> X eq/ne C /u MulC
2267 // (mul X, OddC) eq/ne N * C --> X eq/ne N
// An odd multiplier is invertible mod 2^n, so the fold is valid even if
// the mul may wrap.
2268 if ((*MulC & 1).isOne() || Mul->hasNoUnsignedWrap()) {
2269 Constant *NewC = ConstantInt::get(MulTy, C.udiv(*MulC));
2270 return new ICmpInst(Pred, X, NewC);
2271 }
2272 }
2273 }
2274
2275 // With a matching no-overflow guarantee, fold the constants:
2276 // (X * MulC) < C --> X < (C / MulC)
2277 // (X * MulC) > C --> X > (C / MulC)
2278 // TODO: Assert that Pred is not equal to SGE, SLE, UGE, ULE?
2279 Constant *NewC = nullptr;
2280 if (Mul->hasNoSignedWrap() && ICmpInst::isSigned(Pred)) {
2281 // MININT / -1 --> overflow.
2282 if (C.isMinSignedValue() && MulC->isAllOnes())
2283 return nullptr;
2284 if (MulC->isNegative())
2285 Pred = ICmpInst::getSwappedPredicate(Pred);
2286
2287 if (Pred == ICmpInst::ICMP_SLT || Pred == ICmpInst::ICMP_SGE) {
2288 NewC = ConstantInt::get(
// NOTE(review): extraction gap — orig line 2289 (the rounding signed-div
// argument of this ConstantInt::get call) is missing here.
2290 } else {
2291 assert((Pred == ICmpInst::ICMP_SLE || Pred == ICmpInst::ICMP_SGT) &&
2292 "Unexpected predicate");
2293 NewC = ConstantInt::get(
// NOTE(review): extraction gap — orig line 2294 (the rounding signed-div
// argument of this ConstantInt::get call) is missing here.
2295 }
2296 } else if (Mul->hasNoUnsignedWrap() && ICmpInst::isUnsigned(Pred)) {
2297 if (Pred == ICmpInst::ICMP_ULT || Pred == ICmpInst::ICMP_UGE) {
2298 NewC = ConstantInt::get(
// NOTE(review): extraction gap — orig line 2299 (the rounding unsigned-div
// argument of this ConstantInt::get call) is missing here.
2300 } else {
2301 assert((Pred == ICmpInst::ICMP_ULE || Pred == ICmpInst::ICMP_UGT) &&
2302 "Unexpected predicate");
2303 NewC = ConstantInt::get(
// NOTE(review): extraction gap — orig line 2304 (the rounding unsigned-div
// argument of this ConstantInt::get call) is missing here.
2305 }
2306 }
2307
2308 return NewC ? new ICmpInst(Pred, X, NewC) : nullptr;
2309}
2310
2311/// Fold icmp (shl nuw C2, Y), C.
// NOTE(review): extraction gap — orig line 2312 (the
// `Instruction *InstCombinerImpl::foldICmpShlLHSC(...)` signature, as named
// by its caller below) is missing from this chunk.
2313 const APInt &C) {
2314 Value *Y;
2315 const APInt *C2;
2316 if (!match(Shl, m_NUWShl(m_APInt(C2), m_Value(Y))))
2317 return nullptr;
2318
2319 Type *ShiftType = Shl->getType();
2320 unsigned TypeBits = C.getBitWidth();
2321 ICmpInst::Predicate Pred = Cmp.getPredicate();
2322 if (Cmp.isUnsigned()) {
2323 if (C2->isZero() || C2->ugt(C))
2324 return nullptr;
2325 APInt Div, Rem;
2326 APInt::udivrem(C, *C2, Div, Rem);
2327 bool CIsPowerOf2 = Rem.isZero() && Div.isPowerOf2();
2328
2329 // (1 << Y) pred C -> Y pred Log2(C)
2330 if (!CIsPowerOf2) {
2331 // (1 << Y) < 30 -> Y <= 4
2332 // (1 << Y) <= 30 -> Y <= 4
2333 // (1 << Y) >= 30 -> Y > 4
2334 // (1 << Y) > 30 -> Y > 4
// When C/C2 isn't an exact power of two, relax strict-< to <= (and >= to >)
// so the log2 comparison below stays exact.
2335 if (Pred == ICmpInst::ICMP_ULT)
2336 Pred = ICmpInst::ICMP_ULE;
2337 else if (Pred == ICmpInst::ICMP_UGE)
2338 Pred = ICmpInst::ICMP_UGT;
2339 }
2340
2341 unsigned CLog2 = Div.logBase2();
2342 return new ICmpInst(Pred, Y, ConstantInt::get(ShiftType, CLog2));
2343 } else if (Cmp.isSigned() && C2->isOne()) {
// For signed compares of (1 << Y), only the Y == bitwidth-1 case (the sign
// bit) can make the result negative.
2344 Constant *BitWidthMinusOne = ConstantInt::get(ShiftType, TypeBits - 1);
2345 // (1 << Y) > 0 -> Y != 31
2346 // (1 << Y) > C -> Y != 31 if C is negative.
2347 if (Pred == ICmpInst::ICMP_SGT && C.sle(0))
2348 return new ICmpInst(ICmpInst::ICMP_NE, Y, BitWidthMinusOne);
2349
2350 // (1 << Y) < 0 -> Y == 31
2351 // (1 << Y) < 1 -> Y == 31
2352 // (1 << Y) < C -> Y == 31 if C is negative and not signed min.
2353 // Exclude signed min by subtracting 1 and lower the upper bound to 0.
2354 if (Pred == ICmpInst::ICMP_SLT && (C - 1).sle(0))
2355 return new ICmpInst(ICmpInst::ICMP_EQ, Y, BitWidthMinusOne);
2356 }
2357
2358 return nullptr;
2359}
2360
2361/// Fold icmp (shl X, Y), C.
// NOTE(review): extraction gap — orig line 2362 (the first line of the
// `Instruction *InstCombinerImpl::foldICmpShlConstant(...)` signature) is
// missing from this chunk.
2363 BinaryOperator *Shl,
2364 const APInt &C) {
2365 const APInt *ShiftVal;
2366 if (Cmp.isEquality() && match(Shl->getOperand(0), m_APInt(ShiftVal)))
2367 return foldICmpShlConstConst(Cmp, Shl->getOperand(1), C, *ShiftVal);
2368
2369 ICmpInst::Predicate Pred = Cmp.getPredicate();
2370 // (icmp pred (shl nuw&nsw X, Y), Csle0)
2371 // -> (icmp pred X, Csle0)
2372 //
2373 // The idea is the nuw/nsw essentially freeze the sign bit for the shift op
2374 // so X's must be what is used.
2375 if (C.sle(0) && Shl->hasNoUnsignedWrap() && Shl->hasNoSignedWrap())
2376 return new ICmpInst(Pred, Shl->getOperand(0), Cmp.getOperand(1));
2377
2378 // (icmp eq/ne (shl nuw|nsw X, Y), 0)
2379 // -> (icmp eq/ne X, 0)
2380 if (ICmpInst::isEquality(Pred) && C.isZero() &&
2381 (Shl->hasNoUnsignedWrap() || Shl->hasNoSignedWrap()))
2382 return new ICmpInst(Pred, Shl->getOperand(0), Cmp.getOperand(1));
2383
2384 // (icmp slt (shl nsw X, Y), 0/1)
2385 // -> (icmp slt X, 0/1)
2386 // (icmp sgt (shl nsw X, Y), 0/-1)
2387 // -> (icmp sgt X, 0/-1)
2388 //
2389 // NB: sge/sle with a constant will canonicalize to sgt/slt.
2390 if (Shl->hasNoSignedWrap() &&
2391 (Pred == ICmpInst::ICMP_SGT || Pred == ICmpInst::ICMP_SLT))
2392 if (C.isZero() || (Pred == ICmpInst::ICMP_SGT ? C.isAllOnes() : C.isOne()))
2393 return new ICmpInst(Pred, Shl->getOperand(0), Cmp.getOperand(1));
2394
2395 const APInt *ShiftAmt;
2396 if (!match(Shl->getOperand(1), m_APInt(ShiftAmt)))
// The shift amount is variable: try the constant-LHS folds instead.
2397 return foldICmpShlLHSC(Cmp, Shl, C);
2398
2399 // Check that the shift amount is in range. If not, don't perform undefined
2400 // shifts. When the shift is visited, it will be simplified.
2401 unsigned TypeBits = C.getBitWidth();
2402 if (ShiftAmt->uge(TypeBits))
2403 return nullptr;
2404
2405 Value *X = Shl->getOperand(0);
2406 Type *ShType = Shl->getType();
2407
2408 // NSW guarantees that we are only shifting out sign bits from the high bits,
2409 // so we can ASHR the compare constant without needing a mask and eliminate
2410 // the shift.
2411 if (Shl->hasNoSignedWrap()) {
2412 if (Pred == ICmpInst::ICMP_SGT) {
2413 // icmp Pred (shl nsw X, ShiftAmt), C --> icmp Pred X, (C >>s ShiftAmt)
2414 APInt ShiftedC = C.ashr(*ShiftAmt);
2415 return new ICmpInst(Pred, X, ConstantInt::get(ShType, ShiftedC));
2416 }
2417 if ((Pred == ICmpInst::ICMP_EQ || Pred == ICmpInst::ICMP_NE) &&
2418 C.ashr(*ShiftAmt).shl(*ShiftAmt) == C) {
2419 APInt ShiftedC = C.ashr(*ShiftAmt);
2420 return new ICmpInst(Pred, X, ConstantInt::get(ShType, ShiftedC));
2421 }
2422 if (Pred == ICmpInst::ICMP_SLT) {
2423 // SLE is the same as above, but SLE is canonicalized to SLT, so convert:
2424 // (X << S) <=s C is equiv to X <=s (C >> S) for all C
2425 // (X << S) <s (C + 1) is equiv to X <s (C >> S) + 1 if C <s SMAX
2426 // (X << S) <s C is equiv to X <s ((C - 1) >> S) + 1 if C >s SMIN
2427 assert(!C.isMinSignedValue() && "Unexpected icmp slt");
2428 APInt ShiftedC = (C - 1).ashr(*ShiftAmt) + 1;
2429 return new ICmpInst(Pred, X, ConstantInt::get(ShType, ShiftedC));
2430 }
2431 }
2432
2433 // NUW guarantees that we are only shifting out zero bits from the high bits,
2434 // so we can LSHR the compare constant without needing a mask and eliminate
2435 // the shift.
2436 if (Shl->hasNoUnsignedWrap()) {
2437 if (Pred == ICmpInst::ICMP_UGT) {
2438 // icmp Pred (shl nuw X, ShiftAmt), C --> icmp Pred X, (C >>u ShiftAmt)
2439 APInt ShiftedC = C.lshr(*ShiftAmt);
2440 return new ICmpInst(Pred, X, ConstantInt::get(ShType, ShiftedC));
2441 }
2442 if ((Pred == ICmpInst::ICMP_EQ || Pred == ICmpInst::ICMP_NE) &&
2443 C.lshr(*ShiftAmt).shl(*ShiftAmt) == C) {
2444 APInt ShiftedC = C.lshr(*ShiftAmt);
2445 return new ICmpInst(Pred, X, ConstantInt::get(ShType, ShiftedC));
2446 }
2447 if (Pred == ICmpInst::ICMP_ULT) {
2448 // ULE is the same as above, but ULE is canonicalized to ULT, so convert:
2449 // (X << S) <=u C is equiv to X <=u (C >> S) for all C
2450 // (X << S) <u (C + 1) is equiv to X <u (C >> S) + 1 if C <u ~0u
2451 // (X << S) <u C is equiv to X <u ((C - 1) >> S) + 1 if C >u 0
2452 assert(C.ugt(0) && "ult 0 should have been eliminated");
2453 APInt ShiftedC = (C - 1).lshr(*ShiftAmt) + 1;
2454 return new ICmpInst(Pred, X, ConstantInt::get(ShType, ShiftedC));
2455 }
2456 }
2457
2458 if (Cmp.isEquality() && Shl->hasOneUse()) {
2459 // Strength-reduce the shift into an 'and'.
2460 Constant *Mask = ConstantInt::get(
2461 ShType,
2462 APInt::getLowBitsSet(TypeBits, TypeBits - ShiftAmt->getZExtValue()));
2463 Value *And = Builder.CreateAnd(X, Mask, Shl->getName() + ".mask");
2464 Constant *LShrC = ConstantInt::get(ShType, C.lshr(*ShiftAmt));
2465 return new ICmpInst(Pred, And, LShrC);
2466 }
2467
2468 // Otherwise, if this is a comparison of the sign bit, simplify to and/test.
2469 bool TrueIfSigned = false;
2470 if (Shl->hasOneUse() && isSignBitCheck(Pred, C, TrueIfSigned)) {
2471 // (X << 31) <s 0 --> (X & 1) != 0
2472 Constant *Mask = ConstantInt::get(
2473 ShType,
2474 APInt::getOneBitSet(TypeBits, TypeBits - ShiftAmt->getZExtValue() - 1))
;
2475 Value *And = Builder.CreateAnd(X, Mask, Shl->getName() + ".mask");
2476 return new ICmpInst(TrueIfSigned ? ICmpInst::ICMP_NE : ICmpInst::ICMP_EQ,
2477 And, Constant::getNullValue(ShType));
2478 }
2479
2480 // Simplify 'shl' inequality test into 'and' equality test.
2481 if (Cmp.isUnsigned() && Shl->hasOneUse()) {
2482 // (X l<< C2) u<=/u> C1 iff C1+1 is power of two -> X & (~C1 l>> C2) ==/!= 0
2483 if ((C + 1).isPowerOf2() &&
2484 (Pred == ICmpInst::ICMP_ULE || Pred == ICmpInst::ICMP_UGT)) {
2485 Value *And = Builder.CreateAnd(X, (~C).lshr(ShiftAmt->getZExtValue()));
2486 return new ICmpInst(Pred == ICmpInst::ICMP_ULE ? ICmpInst::ICMP_EQ
// NOTE(review): extraction gap — orig line 2487 (the ':' arm of this
// ternary, presumably selecting ICMP_NE) is missing here.
2488 And, Constant::getNullValue(ShType));
2489 }
2490 // (X l<< C2) u</u>= C1 iff C1 is power of two -> X & (-C1 l>> C2) ==/!= 0
2491 if (C.isPowerOf2() &&
2492 (Pred == ICmpInst::ICMP_ULT || Pred == ICmpInst::ICMP_UGE)) {
2493 Value *And =
2494 Builder.CreateAnd(X, (~(C - 1)).lshr(ShiftAmt->getZExtValue()));
2495 return new ICmpInst(Pred == ICmpInst::ICMP_ULT ? ICmpInst::ICMP_EQ
// NOTE(review): extraction gap — orig line 2496 (the ':' arm of this
// ternary, presumably selecting ICMP_NE) is missing here.
2497 And, Constant::getNullValue(ShType));
2498 }
2499 }
2500
2501 // Transform (icmp pred iM (shl iM %v, N), C)
2502 // -> (icmp pred i(M-N) (trunc %v iM to i(M-N)), (trunc (C>>N))
2503 // Transform the shl to a trunc if (trunc (C>>N)) has no loss and M-N.
2504 // This enables us to get rid of the shift in favor of a trunc that may be
2505 // free on the target. It has the additional benefit of comparing to a
2506 // smaller constant that may be more target-friendly.
2507 unsigned Amt = ShiftAmt->getLimitedValue(TypeBits - 1);
2508 if (Shl->hasOneUse() && Amt != 0 &&
2509 shouldChangeType(ShType->getScalarSizeInBits(), TypeBits - Amt)) {
2510 ICmpInst::Predicate CmpPred = Pred;
2511 APInt RHSC = C;
2512
2513 if (RHSC.countr_zero() < Amt && ICmpInst::isStrictPredicate(CmpPred)) {
2514 // Try the flipped strictness predicate.
2515 // e.g.:
2516 // icmp ult i64 (shl X, 32), 8589934593 ->
2517 // icmp ule i64 (shl X, 32), 8589934592 ->
2518 // icmp ule i32 (trunc X, i32), 2 ->
2519 // icmp ult i32 (trunc X, i32), 3
2520 if (auto FlippedStrictness = getFlippedStrictnessPredicateAndConstant(
2521 Pred, ConstantInt::get(ShType->getContext(), C))) {
2522 CmpPred = FlippedStrictness->first;
2523 RHSC = cast<ConstantInt>(FlippedStrictness->second)->getValue();
2524 }
2525 }
2526
2527 if (RHSC.countr_zero() >= Amt) {
2528 Type *TruncTy = ShType->getWithNewBitWidth(TypeBits - Amt);
2529 Constant *NewC =
2530 ConstantInt::get(TruncTy, RHSC.ashr(*ShiftAmt).trunc(TypeBits - Amt));
2531 return new ICmpInst(CmpPred,
2532 Builder.CreateTrunc(X, TruncTy, "", /*IsNUW=*/false,
2533 Shl->hasNoSignedWrap()),
2534 NewC);
2535 }
2536 }
2537
2538 return nullptr;
2539}
2540
2541/// Fold icmp ({al}shr X, Y), C.
2543 BinaryOperator *Shr,
2544 const APInt &C) {
2545 // An exact shr only shifts out zero bits, so:
2546 // icmp eq/ne (shr X, Y), 0 --> icmp eq/ne X, 0
2547 Value *X = Shr->getOperand(0);
2548 CmpInst::Predicate Pred = Cmp.getPredicate();
2549 if (Cmp.isEquality() && Shr->isExact() && C.isZero())
2550 return new ICmpInst(Pred, X, Cmp.getOperand(1));
2551
2552 bool IsAShr = Shr->getOpcode() == Instruction::AShr;
2553 const APInt *ShiftValC;
2554 if (match(X, m_APInt(ShiftValC))) {
2555 if (Cmp.isEquality())
2556 return foldICmpShrConstConst(Cmp, Shr->getOperand(1), C, *ShiftValC);
2557
2558 // (ShiftValC >> Y) >s -1 --> Y != 0 with ShiftValC < 0
2559 // (ShiftValC >> Y) <s 0 --> Y == 0 with ShiftValC < 0
2560 bool TrueIfSigned;
2561 if (!IsAShr && ShiftValC->isNegative() &&
2562 isSignBitCheck(Pred, C, TrueIfSigned))
2563 return new ICmpInst(TrueIfSigned ? CmpInst::ICMP_EQ : CmpInst::ICMP_NE,
2564 Shr->getOperand(1),
2565 ConstantInt::getNullValue(X->getType()));
2566
2567 // If the shifted constant is a power-of-2, test the shift amount directly:
2568 // (ShiftValC >> Y) >u C --> X <u (LZ(C) - LZ(ShiftValC))
2569 // (ShiftValC >> Y) <u C --> X >=u (LZ(C-1) - LZ(ShiftValC))
2570 if (!IsAShr && ShiftValC->isPowerOf2() &&
2571 (Pred == CmpInst::ICMP_UGT || Pred == CmpInst::ICMP_ULT)) {
2572 bool IsUGT = Pred == CmpInst::ICMP_UGT;
2573 assert(ShiftValC->uge(C) && "Expected simplify of compare");
2574 assert((IsUGT || !C.isZero()) && "Expected X u< 0 to simplify");
2575
2576 unsigned CmpLZ = IsUGT ? C.countl_zero() : (C - 1).countl_zero();
2577 unsigned ShiftLZ = ShiftValC->countl_zero();
2578 Constant *NewC = ConstantInt::get(Shr->getType(), CmpLZ - ShiftLZ);
2579 auto NewPred = IsUGT ? CmpInst::ICMP_ULT : CmpInst::ICMP_UGE;
2580 return new ICmpInst(NewPred, Shr->getOperand(1), NewC);
2581 }
2582 }
2583
2584 const APInt *ShiftAmtC;
2585 if (!match(Shr->getOperand(1), m_APInt(ShiftAmtC)))
2586 return nullptr;
2587
2588 // Check that the shift amount is in range. If not, don't perform undefined
2589 // shifts. When the shift is visited it will be simplified.
2590 unsigned TypeBits = C.getBitWidth();
2591 unsigned ShAmtVal = ShiftAmtC->getLimitedValue(TypeBits);
2592 if (ShAmtVal >= TypeBits || ShAmtVal == 0)
2593 return nullptr;
2594
2595 bool IsExact = Shr->isExact();
2596 Type *ShrTy = Shr->getType();
2597 // TODO: If we could guarantee that InstSimplify would handle all of the
2598 // constant-value-based preconditions in the folds below, then we could assert
2599 // those conditions rather than checking them. This is difficult because of
2600 // undef/poison (PR34838).
2601 if (IsAShr && Shr->hasOneUse()) {
2602 if (IsExact && (Pred == CmpInst::ICMP_SLT || Pred == CmpInst::ICMP_ULT) &&
2603 (C - 1).isPowerOf2() && C.countLeadingZeros() > ShAmtVal) {
2604 // When C - 1 is a power of two and the transform can be legally
2605 // performed, prefer this form so the produced constant is close to a
2606 // power of two.
2607 // icmp slt/ult (ashr exact X, ShAmtC), C
2608 // --> icmp slt/ult X, (C - 1) << ShAmtC) + 1
2609 APInt ShiftedC = (C - 1).shl(ShAmtVal) + 1;
2610 return new ICmpInst(Pred, X, ConstantInt::get(ShrTy, ShiftedC));
2611 }
2612 if (IsExact || Pred == CmpInst::ICMP_SLT || Pred == CmpInst::ICMP_ULT) {
2613 // When ShAmtC can be shifted losslessly:
2614 // icmp PRED (ashr exact X, ShAmtC), C --> icmp PRED X, (C << ShAmtC)
2615 // icmp slt/ult (ashr X, ShAmtC), C --> icmp slt/ult X, (C << ShAmtC)
2616 APInt ShiftedC = C.shl(ShAmtVal);
2617 if (ShiftedC.ashr(ShAmtVal) == C)
2618 return new ICmpInst(Pred, X, ConstantInt::get(ShrTy, ShiftedC));
2619 }
2620 if (Pred == CmpInst::ICMP_SGT) {
2621 // icmp sgt (ashr X, ShAmtC), C --> icmp sgt X, ((C + 1) << ShAmtC) - 1
2622 APInt ShiftedC = (C + 1).shl(ShAmtVal) - 1;
2623 if (!C.isMaxSignedValue() && !(C + 1).shl(ShAmtVal).isMinSignedValue() &&
2624 (ShiftedC + 1).ashr(ShAmtVal) == (C + 1))
2625 return new ICmpInst(Pred, X, ConstantInt::get(ShrTy, ShiftedC));
2626 }
2627 if (Pred == CmpInst::ICMP_UGT) {
2628 // icmp ugt (ashr X, ShAmtC), C --> icmp ugt X, ((C + 1) << ShAmtC) - 1
2629 // 'C + 1 << ShAmtC' can overflow as a signed number, so the 2nd
2630 // clause accounts for that pattern.
2631 APInt ShiftedC = (C + 1).shl(ShAmtVal) - 1;
2632 if ((ShiftedC + 1).ashr(ShAmtVal) == (C + 1) ||
2633 (C + 1).shl(ShAmtVal).isMinSignedValue())
2634 return new ICmpInst(Pred, X, ConstantInt::get(ShrTy, ShiftedC));
2635 }
2636
2637 // If the compare constant has significant bits above the lowest sign-bit,
2638 // then convert an unsigned cmp to a test of the sign-bit:
2639 // (ashr X, ShiftC) u> C --> X s< 0
2640 // (ashr X, ShiftC) u< C --> X s> -1
2641 if (C.getBitWidth() > 2 && C.getNumSignBits() <= ShAmtVal) {
2642 if (Pred == CmpInst::ICMP_UGT) {
2643 return new ICmpInst(CmpInst::ICMP_SLT, X,
2645 }
2646 if (Pred == CmpInst::ICMP_ULT) {
2647 return new ICmpInst(CmpInst::ICMP_SGT, X,
2649 }
2650 }
2651 } else if (!IsAShr) {
2652 if (Pred == CmpInst::ICMP_ULT || (Pred == CmpInst::ICMP_UGT && IsExact)) {
2653 // icmp ult (lshr X, ShAmtC), C --> icmp ult X, (C << ShAmtC)
2654 // icmp ugt (lshr exact X, ShAmtC), C --> icmp ugt X, (C << ShAmtC)
2655 APInt ShiftedC = C.shl(ShAmtVal);
2656 if (ShiftedC.lshr(ShAmtVal) == C)
2657 return new ICmpInst(Pred, X, ConstantInt::get(ShrTy, ShiftedC));
2658 }
2659 if (Pred == CmpInst::ICMP_UGT) {
2660 // icmp ugt (lshr X, ShAmtC), C --> icmp ugt X, ((C + 1) << ShAmtC) - 1
2661 APInt ShiftedC = (C + 1).shl(ShAmtVal) - 1;
2662 if ((ShiftedC + 1).lshr(ShAmtVal) == (C + 1))
2663 return new ICmpInst(Pred, X, ConstantInt::get(ShrTy, ShiftedC));
2664 }
2665 }
2666
2667 if (!Cmp.isEquality())
2668 return nullptr;
2669
2670 // Handle equality comparisons of shift-by-constant.
2671
2672 // If the comparison constant changes with the shift, the comparison cannot
2673 // succeed (bits of the comparison constant cannot match the shifted value).
2674 // This should be known by InstSimplify and already be folded to true/false.
2675 assert(((IsAShr && C.shl(ShAmtVal).ashr(ShAmtVal) == C) ||
2676 (!IsAShr && C.shl(ShAmtVal).lshr(ShAmtVal) == C)) &&
2677 "Expected icmp+shr simplify did not occur.");
2678
2679 // If the bits shifted out are known zero, compare the unshifted value:
2680 // (X & 4) >> 1 == 2 --> (X & 4) == 4.
2681 if (Shr->isExact())
2682 return new ICmpInst(Pred, X, ConstantInt::get(ShrTy, C << ShAmtVal));
2683
2684 if (C.isZero()) {
2685 // == 0 is u< 1.
2686 if (Pred == CmpInst::ICMP_EQ)
2687 return new ICmpInst(CmpInst::ICMP_ULT, X,
2688 ConstantInt::get(ShrTy, (C + 1).shl(ShAmtVal)));
2689 else
2690 return new ICmpInst(CmpInst::ICMP_UGT, X,
2691 ConstantInt::get(ShrTy, (C + 1).shl(ShAmtVal) - 1));
2692 }
2693
2694 if (Shr->hasOneUse()) {
2695 // Canonicalize the shift into an 'and':
2696 // icmp eq/ne (shr X, ShAmt), C --> icmp eq/ne (and X, HiMask), (C << ShAmt)
2697 APInt Val(APInt::getHighBitsSet(TypeBits, TypeBits - ShAmtVal));
2698 Constant *Mask = ConstantInt::get(ShrTy, Val);
2699 Value *And = Builder.CreateAnd(X, Mask, Shr->getName() + ".mask");
2700 return new ICmpInst(Pred, And, ConstantInt::get(ShrTy, C << ShAmtVal));
2701 }
2702
2703 return nullptr;
2704}
2705
2707 BinaryOperator *SRem,
2708 const APInt &C) {
2709 const ICmpInst::Predicate Pred = Cmp.getPredicate();
2710 if (Pred == ICmpInst::ICMP_UGT || Pred == ICmpInst::ICMP_ULT) {
2711 // Canonicalize unsigned predicates to signed:
2712 // (X s% DivisorC) u> C -> (X s% DivisorC) s< 0
2713 // iff (C s< 0 ? ~C : C) u>= abs(DivisorC)-1
2714 // (X s% DivisorC) u< C+1 -> (X s% DivisorC) s> -1
2715 // iff (C+1 s< 0 ? ~C : C) u>= abs(DivisorC)-1
2716
2717 const APInt *DivisorC;
2718 if (!match(SRem->getOperand(1), m_APInt(DivisorC)))
2719 return nullptr;
2720
2721 APInt NormalizedC = C;
2722 if (Pred == ICmpInst::ICMP_ULT) {
2723 assert(!NormalizedC.isZero() &&
2724 "ult X, 0 should have been simplified already.");
2725 --NormalizedC;
2726 }
2727 if (C.isNegative())
2728 NormalizedC.flipAllBits();
2729 assert(!DivisorC->isZero() &&
2730 "srem X, 0 should have been simplified already.");
2731 if (!NormalizedC.uge(DivisorC->abs() - 1))
2732 return nullptr;
2733
2734 Type *Ty = SRem->getType();
2735 if (Pred == ICmpInst::ICMP_UGT)
2736 return new ICmpInst(ICmpInst::ICMP_SLT, SRem,
2738 return new ICmpInst(ICmpInst::ICMP_SGT, SRem,
2740 }
2741 // Match an 'is positive' or 'is negative' comparison of remainder by a
2742 // constant power-of-2 value:
2743 // (X % pow2C) sgt/slt 0
2744 if (Pred != ICmpInst::ICMP_SGT && Pred != ICmpInst::ICMP_SLT &&
2745 Pred != ICmpInst::ICMP_EQ && Pred != ICmpInst::ICMP_NE)
2746 return nullptr;
2747
2748 // TODO: The one-use check is standard because we do not typically want to
2749 // create longer instruction sequences, but this might be a special-case
2750 // because srem is not good for analysis or codegen.
2751 if (!SRem->hasOneUse())
2752 return nullptr;
2753
2754 const APInt *DivisorC;
2755 if (!match(SRem->getOperand(1), m_Power2(DivisorC)))
2756 return nullptr;
2757
2758 // For cmp_sgt/cmp_slt only zero valued C is handled.
2759 // For cmp_eq/cmp_ne only positive valued C is handled.
2760 if (((Pred == ICmpInst::ICMP_SGT || Pred == ICmpInst::ICMP_SLT) &&
2761 !C.isZero()) ||
2762 ((Pred == ICmpInst::ICMP_EQ || Pred == ICmpInst::ICMP_NE) &&
2763 !C.isStrictlyPositive()))
2764 return nullptr;
2765
2766 // Mask off the sign bit and the modulo bits (low-bits).
2767 Type *Ty = SRem->getType();
2769 Constant *MaskC = ConstantInt::get(Ty, SignMask | (*DivisorC - 1));
2770 Value *And = Builder.CreateAnd(SRem->getOperand(0), MaskC);
2771
2772 if (Pred == ICmpInst::ICMP_EQ || Pred == ICmpInst::ICMP_NE)
2773 return new ICmpInst(Pred, And, ConstantInt::get(Ty, C));
2774
2775 // For 'is positive?' check that the sign-bit is clear and at least 1 masked
2776 // bit is set. Example:
2777 // (i8 X % 32) s> 0 --> (X & 159) s> 0
2778 if (Pred == ICmpInst::ICMP_SGT)
2780
2781 // For 'is negative?' check that the sign-bit is set and at least 1 masked
2782 // bit is set. Example:
2783 // (i16 X % 4) s< 0 --> (X & 32771) u> 32768
2784 return new ICmpInst(ICmpInst::ICMP_UGT, And, ConstantInt::get(Ty, SignMask));
2785}
2786
2787/// Fold icmp (udiv X, Y), C.
2789 BinaryOperator *UDiv,
2790 const APInt &C) {
2791 ICmpInst::Predicate Pred = Cmp.getPredicate();
2792 Value *X = UDiv->getOperand(0);
2793 Value *Y = UDiv->getOperand(1);
2794 Type *Ty = UDiv->getType();
2795
2796 const APInt *C2;
2797 if (!match(X, m_APInt(C2)))
2798 return nullptr;
2799
2800 assert(*C2 != 0 && "udiv 0, X should have been simplified already.");
2801
2802 // (icmp ugt (udiv C2, Y), C) -> (icmp ule Y, C2/(C+1))
2803 if (Pred == ICmpInst::ICMP_UGT) {
2804 assert(!C.isMaxValue() &&
2805 "icmp ugt X, UINT_MAX should have been simplified already.");
2806 return new ICmpInst(ICmpInst::ICMP_ULE, Y,
2807 ConstantInt::get(Ty, C2->udiv(C + 1)));
2808 }
2809
2810 // (icmp ult (udiv C2, Y), C) -> (icmp ugt Y, C2/C)
2811 if (Pred == ICmpInst::ICMP_ULT) {
2812 assert(C != 0 && "icmp ult X, 0 should have been simplified already.");
2813 return new ICmpInst(ICmpInst::ICMP_UGT, Y,
2814 ConstantInt::get(Ty, C2->udiv(C)));
2815 }
2816
2817 return nullptr;
2818}
2819
2820/// Fold icmp ({su}div X, Y), C.
2822 BinaryOperator *Div,
2823 const APInt &C) {
2824 ICmpInst::Predicate Pred = Cmp.getPredicate();
2825 Value *X = Div->getOperand(0);
2826 Value *Y = Div->getOperand(1);
2827 Type *Ty = Div->getType();
2828 bool DivIsSigned = Div->getOpcode() == Instruction::SDiv;
2829
2830 // If unsigned division and the compare constant is bigger than
2831 // UMAX/2 (negative), there's only one pair of values that satisfies an
2832 // equality check, so eliminate the division:
2833 // (X u/ Y) == C --> (X == C) && (Y == 1)
2834 // (X u/ Y) != C --> (X != C) || (Y != 1)
2835 // Similarly, if signed division and the compare constant is exactly SMIN:
2836 // (X s/ Y) == SMIN --> (X == SMIN) && (Y == 1)
2837 // (X s/ Y) != SMIN --> (X != SMIN) || (Y != 1)
2838 if (Cmp.isEquality() && Div->hasOneUse() && C.isSignBitSet() &&
2839 (!DivIsSigned || C.isMinSignedValue())) {
2840 Value *XBig = Builder.CreateICmp(Pred, X, ConstantInt::get(Ty, C));
2841 Value *YOne = Builder.CreateICmp(Pred, Y, ConstantInt::get(Ty, 1));
2842 auto Logic = Pred == ICmpInst::ICMP_EQ ? Instruction::And : Instruction::Or;
2843 return BinaryOperator::Create(Logic, XBig, YOne);
2844 }
2845
2846 // Fold: icmp pred ([us]div X, C2), C -> range test
2847 // Fold this div into the comparison, producing a range check.
2848 // Determine, based on the divide type, what the range is being
2849 // checked. If there is an overflow on the low or high side, remember
2850 // it, otherwise compute the range [low, hi) bounding the new value.
2851 // See: InsertRangeTest above for the kinds of replacements possible.
2852 const APInt *C2;
2853 if (!match(Y, m_APInt(C2)))
2854 return nullptr;
2855
2856 // FIXME: If the operand types don't match the type of the divide
2857 // then don't attempt this transform. The code below doesn't have the
2858 // logic to deal with a signed divide and an unsigned compare (and
2859 // vice versa). This is because (x /s C2) <s C produces different
2860 // results than (x /s C2) <u C or (x /u C2) <s C or even
2861 // (x /u C2) <u C. Simply casting the operands and result won't
2862 // work. :( The if statement below tests that condition and bails
2863 // if it finds it.
2864 if (!Cmp.isEquality() && DivIsSigned != Cmp.isSigned())
2865 return nullptr;
2866
2867 // The ProdOV computation fails on divide by 0 and divide by -1. Cases with
2868 // INT_MIN will also fail if the divisor is 1. Although folds of all these
2869 // division-by-constant cases should be present, we can not assert that they
2870 // have happened before we reach this icmp instruction.
2871 if (C2->isZero() || C2->isOne() || (DivIsSigned && C2->isAllOnes()))
2872 return nullptr;
2873
2874 // Compute Prod = C * C2. We are essentially solving an equation of
2875 // form X / C2 = C. We solve for X by multiplying C2 and C.
2876 // By solving for X, we can turn this into a range check instead of computing
2877 // a divide.
2878 APInt Prod = C * *C2;
2879
2880 // Determine if the product overflows by seeing if the product is not equal to
2881 // the divide. Make sure we do the same kind of divide as in the LHS
2882 // instruction that we're folding.
2883 bool ProdOV = (DivIsSigned ? Prod.sdiv(*C2) : Prod.udiv(*C2)) != C;
2884
2885 // If the division is known to be exact, then there is no remainder from the
2886 // divide, so the covered range size is unit, otherwise it is the divisor.
2887 APInt RangeSize = Div->isExact() ? APInt(C2->getBitWidth(), 1) : *C2;
2888
2889 // Figure out the interval that is being checked. For example, a comparison
2890 // like "X /u 5 == 0" is really checking that X is in the interval [0, 5).
2891 // Compute this interval based on the constants involved and the signedness of
2892 // the compare/divide. This computes a half-open interval, keeping track of
2893 // whether either value in the interval overflows. After analysis each
2894 // overflow variable is set to 0 if it's corresponding bound variable is valid
2895 // -1 if overflowed off the bottom end, or +1 if overflowed off the top end.
2896 int LoOverflow = 0, HiOverflow = 0;
2897 APInt LoBound, HiBound;
2898
2899 if (!DivIsSigned) { // udiv
2900 // e.g. X/5 op 3 --> [15, 20)
2901 LoBound = Prod;
2902 HiOverflow = LoOverflow = ProdOV;
2903 if (!HiOverflow) {
2904 // If this is not an exact divide, then many values in the range collapse
2905 // to the same result value.
2906 HiOverflow = addWithOverflow(HiBound, LoBound, RangeSize, false);
2907 }
2908 } else if (C2->isStrictlyPositive()) { // Divisor is > 0.
2909 if (C.isZero()) { // (X / pos) op 0
2910 // Can't overflow. e.g. X/2 op 0 --> [-1, 2)
2911 LoBound = -(RangeSize - 1);
2912 HiBound = RangeSize;
2913 } else if (C.isStrictlyPositive()) { // (X / pos) op pos
2914 LoBound = Prod; // e.g. X/5 op 3 --> [15, 20)
2915 HiOverflow = LoOverflow = ProdOV;
2916 if (!HiOverflow)
2917 HiOverflow = addWithOverflow(HiBound, Prod, RangeSize, true);
2918 } else { // (X / pos) op neg
2919 // e.g. X/5 op -3 --> [-15-4, -15+1) --> [-19, -14)
2920 HiBound = Prod + 1;
2921 LoOverflow = HiOverflow = ProdOV ? -1 : 0;
2922 if (!LoOverflow) {
2923 APInt DivNeg = -RangeSize;
2924 LoOverflow = addWithOverflow(LoBound, HiBound, DivNeg, true) ? -1 : 0;
2925 }
2926 }
2927 } else if (C2->isNegative()) { // Divisor is < 0.
2928 if (Div->isExact())
2929 RangeSize.negate();
2930 if (C.isZero()) { // (X / neg) op 0
2931 // e.g. X/-5 op 0 --> [-4, 5)
2932 LoBound = RangeSize + 1;
2933 HiBound = -RangeSize;
2934 if (HiBound == *C2) { // -INTMIN = INTMIN
2935 HiOverflow = 1; // [INTMIN+1, overflow)
2936 HiBound = APInt(); // e.g. X/INTMIN = 0 --> X > INTMIN
2937 }
2938 } else if (C.isStrictlyPositive()) { // (X / neg) op pos
2939 // e.g. X/-5 op 3 --> [-19, -14)
2940 HiBound = Prod + 1;
2941 HiOverflow = LoOverflow = ProdOV ? -1 : 0;
2942 if (!LoOverflow)
2943 LoOverflow =
2944 addWithOverflow(LoBound, HiBound, RangeSize, true) ? -1 : 0;
2945 } else { // (X / neg) op neg
2946 LoBound = Prod; // e.g. X/-5 op -3 --> [15, 20)
2947 LoOverflow = HiOverflow = ProdOV;
2948 if (!HiOverflow)
2949 HiOverflow = subWithOverflow(HiBound, Prod, RangeSize, true);
2950 }
2951
2952 // Dividing by a negative swaps the condition. LT <-> GT
2953 Pred = ICmpInst::getSwappedPredicate(Pred);
2954 }
2955
2956 switch (Pred) {
2957 default:
2958 llvm_unreachable("Unhandled icmp predicate!");
2959 case ICmpInst::ICMP_EQ:
2960 if (LoOverflow && HiOverflow)
2961 return replaceInstUsesWith(Cmp, Builder.getFalse());
2962 if (HiOverflow)
2963 return new ICmpInst(DivIsSigned ? ICmpInst::ICMP_SGE : ICmpInst::ICMP_UGE,
2964 X, ConstantInt::get(Ty, LoBound));
2965 if (LoOverflow)
2966 return new ICmpInst(DivIsSigned ? ICmpInst::ICMP_SLT : ICmpInst::ICMP_ULT,
2967 X, ConstantInt::get(Ty, HiBound));
2968 return replaceInstUsesWith(
2969 Cmp, insertRangeTest(X, LoBound, HiBound, DivIsSigned, true));
2970 case ICmpInst::ICMP_NE:
2971 if (LoOverflow && HiOverflow)
2972 return replaceInstUsesWith(Cmp, Builder.getTrue());
2973 if (HiOverflow)
2974 return new ICmpInst(DivIsSigned ? ICmpInst::ICMP_SLT : ICmpInst::ICMP_ULT,
2975 X, ConstantInt::get(Ty, LoBound));
2976 if (LoOverflow)
2977 return new ICmpInst(DivIsSigned ? ICmpInst::ICMP_SGE : ICmpInst::ICMP_UGE,
2978 X, ConstantInt::get(Ty, HiBound));
2979 return replaceInstUsesWith(
2980 Cmp, insertRangeTest(X, LoBound, HiBound, DivIsSigned, false));
2981 case ICmpInst::ICMP_ULT:
2982 case ICmpInst::ICMP_SLT:
2983 if (LoOverflow == +1) // Low bound is greater than input range.
2984 return replaceInstUsesWith(Cmp, Builder.getTrue());
2985 if (LoOverflow == -1) // Low bound is less than input range.
2986 return replaceInstUsesWith(Cmp, Builder.getFalse());
2987 return new ICmpInst(Pred, X, ConstantInt::get(Ty, LoBound));
2988 case ICmpInst::ICMP_UGT:
2989 case ICmpInst::ICMP_SGT:
2990 if (HiOverflow == +1) // High bound greater than input range.
2991 return replaceInstUsesWith(Cmp, Builder.getFalse());
2992 if (HiOverflow == -1) // High bound less than input range.
2993 return replaceInstUsesWith(Cmp, Builder.getTrue());
2994 if (Pred == ICmpInst::ICMP_UGT)
2995 return new ICmpInst(ICmpInst::ICMP_UGE, X, ConstantInt::get(Ty, HiBound));
2996 return new ICmpInst(ICmpInst::ICMP_SGE, X, ConstantInt::get(Ty, HiBound));
2997 }
2998
2999 return nullptr;
3000}
3001
3002/// Fold icmp (sub X, Y), C.
3005 const APInt &C) {
3006 Value *X = Sub->getOperand(0), *Y = Sub->getOperand(1);
3007 ICmpInst::Predicate Pred = Cmp.getPredicate();
3008 Type *Ty = Sub->getType();
3009
3010 // (SubC - Y) == C) --> Y == (SubC - C)
3011 // (SubC - Y) != C) --> Y != (SubC - C)
3012 Constant *SubC;
3013 if (Cmp.isEquality() && match(X, m_ImmConstant(SubC))) {
3014 return new ICmpInst(Pred, Y,
3015 ConstantExpr::getSub(SubC, ConstantInt::get(Ty, C)));
3016 }
3017
3018 // (icmp P (sub nuw|nsw C2, Y), C) -> (icmp swap(P) Y, C2-C)
3019 const APInt *C2;
3020 APInt SubResult;
3021 ICmpInst::Predicate SwappedPred = Cmp.getSwappedPredicate();
3022 bool HasNSW = Sub->hasNoSignedWrap();
3023 bool HasNUW = Sub->hasNoUnsignedWrap();
3024 if (match(X, m_APInt(C2)) &&
3025 ((Cmp.isUnsigned() && HasNUW) || (Cmp.isSigned() && HasNSW)) &&
3026 !subWithOverflow(SubResult, *C2, C, Cmp.isSigned()))
3027 return new ICmpInst(SwappedPred, Y, ConstantInt::get(Ty, SubResult));
3028
3029 // X - Y == 0 --> X == Y.
3030 // X - Y != 0 --> X != Y.
3031 // TODO: We allow this with multiple uses as long as the other uses are not
3032 // in phis. The phi use check is guarding against a codegen regression
3033 // for a loop test. If the backend could undo this (and possibly
3034 // subsequent transforms), we would not need this hack.
3035 if (Cmp.isEquality() && C.isZero() &&
3036 none_of((Sub->users()), [](const User *U) { return isa<PHINode>(U); }))
3037 return new ICmpInst(Pred, X, Y);
3038
3039 // The following transforms are only worth it if the only user of the subtract
3040 // is the icmp.
3041 // TODO: This is an artificial restriction for all of the transforms below
3042 // that only need a single replacement icmp. Can these use the phi test
3043 // like the transform above here?
3044 if (!Sub->hasOneUse())
3045 return nullptr;
3046
3047 if (Sub->hasNoSignedWrap()) {
3048 // (icmp sgt (sub nsw X, Y), -1) -> (icmp sge X, Y)
3049 if (Pred == ICmpInst::ICMP_SGT && C.isAllOnes())
3050 return new ICmpInst(ICmpInst::ICMP_SGE, X, Y);
3051
3052 // (icmp sgt (sub nsw X, Y), 0) -> (icmp sgt X, Y)
3053 if (Pred == ICmpInst::ICMP_SGT && C.isZero())
3054 return new ICmpInst(ICmpInst::ICMP_SGT, X, Y);
3055
3056 // (icmp slt (sub nsw X, Y), 0) -> (icmp slt X, Y)
3057 if (Pred == ICmpInst::ICMP_SLT && C.isZero())
3058 return new ICmpInst(ICmpInst::ICMP_SLT, X, Y);
3059
3060 // (icmp slt (sub nsw X, Y), 1) -> (icmp sle X, Y)
3061 if (Pred == ICmpInst::ICMP_SLT && C.isOne())
3062 return new ICmpInst(ICmpInst::ICMP_SLE, X, Y);
3063 }
3064
3065 if (!match(X, m_APInt(C2)))
3066 return nullptr;
3067
3068 // C2 - Y <u C -> (Y | (C - 1)) == C2
3069 // iff (C2 & (C - 1)) == C - 1 and C is a power of 2
3070 if (Pred == ICmpInst::ICMP_ULT && C.isPowerOf2() &&
3071 (*C2 & (C - 1)) == (C - 1))
3072 return new ICmpInst(ICmpInst::ICMP_EQ, Builder.CreateOr(Y, C - 1), X);
3073
3074 // C2 - Y >u C -> (Y | C) != C2
3075 // iff C2 & C == C and C + 1 is a power of 2
3076 if (Pred == ICmpInst::ICMP_UGT && (C + 1).isPowerOf2() && (*C2 & C) == C)
3077 return new ICmpInst(ICmpInst::ICMP_NE, Builder.CreateOr(Y, C), X);
3078
3079 // We have handled special cases that reduce.
3080 // Canonicalize any remaining sub to add as:
3081 // (C2 - Y) > C --> (Y + ~C2) < ~C
3082 Value *Add = Builder.CreateAdd(Y, ConstantInt::get(Ty, ~(*C2)), "notsub",
3083 HasNUW, HasNSW);
3084 return new ICmpInst(SwappedPred, Add, ConstantInt::get(Ty, ~C));
3085}
3086
3087static Value *createLogicFromTable(const std::bitset<4> &Table, Value *Op0,
3088 Value *Op1, IRBuilderBase &Builder,
3089 bool HasOneUse) {
3090 auto FoldConstant = [&](bool Val) {
3091 Constant *Res = Val ? Builder.getTrue() : Builder.getFalse();
3092 if (Op0->getType()->isVectorTy())
3094 cast<VectorType>(Op0->getType())->getElementCount(), Res);
3095 return Res;
3096 };
3097
3098 switch (Table.to_ulong()) {
3099 case 0: // 0 0 0 0
3100 return FoldConstant(false);
3101 case 1: // 0 0 0 1
3102 return HasOneUse ? Builder.CreateNot(Builder.CreateOr(Op0, Op1)) : nullptr;
3103 case 2: // 0 0 1 0
3104 return HasOneUse ? Builder.CreateAnd(Builder.CreateNot(Op0), Op1) : nullptr;
3105 case 3: // 0 0 1 1
3106 return Builder.CreateNot(Op0);
3107 case 4: // 0 1 0 0
3108 return HasOneUse ? Builder.CreateAnd(Op0, Builder.CreateNot(Op1)) : nullptr;
3109 case 5: // 0 1 0 1
3110 return Builder.CreateNot(Op1);
3111 case 6: // 0 1 1 0
3112 return Builder.CreateXor(Op0, Op1);
3113 case 7: // 0 1 1 1
3114 return HasOneUse ? Builder.CreateNot(Builder.CreateAnd(Op0, Op1)) : nullptr;
3115 case 8: // 1 0 0 0
3116 return Builder.CreateAnd(Op0, Op1);
3117 case 9: // 1 0 0 1
3118 return HasOneUse ? Builder.CreateNot(Builder.CreateXor(Op0, Op1)) : nullptr;
3119 case 10: // 1 0 1 0
3120 return Op1;
3121 case 11: // 1 0 1 1
3122 return HasOneUse ? Builder.CreateOr(Builder.CreateNot(Op0), Op1) : nullptr;
3123 case 12: // 1 1 0 0
3124 return Op0;
3125 case 13: // 1 1 0 1
3126 return HasOneUse ? Builder.CreateOr(Op0, Builder.CreateNot(Op1)) : nullptr;
3127 case 14: // 1 1 1 0
3128 return Builder.CreateOr(Op0, Op1);
3129 case 15: // 1 1 1 1
3130 return FoldConstant(true);
3131 default:
3132 llvm_unreachable("Invalid Operation");
3133 }
3134 return nullptr;
3135}
3136
3138 ICmpInst &Cmp, BinaryOperator *BO, const APInt &C) {
3139 Value *A, *B;
3140 Constant *C1, *C2, *C3, *C4;
3141 if (!(match(BO->getOperand(0),
3142 m_Select(m_Value(A), m_Constant(C1), m_Constant(C2)))) ||
3143 !match(BO->getOperand(1),
3144 m_Select(m_Value(B), m_Constant(C3), m_Constant(C4))) ||
3145 Cmp.getType() != A->getType())
3146 return nullptr;
3147
3148 std::bitset<4> Table;
3149 auto ComputeTable = [&](bool First, bool Second) -> std::optional<bool> {
3150 Constant *L = First ? C1 : C2;
3151 Constant *R = Second ? C3 : C4;
3152 if (auto *Res = ConstantFoldBinaryOpOperands(BO->getOpcode(), L, R, DL)) {
3153 auto *Val = Res->getType()->isVectorTy() ? Res->getSplatValue() : Res;
3154 if (auto *CI = dyn_cast_or_null<ConstantInt>(Val))
3155 return ICmpInst::compare(CI->getValue(), C, Cmp.getPredicate());
3156 }
3157 return std::nullopt;
3158 };
3159
3160 for (unsigned I = 0; I < 4; ++I) {
3161 bool First = (I >> 1) & 1;
3162 bool Second = I & 1;
3163 if (auto Res = ComputeTable(First, Second))
3164 Table[I] = *Res;
3165 else
3166 return nullptr;
3167 }
3168
3169 // Synthesize optimal logic.
3170 if (auto *Cond = createLogicFromTable(Table, A, B, Builder, BO->hasOneUse()))
3171 return replaceInstUsesWith(Cmp, Cond);
3172 return nullptr;
3173}
3174
/// Fold icmp (add X, Y), C.
// NOTE(review): the two signature lines of this definition (presumably
// "Instruction *InstCombinerImpl::foldICmpAddConstant(ICmpInst &Cmp,
//  BinaryOperator *Add," per upstream LLVM) were elided in this extraction —
// confirm against the repository.
                                                  const APInt &C) {
  Value *Y = Add->getOperand(1);
  Value *X = Add->getOperand(0);

  Value *Op0, *Op1;
  Instruction *Ext0, *Ext1;
  const CmpInst::Predicate Pred = Cmp.getPredicate();
  // Fold an add of two zext/sext'ed i1 values compared against a constant by
  // evaluating all four (Op0, Op1) combinations into a truth table and
  // synthesizing the equivalent boolean logic (see createLogicFromTable).
  if (match(Add,
            // NOTE(review): the matcher line binding Ext0/Op0 (the m_Add /
            // m_CombineAnd pattern) was elided in this extraction — confirm
            // against upstream.
                             m_ZExtOrSExt(m_Value(Op1))))) &&
      Op0->getType()->isIntOrIntVectorTy(1) &&
      Op1->getType()->isIntOrIntVectorTy(1)) {
    unsigned BW = C.getBitWidth();
    std::bitset<4> Table;
    // Result of "(ext Op0Val) + (ext Op1Val) pred C": zext contributes +1,
    // sext contributes -1 when the source bit is set.
    auto ComputeTable = [&](bool Op0Val, bool Op1Val) {
      APInt Res(BW, 0);
      if (Op0Val)
        Res += APInt(BW, isa<ZExtInst>(Ext0) ? 1 : -1, /*isSigned=*/true);
      if (Op1Val)
        Res += APInt(BW, isa<ZExtInst>(Ext1) ? 1 : -1, /*isSigned=*/true);
      return ICmpInst::compare(Res, C, Pred);
    };

    Table[0] = ComputeTable(false, false);
    Table[1] = ComputeTable(false, true);
    Table[2] = ComputeTable(true, false);
    Table[3] = ComputeTable(true, true);
    if (auto *Cond =
            createLogicFromTable(Table, Op0, Op1, Builder, Add->hasOneUse()))
      return replaceInstUsesWith(Cmp, Cond);
  }
  // Everything below requires a constant RHS addend and a non-equality
  // predicate (equality with add-of-constant is handled elsewhere).
  const APInt *C2;
  if (Cmp.isEquality() || !match(Y, m_APInt(C2)))
    return nullptr;

  // Fold icmp pred (add X, C2), C.
  Type *Ty = Add->getType();

  // If the add does not wrap, we can always adjust the compare by subtracting
  // the constants. Equality comparisons are handled elsewhere. SGE/SLE/UGE/ULE
  // are canonicalized to SGT/SLT/UGT/ULT.
  if ((Add->hasNoSignedWrap() &&
       (Pred == ICmpInst::ICMP_SGT || Pred == ICmpInst::ICMP_SLT)) ||
      (Add->hasNoUnsignedWrap() &&
       (Pred == ICmpInst::ICMP_UGT || Pred == ICmpInst::ICMP_ULT))) {
    bool Overflow;
    APInt NewC =
        Cmp.isSigned() ? C.ssub_ov(*C2, Overflow) : C.usub_ov(*C2, Overflow);
    // If there is overflow, the result must be true or false.
    // TODO: Can we assert there is no overflow because InstSimplify always
    // handles those cases?
    if (!Overflow)
      // icmp Pred (add nsw X, C2), C --> icmp Pred X, (C - C2)
      return new ICmpInst(Pred, X, ConstantInt::get(Ty, NewC));
  }

  // If X + C2 is provably non-negative in the signed sense, an unsigned
  // predicate can be strengthened to its signed counterpart.
  if (ICmpInst::isUnsigned(Pred) && Add->hasNoSignedWrap() &&
      C.isNonNegative() && (C - *C2).isNonNegative() &&
      computeConstantRange(X, /*ForSigned=*/true).add(*C2).isAllNonNegative())
    return new ICmpInst(ICmpInst::getSignedPredicate(Pred), X,
                        ConstantInt::get(Ty, C - *C2));

  // Express "X + C2 pred C" as a range on X; a range with a sign-mask or
  // zero endpoint collapses back into a single compare.
  auto CR = ConstantRange::makeExactICmpRegion(Pred, C).subtract(*C2);
  const APInt &Upper = CR.getUpper();
  const APInt &Lower = CR.getLower();
  if (Cmp.isSigned()) {
    if (Lower.isSignMask())
      return new ICmpInst(ICmpInst::ICMP_SLT, X, ConstantInt::get(Ty, Upper));
    if (Upper.isSignMask())
      return new ICmpInst(ICmpInst::ICMP_SGE, X, ConstantInt::get(Ty, Lower));
  } else {
    if (Lower.isMinValue())
      return new ICmpInst(ICmpInst::ICMP_ULT, X, ConstantInt::get(Ty, Upper));
    if (Upper.isMinValue())
      return new ICmpInst(ICmpInst::ICMP_UGE, X, ConstantInt::get(Ty, Lower));
  }

  // This set of folds is intentionally placed after folds that use no-wrapping
  // flags because those folds are likely better for later analysis/codegen.
  // NOTE(review): the definitions of SMax/SMin used below (presumably
  // APInt::getSignedMaxValue/getSignedMinValue of the scalar bit width) were
  // elided in this extraction — confirm against upstream.

  // Fold compare with offset to opposite sign compare if it eliminates offset:
  // (X + C2) >u C --> X <s -C2 (if C == C2 + SMAX)
  if (Pred == CmpInst::ICMP_UGT && C == *C2 + SMax)
    return new ICmpInst(ICmpInst::ICMP_SLT, X, ConstantInt::get(Ty, -(*C2)));

  // (X + C2) <u C --> X >s ~C2 (if C == C2 + SMIN)
  if (Pred == CmpInst::ICMP_ULT && C == *C2 + SMin)
    return new ICmpInst(ICmpInst::ICMP_SGT, X, ConstantInt::get(Ty, ~(*C2)));

  // (X + C2) >s C --> X <u (SMAX - C) (if C == C2 - 1)
  if (Pred == CmpInst::ICMP_SGT && C == *C2 - 1)
    return new ICmpInst(ICmpInst::ICMP_ULT, X, ConstantInt::get(Ty, SMax - C));

  // (X + C2) <s C --> X >u (C ^ SMAX) (if C == C2)
  if (Pred == CmpInst::ICMP_SLT && C == *C2)
    return new ICmpInst(ICmpInst::ICMP_UGT, X, ConstantInt::get(Ty, C ^ SMax));

  // (X + -1) <u C --> X <=u C (if X is never null)
  if (Pred == CmpInst::ICMP_ULT && C2->isAllOnes()) {
    const SimplifyQuery Q = SQ.getWithInstruction(&Cmp);
    if (llvm::isKnownNonZero(X, Q))
      return new ICmpInst(ICmpInst::ICMP_ULE, X, ConstantInt::get(Ty, C));
  }

  if (!Add->hasOneUse())
    return nullptr;

  // X+C <u C2 -> (X & -C2) == C
  // iff C & (C2-1) == 0
  // C2 is a power of 2
  if (Pred == ICmpInst::ICMP_ULT && C.isPowerOf2() && (*C2 & (C - 1)) == 0)
    // NOTE(review): the "return new ICmpInst(ICmpInst::ICMP_EQ, ..." line was
    // elided in this extraction — confirm against upstream.
                        ConstantExpr::getNeg(cast<Constant>(Y)));

  // X+C2 <u C -> (X & C) == 2C
  // iff C == -(C2)
  // C2 is a power of 2
  if (Pred == ICmpInst::ICMP_ULT && C2->isPowerOf2() && C == -*C2)
    // NOTE(review): the "return new ICmpInst(ICmpInst::ICMP_EQ, ..." line was
    // elided in this extraction — confirm against upstream.
                        ConstantInt::get(Ty, C * 2));

  // X+C >u C2 -> (X & ~C2) != C
  // iff C & C2 == 0
  // C2+1 is a power of 2
  if (Pred == ICmpInst::ICMP_UGT && (C + 1).isPowerOf2() && (*C2 & C) == 0)
    // NOTE(review): the "return new ICmpInst(ICmpInst::ICMP_NE, ..." line was
    // elided in this extraction — confirm against upstream.
                        ConstantExpr::getNeg(cast<Constant>(Y)));

  // The range test idiom can use either ult or ugt. Arbitrarily canonicalize
  // to the ult form.
  // X+C2 >u C -> X+(C2-C-1) <u ~C
  if (Pred == ICmpInst::ICMP_UGT)
    return new ICmpInst(ICmpInst::ICMP_ULT,
                        Builder.CreateAdd(X, ConstantInt::get(Ty, *C2 - C - 1)),
                        ConstantInt::get(Ty, ~C));

  // zext(V) + C2 pred C -> V + C3 pred' C4
  // Narrow the compare to the zext source type when profitable, using an
  // equivalent icmp derived from the (truncated) constant range.
  Value *V;
  if (match(X, m_ZExt(m_Value(V)))) {
    Type *NewCmpTy = V->getType();
    unsigned NewCmpBW = NewCmpTy->getScalarSizeInBits();
    if (shouldChangeType(Ty, NewCmpTy)) {
      ConstantRange SrcCR = CR.truncate(NewCmpBW, TruncInst::NoUnsignedWrap);
      CmpInst::Predicate EquivPred;
      APInt EquivInt;
      APInt EquivOffset;

      SrcCR.getEquivalentICmp(EquivPred, EquivInt, EquivOffset);
      return new ICmpInst(
          EquivPred,
          EquivOffset.isZero()
              ? V
              : Builder.CreateAdd(V, ConstantInt::get(NewCmpTy, EquivOffset)),
          ConstantInt::get(NewCmpTy, EquivInt));
    }
  }

  return nullptr;
}
3340
// Matches the canonical three-way integer compare idiom:
//   select (a == b), Equal, (select (a slt b), Less, Greater)
// binding the compared values into LHS/RHS and the three constant results into
// Less/Equal/Greater, after canonicalizing predicate direction and strictness.
// Returns true only when the inner compare canonicalizes to (LHS slt RHS).
// NOTE(review): the opening signature line of this function (its name and the
// select-instruction parameter `SI`, original line 3341) was dropped by the
// page extraction — confirm against the upstream file.
3342 Value *&RHS, ConstantInt *&Less,
3343 ConstantInt *&Equal,
3344 ConstantInt *&Greater) {
3345 // TODO: Generalize this to work with other comparison idioms or ensure
3346 // they get canonicalized into this form.
3347 
3348 // select i1 (a == b),
3349 // i32 Equal,
3350 // i32 (select i1 (a < b), i32 Less, i32 Greater)
3351 // where Equal, Less and Greater are placeholders for any three constants.
// The outer select condition must be an equality compare; its operands define
// LHS/RHS for the whole idiom.
3352 CmpPredicate PredA;
3353 if (!match(SI->getCondition(), m_ICmp(PredA, m_Value(LHS), m_Value(RHS))) ||
3354 !ICmpInst::isEquality(PredA))
3355 return false;
3356 Value *EqualVal = SI->getTrueValue();
3357 Value *UnequalVal = SI->getFalseValue();
3358 // We still can get non-canonical predicate here, so canonicalize.
3359 if (PredA == ICmpInst::ICMP_NE)
3360 std::swap(EqualVal, UnequalVal);
3361 if (!match(EqualVal, m_ConstantInt(Equal)))
3362 return false;
3363 CmpPredicate PredB;
3364 Value *LHS2, *RHS2;
// The "unequal" arm must itself be a select on a second compare of the same
// operands, yielding the Less/Greater constants.
3365 if (!match(UnequalVal, m_Select(m_ICmp(PredB, m_Value(LHS2), m_Value(RHS2)),
3366 m_ConstantInt(Less), m_ConstantInt(Greater))))
3367 return false;
3368 // We can get predicate mismatch here, so canonicalize if possible:
3369 // First, ensure that 'LHS' match.
3370 if (LHS2 != LHS) {
3371 // x sgt y <--> y slt x
3372 std::swap(LHS2, RHS2);
3373 PredB = ICmpInst::getSwappedPredicate(PredB);
3374 }
3375 if (LHS2 != LHS)
3376 return false;
3377 // We also need to canonicalize 'RHS'.
3378 if (PredB == ICmpInst::ICMP_SGT && isa<Constant>(RHS2)) {
3379 // x sgt C-1 <--> x sge C <--> not(x slt C)
3380 auto FlippedStrictness =
3381 getFlippedStrictnessPredicateAndConstant(PredB, cast<Constant>(RHS2));
3382 if (!FlippedStrictness)
3383 return false;
3384 assert(FlippedStrictness->first == ICmpInst::ICMP_SGE &&
3385 "basic correctness failure");
3386 RHS2 = FlippedStrictness->second;
// sge with swapped arms is equivalent to slt with Less/Greater exchanged.
3387 // And kind-of perform the result swap.
3388 std::swap(Less, Greater);
3389 PredB = ICmpInst::ICMP_SLT;
3390 }
3391 return PredB == ICmpInst::ICMP_SLT && RHS == RHS2;
3392 }
3393
// Folds `icmp Pred (three-way-compare select), C` by evaluating the predicate
// against each of the three constant outcomes and OR-ing together the
// corresponding original comparisons (slt / eq / sgt of the original operands).
// NOTE(review): the signature lines (original 3394-3395, function name plus
// the ICmpInst and SelectInst parameters) are missing from this excerpt.
3396 ConstantInt *C) {
3397 
3398 assert(C && "Cmp RHS should be a constant int!");
3399 // If we're testing a constant value against the result of a three way
3400 // comparison, the result can be expressed directly in terms of the
3401 // original values being compared. Note: We could possibly be more
3402 // aggressive here and remove the hasOneUse test. The original select is
3403 // really likely to simplify or sink when we remove a test of the result.
3404 Value *OrigLHS, *OrigRHS;
3405 ConstantInt *C1LessThan, *C2Equal, *C3GreaterThan;
3406 if (Cmp.hasOneUse() &&
3407 matchThreeWayIntCompare(Select, OrigLHS, OrigRHS, C1LessThan, C2Equal,
3408 C3GreaterThan)) {
3409 assert(C1LessThan && C2Equal && C3GreaterThan);
3410 
// Evaluate `outcome Pred C` at compile time for each of the three constants.
3411 bool TrueWhenLessThan = ICmpInst::compare(
3412 C1LessThan->getValue(), C->getValue(), Cmp.getPredicate());
3413 bool TrueWhenEqual = ICmpInst::compare(C2Equal->getValue(), C->getValue(),
3414 Cmp.getPredicate());
3415 bool TrueWhenGreaterThan = ICmpInst::compare(
3416 C3GreaterThan->getValue(), C->getValue(), Cmp.getPredicate());
3417 
3418 // This generates the new instruction that will replace the original Cmp
3419 // Instruction. Instead of enumerating the various combinations when
3420 // TrueWhenLessThan, TrueWhenEqual and TrueWhenGreaterThan are true versus
3421 // false, we rely on chaining of ORs and future passes of InstCombine to
3422 // simplify the OR further (i.e. a s< b || a == b becomes a s<= b).
3423 
3424 // When none of the three constants satisfy the predicate for the RHS (C),
3425 // the entire original Cmp can be simplified to a false.
// NOTE(review): the declaration/initialization of `Cond` and the
// `Cond = Builder.CreateOr(` wrappers (original lines 3426, 3428, 3431 and
// 3434) were dropped by the extraction; only the call arguments survive below.
3427 if (TrueWhenLessThan)
3429 Cond, Builder.CreateICmp(ICmpInst::ICMP_SLT, OrigLHS, OrigRHS));
3430 if (TrueWhenEqual)
3432 Cond, Builder.CreateICmp(ICmpInst::ICMP_EQ, OrigLHS, OrigRHS));
3433 if (TrueWhenGreaterThan)
3435 Cond, Builder.CreateICmp(ICmpInst::ICMP_SGT, OrigLHS, OrigRHS));
3436 
3437 return replaceInstUsesWith(Cmp, Cond);
3438 }
3439 return nullptr;
3440 }
3441
// Folds icmp instructions whose LHS is a bitcast: sign-bit / zero-equality
// tests through sitofp/uitofp/fpext/fptrunc, fp-class equality tests,
// all-ones / all-zero vector reductions, and splat-shuffle extractions.
// NOTE(review): the function signature line (original 3442) is missing from
// this excerpt; the body below starts at its first statement.
3443 auto *Bitcast = dyn_cast<BitCastInst>(Cmp.getOperand(0));
3444 if (!Bitcast)
3445 return nullptr;
3446 
3447 ICmpInst::Predicate Pred = Cmp.getPredicate();
3448 Value *Op1 = Cmp.getOperand(1);
3449 Value *BCSrcOp = Bitcast->getOperand(0);
3450 Type *SrcType = Bitcast->getSrcTy();
3451 Type *DstType = Bitcast->getType();
3452 
3453 // Make sure the bitcast doesn't change between scalar and vector and
3454 // doesn't change the number of vector elements.
3455 if (SrcType->isVectorTy() == DstType->isVectorTy() &&
3456 SrcType->getScalarSizeInBits() == DstType->getScalarSizeInBits()) {
3457 // Zero-equality and sign-bit checks are preserved through sitofp + bitcast.
3458 Value *X;
3459 if (match(BCSrcOp, m_SIToFP(m_Value(X)))) {
3460 // icmp eq (bitcast (sitofp X)), 0 --> icmp eq X, 0
3461 // icmp ne (bitcast (sitofp X)), 0 --> icmp ne X, 0
3462 // icmp slt (bitcast (sitofp X)), 0 --> icmp slt X, 0
3463 // icmp sgt (bitcast (sitofp X)), 0 --> icmp sgt X, 0
3464 if ((Pred == ICmpInst::ICMP_EQ || Pred == ICmpInst::ICMP_SLT ||
3465 Pred == ICmpInst::ICMP_NE || Pred == ICmpInst::ICMP_SGT) &&
3466 match(Op1, m_Zero()))
3467 return new ICmpInst(Pred, X, ConstantInt::getNullValue(X->getType()));
3468 
3469 // icmp slt (bitcast (sitofp X)), 1 --> icmp slt X, 1
3470 if (Pred == ICmpInst::ICMP_SLT && match(Op1, m_One()))
3471 return new ICmpInst(Pred, X, ConstantInt::get(X->getType(), 1));
3472 
3473 // icmp sgt (bitcast (sitofp X)), -1 --> icmp sgt X, -1
3474 if (Pred == ICmpInst::ICMP_SGT && match(Op1, m_AllOnes()))
3475 return new ICmpInst(Pred, X,
3476 ConstantInt::getAllOnesValue(X->getType()));
3477 }
3478 
3479 // Zero-equality checks are preserved through unsigned floating-point casts:
3480 // icmp eq (bitcast (uitofp X)), 0 --> icmp eq X, 0
3481 // icmp ne (bitcast (uitofp X)), 0 --> icmp ne X, 0
3482 if (match(BCSrcOp, m_UIToFP(m_Value(X))))
3483 if (Cmp.isEquality() && match(Op1, m_Zero()))
3484 return new ICmpInst(Pred, X, ConstantInt::getNullValue(X->getType()));
3485 
3486 const APInt *C;
3487 bool TrueIfSigned;
3488 if (match(Op1, m_APInt(C)) && Bitcast->hasOneUse()) {
3489 // If this is a sign-bit test of a bitcast of a casted FP value, eliminate
3490 // the FP extend/truncate because that cast does not change the sign-bit.
3491 // This is true for all standard IEEE-754 types and the X86 80-bit type.
3492 // The sign-bit is always the most significant bit in those types.
3493 if (isSignBitCheck(Pred, *C, TrueIfSigned) &&
3494 (match(BCSrcOp, m_FPExt(m_Value(X))) ||
3495 match(BCSrcOp, m_FPTrunc(m_Value(X))))) {
3496 // (bitcast (fpext/fptrunc X)) to iX) < 0 --> (bitcast X to iY) < 0
3497 // (bitcast (fpext/fptrunc X)) to iX) > -1 --> (bitcast X to iY) > -1
3498 Type *XType = X->getType();
3499 
3500 // We can't currently handle Power style floating point operations here.
3501 if (!(XType->isPPC_FP128Ty() || SrcType->isPPC_FP128Ty())) {
3502 Type *NewType = Builder.getIntNTy(XType->getScalarSizeInBits());
3503 if (auto *XVTy = dyn_cast<VectorType>(XType))
3504 NewType = VectorType::get(NewType, XVTy->getElementCount());
3505 Value *NewBitcast = Builder.CreateBitCast(X, NewType);
3506 if (TrueIfSigned)
3507 return new ICmpInst(ICmpInst::ICMP_SLT, NewBitcast,
3508 ConstantInt::getNullValue(NewType));
3509 else
3510 return new ICmpInst(ICmpInst::ICMP_SGT, NewBitcast,
// NOTE(review): the second constructor argument (original line 3511,
// presumably the all-ones constant for the SGT -1 form) was dropped by the
// extraction.
3512 }
3513 }
3514 
3515 // icmp eq/ne (bitcast X to int), special fp -> llvm.is.fpclass(X, class)
3516 Type *FPType = SrcType->getScalarType();
3517 if (!Cmp.getParent()->getParent()->hasFnAttribute(
3518 Attribute::NoImplicitFloat) &&
3519 Cmp.isEquality() && FPType->isIEEELikeFPTy()) {
// Classify the bit pattern C as an FP value; only inf/zero classes can be
// matched exactly by a single-value integer equality, so limit to those.
3520 FPClassTest Mask = APFloat(FPType->getFltSemantics(), *C).classify();
3521 if (Mask & (fcInf | fcZero)) {
3522 if (Pred == ICmpInst::ICMP_NE)
3523 Mask = ~Mask;
3524 return replaceInstUsesWith(Cmp,
3525 Builder.createIsFPClass(BCSrcOp, Mask));
3526 }
3527 }
3528 }
3529 }
3530 
// Remaining folds require an integer destination and int(-vector) source.
3531 const APInt *C;
3532 if (!match(Cmp.getOperand(1), m_APInt(C)) || !DstType->isIntegerTy() ||
3533 !SrcType->isIntOrIntVectorTy())
3534 return nullptr;
3535 
3536 // If this is checking if all elements of a vector compare are set or not,
3537 // invert the casted vector equality compare and test if all compare
3538 // elements are clear or not. Compare against zero is generally easier for
3539 // analysis and codegen.
3540 // icmp eq/ne (bitcast (not X) to iN), -1 --> icmp eq/ne (bitcast X to iN), 0
3541 // Example: are all elements equal? --> are zero elements not equal?
3542 // TODO: Try harder to reduce compare of 2 freely invertible operands?
3543 if (Cmp.isEquality() && C->isAllOnes() && Bitcast->hasOneUse()) {
3544 if (Value *NotBCSrcOp =
3545 getFreelyInverted(BCSrcOp, BCSrcOp->hasOneUse(), &Builder)) {
3546 Value *Cast = Builder.CreateBitCast(NotBCSrcOp, DstType);
3547 return new ICmpInst(Pred, Cast, ConstantInt::getNullValue(DstType));
3548 }
3549 }
3550 
3551 // If this is checking if all elements of an extended vector are clear or not,
3552 // compare in a narrow type to eliminate the extend:
3553 // icmp eq/ne (bitcast (ext X) to iN), 0 --> icmp eq/ne (bitcast X to iM), 0
3554 Value *X;
3555 if (Cmp.isEquality() && C->isZero() && Bitcast->hasOneUse() &&
3556 match(BCSrcOp, m_ZExtOrSExt(m_Value(X)))) {
3557 if (auto *VecTy = dyn_cast<FixedVectorType>(X->getType())) {
3558 Type *NewType = Builder.getIntNTy(VecTy->getPrimitiveSizeInBits());
3559 Value *NewCast = Builder.CreateBitCast(X, NewType);
3560 return new ICmpInst(Pred, NewCast, ConstantInt::getNullValue(NewType));
3561 }
3562 }
3563 
3564 // Folding: icmp <pred> iN X, C
3565 // where X = bitcast <M x iK> (shufflevector <M x iK> %vec, undef, SC)) to iN
3566 // and C is a splat of a K-bit pattern
3567 // and SC is a constant vector = <C', C', C', ..., C'>
3568 // Into:
3569 // %E = extractelement <M x iK> %vec, i32 C'
3570 // icmp <pred> iK %E, trunc(C)
3571 Value *Vec;
3572 ArrayRef<int> Mask;
3573 if (match(BCSrcOp, m_Shuffle(m_Value(Vec), m_Undef(), m_Mask(Mask)))) {
3574 // Check whether every element of Mask is the same constant
3575 if (all_equal(Mask)) {
3576 auto *VecTy = cast<VectorType>(SrcType);
3577 auto *EltTy = cast<IntegerType>(VecTy->getElementType());
3578 if (C->isSplat(EltTy->getBitWidth())) {
3579 // Fold the icmp based on the value of C
3580 // If C is M copies of an iK sized bit pattern,
3581 // then:
3582 // => %E = extractelement <N x iK> %vec, i32 Elem
3583 // icmp <pred> iK %SplatVal, <pattern>
3584 Value *Elem = Builder.getInt32(Mask[0]);
3585 Value *Extract = Builder.CreateExtractElement(Vec, Elem);
3586 Value *NewC = ConstantInt::get(EltTy, C->trunc(EltTy->getBitWidth()));
3587 return new ICmpInst(Pred, Extract, NewC);
3588 }
3589 }
3590 }
3591 return nullptr;
3592 }
3593
3594 /// Try to fold integer comparisons with a constant operand: icmp Pred X, C
3595 /// where X is some kind of instruction.
// Dispatcher: tries the binop / select / trunc / intrinsic constant folds in
// turn, then the subo-extractvalue equality fold, then the allow-poison path.
// NOTE(review): the function signature line (original 3596) is missing from
// this excerpt.
3597 const APInt *C;
3598 
3599 if (match(Cmp.getOperand(1), m_APInt(C))) {
3600 if (auto *BO = dyn_cast<BinaryOperator>(Cmp.getOperand(0)))
3601 if (Instruction *I = foldICmpBinOpWithConstant(Cmp, BO, *C))
3602 return I;
3603 
3604 if (auto *SI = dyn_cast<SelectInst>(Cmp.getOperand(0)))
3605 // For now, we only support constant integers while folding the
3606 // ICMP(SELECT)) pattern. We can extend this to support vector of integers
3607 // similar to the cases handled by binary ops above.
3608 if (auto *ConstRHS = dyn_cast<ConstantInt>(Cmp.getOperand(1)))
3609 if (Instruction *I = foldICmpSelectConstant(Cmp, SI, ConstRHS))
3610 return I;
3611 
3612 if (auto *TI = dyn_cast<TruncInst>(Cmp.getOperand(0)))
3613 if (Instruction *I = foldICmpTruncConstant(Cmp, TI, *C))
3614 return I;
3615 
3616 if (auto *II = dyn_cast<IntrinsicInst>(Cmp.getOperand(0)))
// NOTE(review): the nested fold call under this dyn_cast (original line 3617,
// presumably the intrinsic-with-constant fold) was dropped by the extraction.
3618 return I;
3619 
3620 // (extractval ([s/u]subo X, Y), 0) == 0 --> X == Y
3621 // (extractval ([s/u]subo X, Y), 0) != 0 --> X != Y
3622 // TODO: This checks one-use, but that is not strictly necessary.
3623 Value *Cmp0 = Cmp.getOperand(0);
3624 Value *X, *Y;
3625 if (C->isZero() && Cmp.isEquality() && Cmp0->hasOneUse() &&
3626 (match(Cmp0,
3627 m_ExtractValue<0>(m_Intrinsic<Intrinsic::ssub_with_overflow>(
3628 m_Value(X), m_Value(Y)))) ||
3629 match(Cmp0,
3630 m_ExtractValue<0>(m_Intrinsic<Intrinsic::usub_with_overflow>(
3631 m_Value(X), m_Value(Y))))))
3632 return new ICmpInst(Cmp.getPredicate(), X, Y);
3633 }
3634 
3635 if (match(Cmp.getOperand(1), m_APIntAllowPoison(C)))
// NOTE(review): the returned call on this path (original line 3636, presumably
// the allow-poison fold) was dropped by the extraction.
3637 
3638 return nullptr;
3639 }
3640
3641 /// Fold an icmp equality instruction with binary operator LHS and constant RHS:
3642 /// icmp eq/ne BO, C.
// Handles srem/add/xor/or/udiv/sdiv opcodes; each case rewrites the equality
// in terms of the binop's operands when the constant allows it.
// NOTE(review): the first signature line (original 3643, function name) is
// missing from this excerpt.
3644 ICmpInst &Cmp, BinaryOperator *BO, const APInt &C) {
3645 // TODO: Some of these folds could work with arbitrary constants, but this
3646 // function is limited to scalar and vector splat constants.
3647 if (!Cmp.isEquality())
3648 return nullptr;
3649 
3650 ICmpInst::Predicate Pred = Cmp.getPredicate();
3651 bool isICMP_NE = Pred == ICmpInst::ICMP_NE;
3652 Constant *RHS = cast<Constant>(Cmp.getOperand(1));
3653 Value *BOp0 = BO->getOperand(0), *BOp1 = BO->getOperand(1);
3654 
3655 switch (BO->getOpcode()) {
3656 case Instruction::SRem:
3657 // If we have a signed (X % (2^c)) == 0, turn it into an unsigned one.
3658 if (C.isZero() && BO->hasOneUse()) {
3659 const APInt *BOC;
3660 if (match(BOp1, m_APInt(BOC)) && BOC->sgt(1) && BOC->isPowerOf2()) {
3661 Value *NewRem = Builder.CreateURem(BOp0, BOp1, BO->getName());
3662 return new ICmpInst(Pred, NewRem,
// NOTE(review): the second constructor argument (original line 3663,
// presumably the zero constant) was dropped by the extraction.
3664 }
3665 }
3666 break;
3667 case Instruction::Add: {
3668 // (A + C2) == C --> A == (C - C2)
3669 // (A + C2) != C --> A != (C - C2)
3670 // TODO: Remove the one-use limitation? See discussion in D58633.
3671 if (Constant *C2 = dyn_cast<Constant>(BOp1)) {
3672 if (BO->hasOneUse())
3673 return new ICmpInst(Pred, BOp0, ConstantExpr::getSub(RHS, C2));
3674 } else if (C.isZero()) {
3675 // Replace ((add A, B) != 0) with (A != -B) if A or B is
3676 // efficiently invertible, or if the add has just this one use.
3677 if (Value *NegVal = dyn_castNegVal(BOp1))
3678 return new ICmpInst(Pred, BOp0, NegVal);
3679 if (Value *NegVal = dyn_castNegVal(BOp0))
3680 return new ICmpInst(Pred, NegVal, BOp1);
3681 if (BO->hasOneUse()) {
3682 // (add nuw A, B) != 0 -> (or A, B) != 0
3683 if (match(BO, m_NUWAdd(m_Value(), m_Value()))) {
3684 Value *Or = Builder.CreateOr(BOp0, BOp1);
3685 return new ICmpInst(Pred, Or, Constant::getNullValue(BO->getType()));
3686 }
3687 Value *Neg = Builder.CreateNeg(BOp1);
3688 Neg->takeName(BO);
3689 return new ICmpInst(Pred, BOp0, Neg);
3690 }
3691 }
3692 break;
3693 }
3694 case Instruction::Xor:
3695 if (Constant *BOC = dyn_cast<Constant>(BOp1)) {
3696 // For the xor case, we can xor two constants together, eliminating
3697 // the explicit xor.
3698 return new ICmpInst(Pred, BOp0, ConstantExpr::getXor(RHS, BOC));
3699 } else if (C.isZero()) {
3700 // Replace ((xor A, B) != 0) with (A != B)
3701 return new ICmpInst(Pred, BOp0, BOp1);
3702 }
3703 break;
3704 case Instruction::Or: {
3705 const APInt *BOC;
3706 if (match(BOp1, m_APInt(BOC)) && BO->hasOneUse() && RHS->isAllOnesValue()) {
3707 // Comparing if all bits outside of a constant mask are set?
3708 // Replace (X | C) == -1 with (X & ~C) == ~C.
3709 // This removes the -1 constant.
3710 Constant *NotBOC = ConstantExpr::getNot(cast<Constant>(BOp1));
3711 Value *And = Builder.CreateAnd(BOp0, NotBOC);
3712 return new ICmpInst(Pred, And, NotBOC);
3713 }
3714 // (icmp eq (or (select cond, 0, NonZero), Other), 0)
3715 // -> (and cond, (icmp eq Other, 0))
3716 // (icmp ne (or (select cond, NonZero, 0), Other), 0)
3717 // -> (or cond, (icmp ne Other, 0))
3718 Value *Cond, *TV, *FV, *Other, *Sel;
3719 if (C.isZero() &&
3720 match(BO,
// NOTE(review): the interior of this match pattern (original lines 3721-3722,
// presumably m_c_Or of a captured m_Select(m_Value(Cond), m_Value(TV), ...))
// was dropped by the extraction.
3723 m_Value(FV))),
3724 m_Value(Other)))) &&
3725 Cond->getType() == Cmp.getType()) {
3726 const SimplifyQuery Q = SQ.getWithInstruction(&Cmp);
3727 // Easy case is if eq/ne matches whether 0 is trueval/falseval.
3728 if (Pred == ICmpInst::ICMP_EQ
3729 ? (match(TV, m_Zero()) && isKnownNonZero(FV, Q))
3730 : (match(FV, m_Zero()) && isKnownNonZero(TV, Q))) {
3731 Value *Cmp = Builder.CreateICmp(
3732 Pred, Other, Constant::getNullValue(Other->getType()));
// NOTE(review): the BinaryOperator::Create(...) head of this return (original
// line 3733) was dropped by the extraction.
3734 Pred == ICmpInst::ICMP_EQ ? Instruction::And : Instruction::Or, Cmp,
3735 Cond);
3736 }
3737 // Harder case is if eq/ne matches whether 0 is falseval/trueval. In this
3738 // case we need to invert the select condition so we need to be careful to
3739 // avoid creating extra instructions.
3740 // (icmp ne (or (select cond, 0, NonZero), Other), 0)
3741 // -> (or (not cond), (icmp ne Other, 0))
3742 // (icmp eq (or (select cond, NonZero, 0), Other), 0)
3743 // -> (and (not cond), (icmp eq Other, 0))
3744 //
3745 // Only do this if the inner select has one use, in which case we are
3746 // replacing `select` with `(not cond)`. Otherwise, we will create more
3747 // uses. NB: Trying to freely invert cond doesn't make sense here, as if
3748 // cond was freely invertable, the select arms would have been inverted.
3749 if (Sel->hasOneUse() &&
3750 (Pred == ICmpInst::ICMP_EQ
3751 ? (match(FV, m_Zero()) && isKnownNonZero(TV, Q))
3752 : (match(TV, m_Zero()) && isKnownNonZero(FV, Q)))) {
3753 Value *NotCond = Builder.CreateNot(Cond);
3754 Value *Cmp = Builder.CreateICmp(
3755 Pred, Other, Constant::getNullValue(Other->getType()));
// NOTE(review): the BinaryOperator::Create(...) head of this return (original
// line 3756) was dropped by the extraction.
3757 Pred == ICmpInst::ICMP_EQ ? Instruction::And : Instruction::Or, Cmp,
3758 NotCond);
3759 }
3760 }
3761 break;
3762 }
3763 case Instruction::UDiv:
3764 case Instruction::SDiv:
3765 if (BO->isExact()) {
3766 // div exact X, Y eq/ne 0 -> X eq/ne 0
3767 // div exact X, Y eq/ne 1 -> X eq/ne Y
3768 // div exact X, Y eq/ne C ->
3769 // if Y * C never-overflow && OneUse:
3770 // -> Y * C eq/ne X
3771 if (C.isZero())
3772 return new ICmpInst(Pred, BOp0, Constant::getNullValue(BO->getType()));
3773 else if (C.isOne())
3774 return new ICmpInst(Pred, BOp0, BOp1);
3775 else if (BO->hasOneUse()) {
// NOTE(review): the head of this overflow query (original line 3776) and the
// guard on its result (original line 3779) were dropped by the extraction.
3777 Instruction::Mul, BO->getOpcode() == Instruction::SDiv, BOp1,
3778 Cmp.getOperand(1), BO);
3780 Value *YC =
3781 Builder.CreateMul(BOp1, ConstantInt::get(BO->getType(), C));
3782 return new ICmpInst(Pred, YC, BOp0);
3783 }
3784 }
3785 }
3786 if (BO->getOpcode() == Instruction::UDiv && C.isZero()) {
3787 // (icmp eq/ne (udiv A, B), 0) -> (icmp ugt/ule i32 B, A)
3788 auto NewPred = isICMP_NE ? ICmpInst::ICMP_ULE : ICmpInst::ICMP_UGT;
3789 return new ICmpInst(NewPred, BOp1, BOp0);
3790 }
3791 break;
3792 default:
3793 break;
3794 }
3795 return nullptr;
3796 }
3797
// Folds power-of-two tests phrased via ctpop (ctpop(X) ==/!= 1, u< 2, u> 1)
// into a single mask compare when known-bits proves at least one bit of X is
// set: IsPow2 -> (X & ~KnownOne) == 0, NotPow2 -> (X & ~KnownOne) != 0.
// NOTE(review): the first signature line (original 3798, function name plus
// the ICmpInst and ctpop-intrinsic parameters) is missing from this excerpt.
3799 const APInt &CRhs,
3800 InstCombiner::BuilderTy &Builder,
3801 const SimplifyQuery &Q) {
3802 assert(CtpopLhs->getIntrinsicID() == Intrinsic::ctpop &&
3803 "Non-ctpop intrin in ctpop fold");
3804 if (!CtpopLhs->hasOneUse())
3805 return nullptr;
3806 
3807 // Power of 2 test:
3808 // isPow2OrZero : ctpop(X) u< 2
3809 // isPow2 : ctpop(X) == 1
3810 // NotPow2OrZero: ctpop(X) u> 1
3811 // NotPow2 : ctpop(X) != 1
3812 // If we know any bit of X can be folded to:
3813 // IsPow2 : X & (~Bit) == 0
3814 // NotPow2 : X & (~Bit) != 0
3815 const ICmpInst::Predicate Pred = I.getPredicate();
3816 if (((I.isEquality() || Pred == ICmpInst::ICMP_UGT) && CRhs == 1) ||
3817 (Pred == ICmpInst::ICMP_ULT && CRhs == 2)) {
3818 Value *Op = CtpopLhs->getArgOperand(0);
3819 KnownBits OpKnown = computeKnownBits(Op, Q.DL, Q.AC, Q.CxtI, Q.DT);
3820 // No need to check for count > 1, that should be already constant folded.
3821 if (OpKnown.countMinPopulation() == 1) {
3822 Value *And = Builder.CreateAnd(
3823 Op, Constant::getIntegerValue(Op->getType(), ~(OpKnown.One)));
3824 return new ICmpInst(
3825 (Pred == ICmpInst::ICMP_EQ || Pred == ICmpInst::ICMP_ULT)
// NOTE(review): the predicate-selection operands of this conditional
// (original lines 3826-3827) were dropped by the extraction.
3828 And, Constant::getNullValue(Op->getType()));
3829 }
3830 }
3831 
3832 return nullptr;
3833 }
3834
3835 /// Fold an equality icmp with LLVM intrinsic and constant operand.
// Per-intrinsic eq/ne folds: abs, bswap, bitreverse, ctlz/cttz, ctpop,
// fshl/fshr rotates, umax/uadd.sat, ssub.sat, usub.sat.
// NOTE(review): the first signature line (original 3836, function name) is
// missing from this excerpt.
3837 ICmpInst &Cmp, IntrinsicInst *II, const APInt &C) {
3838 Type *Ty = II->getType();
3839 unsigned BitWidth = C.getBitWidth();
3840 const ICmpInst::Predicate Pred = Cmp.getPredicate();
3841 
3842 switch (II->getIntrinsicID()) {
3843 case Intrinsic::abs:
3844 // abs(A) == 0 -> A == 0
3845 // abs(A) == INT_MIN -> A == INT_MIN
3846 if (C.isZero() || C.isMinSignedValue())
3847 return new ICmpInst(Pred, II->getArgOperand(0), ConstantInt::get(Ty, C));
3848 break;
3849 
3850 case Intrinsic::bswap:
3851 // bswap(A) == C -> A == bswap(C)
3852 return new ICmpInst(Pred, II->getArgOperand(0),
3853 ConstantInt::get(Ty, C.byteSwap()));
3854 
3855 case Intrinsic::bitreverse:
3856 // bitreverse(A) == C -> A == bitreverse(C)
3857 return new ICmpInst(Pred, II->getArgOperand(0),
3858 ConstantInt::get(Ty, C.reverseBits()));
3859 
3860 case Intrinsic::ctlz:
3861 case Intrinsic::cttz: {
3862 // ctz(A) == bitwidth(A) -> A == 0 and likewise for !=
3863 if (C == BitWidth)
3864 return new ICmpInst(Pred, II->getArgOperand(0),
// NOTE(review): the second constructor argument (original line 3865,
// presumably the zero constant) was dropped by the extraction.
3866 
3867 // ctz(A) == C -> A & Mask1 == Mask2, where Mask2 only has bit C set
3868 // and Mask1 has bits 0..C+1 set. Similar for ctl, but for high bits.
3869 // Limit to one use to ensure we don't increase instruction count.
3870 unsigned Num = C.getLimitedValue(BitWidth);
3871 if (Num != BitWidth && II->hasOneUse()) {
3872 bool IsTrailing = II->getIntrinsicID() == Intrinsic::cttz;
3873 APInt Mask1 = IsTrailing ? APInt::getLowBitsSet(BitWidth, Num + 1)
3874 : APInt::getHighBitsSet(BitWidth, Num + 1);
3875 APInt Mask2 = IsTrailing
// NOTE(review): the conditional operands computing Mask2 (original lines
// 3876-3877, presumably the single-bit constants) were dropped by the
// extraction.
3878 return new ICmpInst(Pred, Builder.CreateAnd(II->getArgOperand(0), Mask1),
3879 ConstantInt::get(Ty, Mask2));
3880 }
3881 break;
3882 }
3883 
3884 case Intrinsic::ctpop: {
3885 // popcount(A) == 0 -> A == 0 and likewise for !=
3886 // popcount(A) == bitwidth(A) -> A == -1 and likewise for !=
3887 bool IsZero = C.isZero();
3888 if (IsZero || C == BitWidth)
3889 return new ICmpInst(Pred, II->getArgOperand(0),
3890 IsZero ? Constant::getNullValue(Ty)
// NOTE(review): the all-ones alternative of this conditional (original line
// 3891) was dropped by the extraction.
3892 
3893 break;
3894 }
3895 
3896 case Intrinsic::fshl:
3897 case Intrinsic::fshr:
3898 if (II->getArgOperand(0) == II->getArgOperand(1)) {
3899 const APInt *RotAmtC;
3900 // ror(X, RotAmtC) == C --> X == rol(C, RotAmtC)
3901 // rol(X, RotAmtC) == C --> X == ror(C, RotAmtC)
3902 if (match(II->getArgOperand(2), m_APInt(RotAmtC)))
3903 return new ICmpInst(Pred, II->getArgOperand(0),
3904 II->getIntrinsicID() == Intrinsic::fshl
3905 ? ConstantInt::get(Ty, C.rotr(*RotAmtC))
3906 : ConstantInt::get(Ty, C.rotl(*RotAmtC)));
3907 }
3908 break;
3909 
3910 case Intrinsic::umax:
3911 case Intrinsic::uadd_sat: {
3912 // uadd.sat(a, b) == 0 -> (a | b) == 0
3913 // umax(a, b) == 0 -> (a | b) == 0
3914 if (C.isZero() && II->hasOneUse()) {
3915 Value *Or = Builder.CreateOr(II->getArgOperand(0), II->getArgOperand(1));
3916 return new ICmpInst(Pred, Or, Constant::getNullValue(Ty));
3917 }
3918 break;
3919 }
3920 
3921 case Intrinsic::ssub_sat:
3922 // ssub.sat(a, b) == 0 -> a == b
3923 if (C.isZero())
3924 return new ICmpInst(Pred, II->getArgOperand(0), II->getArgOperand(1));
3925 break;
3926 case Intrinsic::usub_sat: {
3927 // usub.sat(a, b) == 0 -> a <= b
3928 if (C.isZero()) {
3929 ICmpInst::Predicate NewPred =
// NOTE(review): the predicate-selection expression (original line 3930) was
// dropped by the extraction.
3931 return new ICmpInst(NewPred, II->getArgOperand(0), II->getArgOperand(1));
3932 }
3933 break;
3934 }
3935 default:
3936 break;
3937 }
3938 
3939 return nullptr;
3940 }
3941
3942 /// Fold an icmp with LLVM intrinsics
// Equality compare of two calls to the same intrinsic: strip matching
// bswap/bitreverse wrappers, or combine two rotates of the same value.
3943 static Instruction *
// NOTE(review): the first signature line (original 3944, function name plus
// the ICmpInst parameter) is missing from this excerpt.
3945 InstCombiner::BuilderTy &Builder) {
3946 assert(Cmp.isEquality());
3947 
3948 ICmpInst::Predicate Pred = Cmp.getPredicate();
3949 Value *Op0 = Cmp.getOperand(0);
3950 Value *Op1 = Cmp.getOperand(1);
3951 const auto *IIOp0 = dyn_cast<IntrinsicInst>(Op0);
3952 const auto *IIOp1 = dyn_cast<IntrinsicInst>(Op1);
3953 if (!IIOp0 || !IIOp1 || IIOp0->getIntrinsicID() != IIOp1->getIntrinsicID())
3954 return nullptr;
3955 
3956 switch (IIOp0->getIntrinsicID()) {
3957 case Intrinsic::bswap:
3958 case Intrinsic::bitreverse:
3959 // If both operands are byte-swapped or bit-reversed, just compare the
3960 // original values.
3961 return new ICmpInst(Pred, IIOp0->getOperand(0), IIOp1->getOperand(0));
3962 case Intrinsic::fshl:
3963 case Intrinsic::fshr: {
3964 // If both operands are rotated by same amount, just compare the
3965 // original values.
// fshl/fshr only act as rotates when both data operands are the same value.
3966 if (IIOp0->getOperand(0) != IIOp0->getOperand(1))
3967 break;
3968 if (IIOp1->getOperand(0) != IIOp1->getOperand(1))
3969 break;
3970 if (IIOp0->getOperand(2) == IIOp1->getOperand(2))
3971 return new ICmpInst(Pred, IIOp0->getOperand(0), IIOp1->getOperand(0));
3972 
3973 // rotate(X, AmtX) == rotate(Y, AmtY)
3974 // -> rotate(X, AmtX - AmtY) == Y
3975 // Do this if either both rotates have one use or if only one has one use
3976 // and AmtX/AmtY are constants.
3977 unsigned OneUses = IIOp0->hasOneUse() + IIOp1->hasOneUse();
3978 if (OneUses == 2 ||
3979 (OneUses == 1 && match(IIOp0->getOperand(2), m_ImmConstant()) &&
3980 match(IIOp1->getOperand(2), m_ImmConstant()))) {
3981 Value *SubAmt =
3982 Builder.CreateSub(IIOp0->getOperand(2), IIOp1->getOperand(2));
3983 Value *CombinedRotate = Builder.CreateIntrinsic(
3984 Op0->getType(), IIOp0->getIntrinsicID(),
3985 {IIOp0->getOperand(0), IIOp0->getOperand(0), SubAmt});
3986 return new ICmpInst(Pred, IIOp1->getOperand(0), CombinedRotate);
3987 }
3988 } break;
3989 default:
3990 break;
3991 }
3992 
3993 return nullptr;
3994 }
3995
3996 /// Try to fold integer comparisons with a constant operand: icmp Pred X, C
3997 /// where X is some kind of instruction and C is AllowPoison.
3998 /// TODO: Move more folds which allow poison to this function.
// Currently handles only rotate-by-any-amount of 0/-1, which is invariant
// under rotation.
// NOTE(review): the signature lines (original 3999-4000, function name and
// the ICmpInst parameter) are missing from this excerpt.
4001 const APInt &C) {
4002 const ICmpInst::Predicate Pred = Cmp.getPredicate();
4003 if (auto *II = dyn_cast<IntrinsicInst>(Cmp.getOperand(0))) {
4004 switch (II->getIntrinsicID()) {
4005 default:
4006 break;
4007 case Intrinsic::fshl:
4008 case Intrinsic::fshr:
4009 if (Cmp.isEquality() && II->getArgOperand(0) == II->getArgOperand(1)) {
4010 // (rot X, ?) == 0/-1 --> X == 0/-1
4011 if (C.isZero() || C.isAllOnes())
4012 return new ICmpInst(Pred, II->getArgOperand(0), Cmp.getOperand(1));
4013 }
4014 break;
4015 }
4016 }
4017 
4018 return nullptr;
4019 }
4020
4021 /// Fold an icmp with BinaryOp and constant operand: icmp Pred BO, C.
// Dispatch on the binop opcode to the per-opcode constant folds; note the
// deliberate UDiv -> SDiv fallthrough so udiv tries both fold sets.
// NOTE(review): the first signature line (original 4022, function name and
// the ICmpInst parameter) is missing from this excerpt.
4023 BinaryOperator *BO,
4024 const APInt &C) {
4025 switch (BO->getOpcode()) {
4026 case Instruction::Xor:
4027 if (Instruction *I = foldICmpXorConstant(Cmp, BO, C))
4028 return I;
4029 break;
4030 case Instruction::And:
4031 if (Instruction *I = foldICmpAndConstant(Cmp, BO, C))
4032 return I;
4033 break;
4034 case Instruction::Or:
4035 if (Instruction *I = foldICmpOrConstant(Cmp, BO, C))
4036 return I;
4037 break;
4038 case Instruction::Mul:
4039 if (Instruction *I = foldICmpMulConstant(Cmp, BO, C))
4040 return I;
4041 break;
4042 case Instruction::Shl:
4043 if (Instruction *I = foldICmpShlConstant(Cmp, BO, C))
4044 return I;
4045 break;
4046 case Instruction::LShr:
4047 case Instruction::AShr:
4048 if (Instruction *I = foldICmpShrConstant(Cmp, BO, C))
4049 return I;
4050 break;
4051 case Instruction::SRem:
4052 if (Instruction *I = foldICmpSRemConstant(Cmp, BO, C))
4053 return I;
4054 break;
4055 case Instruction::UDiv:
4056 if (Instruction *I = foldICmpUDivConstant(Cmp, BO, C))
4057 return I;
4058 [[fallthrough]];
4059 case Instruction::SDiv:
4060 if (Instruction *I = foldICmpDivConstant(Cmp, BO, C))
4061 return I;
4062 break;
4063 case Instruction::Sub:
4064 if (Instruction *I = foldICmpSubConstant(Cmp, BO, C))
4065 return I;
4066 break;
4067 case Instruction::Add:
4068 if (Instruction *I = foldICmpAddConstant(Cmp, BO, C))
4069 return I;
4070 break;
4071 default:
4072 break;
4073 }
4074 
4075 // TODO: These folds could be refactored to be part of the above calls.
// NOTE(review): the guarded call on this line (original line 4076, presumably
// the equality-specific binop fold) was dropped by the extraction.
4077 return I;
4078 
4079 // Fall back to handling `icmp pred (select A ? C1 : C2) binop (select B ? C3
4080 // : C4), C5` pattern, by computing a truth table of the four constant
4081 // variants.
// NOTE(review): the final return expression (original line 4082) was dropped
// by the extraction.
4083 }
4084
// Folds `icmp Pred (uadd.sat/usub.sat X, C1), C2` by modeling the saturating
// op as (WillWrap ? SatVal : X binop C1), deriving the constant ranges for
// each arm, and combining them into a single equivalent icmp (with offset).
4085 static Instruction *
// NOTE(review): the first signature line (original 4086, function name plus
// the predicate and SaturatingInst parameters) is missing from this excerpt.
4087 const APInt &C,
4088 InstCombiner::BuilderTy &Builder) {
4089 // This transform may end up producing more than one instruction for the
4090 // intrinsic, so limit it to one user of the intrinsic.
4091 if (!II->hasOneUse())
4092 return nullptr;
4093 
4094 // Let Y = [add/sub]_sat(X, C) pred C2
4095 // SatVal = The saturating value for the operation
4096 // WillWrap = Whether or not the operation will underflow / overflow
4097 // => Y = (WillWrap ? SatVal : (X binop C)) pred C2
4098 // => Y = WillWrap ? (SatVal pred C2) : ((X binop C) pred C2)
4099 //
4100 // When (SatVal pred C2) is true, then
4101 // Y = WillWrap ? true : ((X binop C) pred C2)
4102 // => Y = WillWrap || ((X binop C) pred C2)
4103 // else
4104 // Y = WillWrap ? false : ((X binop C) pred C2)
4105 // => Y = !WillWrap ? ((X binop C) pred C2) : false
4106 // => Y = !WillWrap && ((X binop C) pred C2)
4107 Value *Op0 = II->getOperand(0);
4108 Value *Op1 = II->getOperand(1);
4109 
4110 const APInt *COp1;
4111 // This transform only works when the intrinsic has an integral constant or
4112 // splat vector as the second operand.
4113 if (!match(Op1, m_APInt(COp1)))
4114 return nullptr;
4115 
4116 APInt SatVal;
4117 switch (II->getIntrinsicID()) {
4118 default:
// NOTE(review): the llvm_unreachable(...) head of this diagnostic (original
// line 4119) was dropped by the extraction.
4120 "This function only works with usub_sat and uadd_sat for now!");
4121 case Intrinsic::uadd_sat:
4122 SatVal = APInt::getAllOnes(C.getBitWidth());
4123 break;
4124 case Intrinsic::usub_sat:
4125 SatVal = APInt::getZero(C.getBitWidth());
4126 break;
4127 }
4128 
4129 // Check (SatVal pred C2)
4130 bool SatValCheck = ICmpInst::compare(SatVal, C, Pred);
4131 
4132 // !WillWrap.
// NOTE(review): the ConstantRange declaration heading this no-wrap-region
// query (original line 4133) was dropped by the extraction.
4134 II->getBinaryOp(), *COp1, II->getNoWrapKind());
4135 
4136 // WillWrap.
4137 if (SatValCheck)
4138 C1 = C1.inverse();
4139 
// NOTE(review): the ConstantRange declaration for C2 (original line 4140) was
// dropped by the extraction.
4141 if (II->getBinaryOp() == Instruction::Add)
4142 C2 = C2.sub(*COp1);
4143 else
4144 C2 = C2.add(*COp1);
4145 
4146 Instruction::BinaryOps CombiningOp =
4147 SatValCheck ? Instruction::BinaryOps::Or : Instruction::BinaryOps::And;
4148 
4149 std::optional<ConstantRange> Combination;
4150 if (CombiningOp == Instruction::BinaryOps::Or)
4151 Combination = C1.exactUnionWith(C2);
4152 else /* CombiningOp == Instruction::BinaryOps::And */
4153 Combination = C1.exactIntersectWith(C2);
4154 
4155 if (!Combination)
4156 return nullptr;
4157 
4158 CmpInst::Predicate EquivPred;
4159 APInt EquivInt;
4160 APInt EquivOffset;
4161 
4162 Combination->getEquivalentICmp(EquivPred, EquivInt, EquivOffset);
4163 
4164 return new ICmpInst(
4165 EquivPred,
4166 Builder.CreateAdd(Op0, ConstantInt::get(Op1->getType(), EquivOffset)),
4167 ConstantInt::get(Op1->getType(), EquivInt));
4168 }
4169
// Folds `icmp Pred (scmp/ucmp L, R), C` — since the cmp intrinsic yields only
// -1/0/1, each comparison against C maps directly to a predicate on (L, R);
// the unsigned predicate is signed-adjusted for scmp at the end.
4170 static Instruction *
// NOTE(review): the first signature line (original 4171, function name plus
// the predicate and intrinsic parameters) is missing from this excerpt.
4172 const APInt &C,
4173 InstCombiner::BuilderTy &Builder) {
4174 std::optional<ICmpInst::Predicate> NewPredicate = std::nullopt;
4175 switch (Pred) {
4176 case ICmpInst::ICMP_EQ:
4177 case ICmpInst::ICMP_NE:
4178 if (C.isZero())
4179 NewPredicate = Pred;
4180 else if (C.isOne())
4181 NewPredicate =
// NOTE(review): the conditional expression choosing the predicate (original
// line 4182) was dropped by the extraction.
4183 else if (C.isAllOnes())
4184 NewPredicate =
// NOTE(review): the conditional expression choosing the predicate (original
// line 4185) was dropped by the extraction.
4186 break;
4187 
4188 case ICmpInst::ICMP_SGT:
4189 if (C.isAllOnes())
4190 NewPredicate = ICmpInst::ICMP_UGE;
4191 else if (C.isZero())
4192 NewPredicate = ICmpInst::ICMP_UGT;
4193 break;
4194 
4195 case ICmpInst::ICMP_SLT:
4196 if (C.isZero())
4197 NewPredicate = ICmpInst::ICMP_ULT;
4198 else if (C.isOne())
4199 NewPredicate = ICmpInst::ICMP_ULE;
4200 break;
4201 
4202 case ICmpInst::ICMP_ULT:
4203 if (C.ugt(1))
4204 NewPredicate = ICmpInst::ICMP_UGE;
4205 break;
4206 
4207 case ICmpInst::ICMP_UGT:
4208 if (!C.isZero() && !C.isAllOnes())
4209 NewPredicate = ICmpInst::ICMP_ULT;
4210 break;
4211 
4212 default:
4213 break;
4214 }
4215 
4216 if (!NewPredicate)
4217 return nullptr;
4218 
4219 if (I->getIntrinsicID() == Intrinsic::scmp)
4220 NewPredicate = ICmpInst::getSignedPredicate(*NewPredicate);
4221 Value *LHS = I->getOperand(0);
4222 Value *RHS = I->getOperand(1);
4223 return new ICmpInst(*NewPredicate, LHS, RHS);
4224 }
4225
4226/// Fold an icmp with LLVM intrinsic and constant operand: icmp Pred II, C.
4229 const APInt &C) {
4230 ICmpInst::Predicate Pred = Cmp.getPredicate();
4231
4232 // Handle folds that apply for any kind of icmp.
4233 switch (II->getIntrinsicID()) {
4234 default:
4235 break;
4236 case Intrinsic::uadd_sat:
4237 case Intrinsic::usub_sat:
4238 if (auto *Folded = foldICmpUSubSatOrUAddSatWithConstant(
4239 Pred, cast<SaturatingInst>(II), C, Builder))
4240 return Folded;
4241 break;
4242 case Intrinsic::ctpop: {
4243 const SimplifyQuery Q = SQ.getWithInstruction(&Cmp);
4244 if (Instruction *R = foldCtpopPow2Test(Cmp, II, C, Builder, Q))
4245 return R;
4246 } break;
4247 case Intrinsic::scmp:
4248 case Intrinsic::ucmp:
4249 if (auto *Folded = foldICmpOfCmpIntrinsicWithConstant(Pred, II, C, Builder))
4250 return Folded;
4251 break;
4252 }
4253
4254 if (Cmp.isEquality())
4255 return foldICmpEqIntrinsicWithConstant(Cmp, II, C);
4256
4257 Type *Ty = II->getType();
4258 unsigned BitWidth = C.getBitWidth();
4259 switch (II->getIntrinsicID()) {
4260 case Intrinsic::ctpop: {
4261 // (ctpop X > BitWidth - 1) --> X == -1
4262 Value *X = II->getArgOperand(0);
4263 if (C == BitWidth - 1 && Pred == ICmpInst::ICMP_UGT)
4264 return CmpInst::Create(Instruction::ICmp, ICmpInst::ICMP_EQ, X,
4266 // (ctpop X < BitWidth) --> X != -1
4267 if (C == BitWidth && Pred == ICmpInst::ICMP_ULT)
4268 return CmpInst::Create(Instruction::ICmp, ICmpInst::ICMP_NE, X,
4270 break;
4271 }
4272 case Intrinsic::ctlz: {
4273 // ctlz(0bXXXXXXXX) > 3 -> 0bXXXXXXXX < 0b00010000
4274 if (Pred == ICmpInst::ICMP_UGT && C.ult(BitWidth)) {
4275 unsigned Num = C.getLimitedValue();
4276 APInt Limit = APInt::getOneBitSet(BitWidth, BitWidth - Num - 1);
4277 return CmpInst::Create(Instruction::ICmp, ICmpInst::ICMP_ULT,
4278 II->getArgOperand(0), ConstantInt::get(Ty, Limit));
4279 }
4280
4281 // ctlz(0bXXXXXXXX) < 3 -> 0bXXXXXXXX > 0b00011111
4282 if (Pred == ICmpInst::ICMP_ULT && C.uge(1) && C.ule(BitWidth)) {
4283 unsigned Num = C.getLimitedValue();
4285 return CmpInst::Create(Instruction::ICmp, ICmpInst::ICMP_UGT,
4286 II->getArgOperand(0), ConstantInt::get(Ty, Limit));
4287 }
4288 break;
4289 }
4290 case Intrinsic::cttz: {
4291 // Limit to one use to ensure we don't increase instruction count.
4292 if (!II->hasOneUse())
4293 return nullptr;
4294
4295 // cttz(0bXXXXXXXX) > 3 -> 0bXXXXXXXX & 0b00001111 == 0
4296 if (Pred == ICmpInst::ICMP_UGT && C.ult(BitWidth)) {
4297 APInt Mask = APInt::getLowBitsSet(BitWidth, C.getLimitedValue() + 1);
4298 return CmpInst::Create(Instruction::ICmp, ICmpInst::ICMP_EQ,
4299 Builder.CreateAnd(II->getArgOperand(0), Mask),
4301 }
4302
4303 // cttz(0bXXXXXXXX) < 3 -> 0bXXXXXXXX & 0b00000111 != 0
4304 if (Pred == ICmpInst::ICMP_ULT && C.uge(1) && C.ule(BitWidth)) {
4305 APInt Mask = APInt::getLowBitsSet(BitWidth, C.getLimitedValue());
4306 return CmpInst::Create(Instruction::ICmp, ICmpInst::ICMP_NE,
4307 Builder.CreateAnd(II->getArgOperand(0), Mask),
4309 }
4310 break;
4311 }
4312 case Intrinsic::ssub_sat:
4313 // ssub.sat(a, b) spred 0 -> a spred b
4314 if (ICmpInst::isSigned(Pred)) {
4315 if (C.isZero())
4316 return new ICmpInst(Pred, II->getArgOperand(0), II->getArgOperand(1));
4317 // X s<= 0 is canonicalized to X s< 1
4318 if (Pred == ICmpInst::ICMP_SLT && C.isOne())
4319 return new ICmpInst(ICmpInst::ICMP_SLE, II->getArgOperand(0),
4320 II->getArgOperand(1));
4321 // X s>= 0 is canonicalized to X s> -1
4322 if (Pred == ICmpInst::ICMP_SGT && C.isAllOnes())
4323 return new ICmpInst(ICmpInst::ICMP_SGE, II->getArgOperand(0),
4324 II->getArgOperand(1));
4325 }
4326 break;
4327 default:
4328 break;
4329 }
4330
4331 return nullptr;
4332}
4333
4334/// Handle icmp with constant (but not simple integer constant) RHS.
// NOTE(review): this is a doxygen listing; hyperlinked lines were dropped by
// extraction — the function signature at original line 4335 and the
// null-pointer/zero constant argument at 4349 are missing here.
// Both transforms only fire when LHS is an instruction and RHS a Constant.
4336  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
4337  Constant *RHSC = dyn_cast<Constant>(Op1);
4338  Instruction *LHSI = dyn_cast<Instruction>(Op0);
4339  if (!RHSC || !LHSI)
4340    return nullptr;
4341
4342  switch (LHSI->getOpcode()) {
4343  case Instruction::IntToPtr:
4344    // icmp pred inttoptr(X), null -> icmp pred X, 0
// Only legal when the integer source type matches the DataLayout's pointer-
// sized integer type, so no truncation/extension semantics are lost.
4345    if (RHSC->isNullValue() &&
4346        DL.getIntPtrType(RHSC->getType()) == LHSI->getOperand(0)->getType())
4347      return new ICmpInst(
4348          I.getPredicate(), LHSI->getOperand(0),
4350    break;
4351
4352  case Instruction::Load:
4353    // Try to optimize things like "A[i] > 4" to index computations.
// Requires load-of-GEP-of-GlobalVariable shape; the heavy lifting is done by
// foldCmpLoadFromIndexedGlobal.
4354    if (GetElementPtrInst *GEP =
4355            dyn_cast<GetElementPtrInst>(LHSI->getOperand(0)))
4356      if (GlobalVariable *GV = dyn_cast<GlobalVariable>(GEP->getOperand(0)))
4357        if (Instruction *Res =
4358                foldCmpLoadFromIndexedGlobal(cast<LoadInst>(LHSI), GEP, GV, I))
4359          return Res;
4360    break;
4361  }
4362
4363  return nullptr;
4364}
4365
// NOTE(review): the first line of this function's signature (original line
// 4366) was dropped by the doxygen extraction; only the trailing parameters
// remain below. The body folds `icmp Pred (select C, A, B), RHS` into
// `select C, (icmp A, RHS), (icmp B, RHS)` when profitable.
4367                                              Value *RHS, const ICmpInst &I) {
4368  // Try to fold the comparison into the select arms, which will cause the
4369  // select to be converted into a logical and/or.
4370  auto SimplifyOp = [&](Value *Op, bool SelectCondIsTrue) -> Value * {
4371    if (Value *Res = simplifyICmpInst(Pred, Op, RHS, SQ))
4372      return Res;
// Also accept a value implied by the select's own condition on this arm.
4373    if (std::optional<bool> Impl = isImpliedCondition(
4374            SI->getCondition(), Pred, Op, RHS, DL, SelectCondIsTrue))
4375      return ConstantInt::get(I.getType(), *Impl);
4376    return nullptr;
4377  };
4378
// CI tracks whichever simplified arm is a ConstantInt; used below to decide
// the "global" replacement direction.
4379  ConstantInt *CI = nullptr;
4380  Value *Op1 = SimplifyOp(SI->getOperand(1), true);
4381  if (Op1)
4382    CI = dyn_cast<ConstantInt>(Op1);
4383
4384  Value *Op2 = SimplifyOp(SI->getOperand(2), false);
4385  if (Op2)
4386    CI = dyn_cast<ConstantInt>(Op2);
4387
4388  auto Simplifies = [&](Value *Op, unsigned Idx) {
4389    // A comparison of ucmp/scmp with a constant will fold into an icmp.
4390    const APInt *Dummy;
4391    return Op ||
4392           (isa<CmpIntrinsic>(SI->getOperand(Idx)) &&
4393            SI->getOperand(Idx)->hasOneUse() && match(RHS, m_APInt(Dummy)));
4394  };
4395
4396  // We only want to perform this transformation if it will not lead to
4397  // additional code. This is true if either both sides of the select
4398  // fold to a constant (in which case the icmp is replaced with a select
4399  // which will usually simplify) or this is the only user of the
4400  // select (in which case we are trading a select+icmp for a simpler
4401  // select+icmp) or all uses of the select can be replaced based on
4402  // dominance information ("Global cases").
4403  bool Transform = false;
4404  if (Op1 && Op2)
4405    Transform = true;
4406  else if (Simplifies(Op1, 1) || Simplifies(Op2, 2)) {
4407    // Local case
4408    if (SI->hasOneUse())
4409      Transform = true;
4410    // Global cases
4411    else if (CI && !CI->isZero())
4412      // When Op1 is constant try replacing select with second operand.
4413      // Otherwise Op2 is constant and try replacing select with first
4414      // operand.
4415      Transform = replacedSelectWithOperand(SI, &I, Op1 ? 2 : 1);
4416  }
4417  if (Transform) {
// Materialize whichever arm did not simplify as a fresh icmp.
4418    if (!Op1)
4419      Op1 = Builder.CreateICmp(Pred, SI->getOperand(1), RHS, I.getName());
4420    if (!Op2)
4421      Op2 = Builder.CreateICmp(Pred, SI->getOperand(2), RHS, I.getName());
4422    return SelectInst::Create(SI->getOperand(0), Op1, Op2);
4423  }
4424
4425  return nullptr;
4426}
4427
4428// Returns whether V is a Mask ((X + 1) & X == 0) or ~Mask (-Pow2OrZero)
// A "Mask" is a value whose set bits, if any, form a contiguous run in the
// low bits (0...0111...1 or zero); a "~Mask" is its complement shape
// (111...1000...0 or zero). `Not` selects which of the two we test for.
// NOTE(review): the extraction dropped original line 4435 — by upstream
// convention a recursion-depth cutoff guards the `return false;` at 4436.
4429static bool isMaskOrZero(const Value *V, bool Not, const SimplifyQuery &Q,
4430                         unsigned Depth = 0) {
4431  if (Not ? match(V, m_NegatedPower2OrZero()) : match(V, m_LowBitMaskOrZero()))
4432    return true;
// An i1 value is trivially both a mask and a ~mask (0 or 1 == 0 or -1).
4433  if (V->getType()->getScalarSizeInBits() == 1)
4434    return true;
4436    return false;
4437  Value *X;
4438  const Instruction *I = dyn_cast<Instruction>(V);
4439  if (!I)
4440    return false;
4441  switch (I->getOpcode()) {
4442  case Instruction::ZExt:
4443    // ZExt(Mask) is a Mask.
// (zext of a ~Mask introduces leading zeros, breaking the ~Mask shape,
// hence the !Not restriction.)
4444    return !Not && isMaskOrZero(I->getOperand(0), Not, Q, Depth);
4445  case Instruction::SExt:
4446    // SExt(Mask) is a Mask.
4447    // SExt(~Mask) is a ~Mask.
4448    return isMaskOrZero(I->getOperand(0), Not, Q, Depth);
4449  case Instruction::And:
4450  case Instruction::Or:
4451    // Mask0 | Mask1 is a Mask.
4452    // Mask0 & Mask1 is a Mask.
4453    // ~Mask0 | ~Mask1 is a ~Mask.
4454    // ~Mask0 & ~Mask1 is a ~Mask.
4455    return isMaskOrZero(I->getOperand(1), Not, Q, Depth) &&
4456           isMaskOrZero(I->getOperand(0), Not, Q, Depth);
4457  case Instruction::Xor:
// not(Mask) is a ~Mask and vice versa: flip `Not` through the inversion.
4458    if (match(V, m_Not(m_Value(X))))
4459      return isMaskOrZero(X, !Not, Q, Depth);
4460
4461    // (X ^ -X) is a ~Mask
4462    if (Not)
4463      return match(V, m_c_Xor(m_Value(X), m_Neg(m_Deferred(X))));
4464    // (X ^ (X - 1)) is a Mask
4465    else
4466      return match(V, m_c_Xor(m_Value(X), m_Add(m_Deferred(X), m_AllOnes())));
4467  case Instruction::Select:
4468    // c ? Mask0 : Mask1 is a Mask.
4469    return isMaskOrZero(I->getOperand(1), Not, Q, Depth) &&
4470           isMaskOrZero(I->getOperand(2), Not, Q, Depth);
4471  case Instruction::Shl:
4472    // (~Mask) << X is a ~Mask.
4473    return Not && isMaskOrZero(I->getOperand(0), Not, Q, Depth);
4474  case Instruction::LShr:
4475    // Mask >> X is a Mask.
4476    return !Not && isMaskOrZero(I->getOperand(0), Not, Q, Depth);
4477  case Instruction::AShr:
4478    // Mask s>> X is a Mask.
4479    // ~Mask s>> X is a ~Mask.
4480    return isMaskOrZero(I->getOperand(0), Not, Q, Depth);
4481  case Instruction::Add:
4482    // Pow2 - 1 is a Mask.
4483    if (!Not && match(I->getOperand(1), m_AllOnes()))
4484      return isKnownToBeAPowerOfTwo(I->getOperand(0), Q.DL, /*OrZero*/ true,
4485                                    Q.AC, Q.CxtI, Q.DT, Depth);
4486    break;
4487  case Instruction::Sub:
4488    // -Pow2 is a ~Mask.
4489    if (Not && match(I->getOperand(0), m_Zero()))
4490      return isKnownToBeAPowerOfTwo(I->getOperand(1), Q.DL, /*OrZero*/ true,
4491                                    Q.AC, Q.CxtI, Q.DT, Depth);
4492    break;
4493  case Instruction::Call: {
4494    if (auto *II = dyn_cast<IntrinsicInst>(I)) {
4495      switch (II->getIntrinsicID()) {
4496      // min/max(Mask0, Mask1) is a Mask.
4497      // min/max(~Mask0, ~Mask1) is a ~Mask.
4498      case Intrinsic::umax:
4499      case Intrinsic::smax:
4500      case Intrinsic::umin:
4501      case Intrinsic::smin:
4502        return isMaskOrZero(II->getArgOperand(1), Not, Q, Depth) &&
4503               isMaskOrZero(II->getArgOperand(0), Not, Q, Depth);
4504
4505        // In the context of masks, bitreverse(Mask) == ~Mask
4506      case Intrinsic::bitreverse:
4507        return isMaskOrZero(II->getArgOperand(0), !Not, Q, Depth);
4508      default:
4509        break;
4510      }
4511    }
4512    break;
4513  }
4514  default:
4515    break;
4516  }
4517  return false;
4518}
4519
4520/// Some comparisons can be simplified.
4521/// In this case, we are looking for comparisons that look like
4522/// a check for a lossy truncation.
4523/// Folds:
4524///   icmp SrcPred (x & Mask), x    to    icmp DstPred x, Mask
4525///   icmp SrcPred (x & ~Mask), ~Mask    to    icmp DstPred x, ~Mask
4526///   icmp eq/ne (x & ~Mask), 0     to    icmp DstPred x, Mask
4527///   icmp eq/ne (~x | Mask), -1     to    icmp DstPred x, Mask
4528/// Where Mask is some pattern that produces all-ones in low bits:
4529///    (-1 >> y)
4530///    ((-1 << y) >> y)     <- non-canonical, has extra uses
4531///    ~(-1 << y)
4532///    ((1 << y) + (-1))    <- non-canonical, has extra uses
4533/// The Mask can be a constant, too.
4534/// For some predicates, the operands are commutative.
4535/// For others, x can only be on a specific side.
// NOTE(review): the doxygen extraction dropped every hyperlinked line in this
// function — the signature's first line (4536), all `case ICmpInst::ICMP_*:`
// labels (4542/4551/4560/4567/4574/4581), and the `DstPred = ...` assignments
// (4549/4558/4565/4572/4579/4586). The surviving comments document which
// source predicate each missing case handled and the DstPred it produced.
4537                                            Value *Op1, const SimplifyQuery &Q,
4538                                            InstCombiner &IC) {
4539
4540  ICmpInst::Predicate DstPred;
4541  switch (Pred) {
4543    // x & Mask == x
4544    // x & ~Mask == 0
4545    // ~x | Mask == -1
4546    //   -> x u<= Mask
4547    // x & ~Mask == ~Mask
4548    //   -> ~Mask u<= x
4550    break;
4552    // x & Mask != x
4553    // x & ~Mask != 0
4554    // ~x | Mask != -1
4555    //   -> x u> Mask
4556    // x & ~Mask != ~Mask
4557    //   -> ~Mask u> x
4559    break;
4561    // x & Mask u< x
4562    //   -> x u> Mask
4563    // x & ~Mask u< ~Mask
4564    //   -> ~Mask u> x
4566    break;
4568    // x & Mask u>= x
4569    //   -> x u<= Mask
4570    // x & ~Mask u>= ~Mask
4571    //   -> ~Mask u<= x
4573    break;
4575    // x & Mask s< x [iff Mask s>= 0]
4576    //   -> x s> Mask
4577    // x & ~Mask s< ~Mask [iff ~Mask != 0]
4578    //   -> ~Mask s> x
4580    break;
4582    // x & Mask s>= x [iff Mask s>= 0]
4583    //   -> x s<= Mask
4584    // x & ~Mask s>= ~Mask [iff ~Mask != 0]
4585    //   -> ~Mask s<= x
4587    break;
4588  default:
4589    // We don't support sgt,sle
4590    // ult/ugt are simplified to true/false respectively.
4591    return nullptr;
4592  }
4593
4594  Value *X, *M;
4595  // Put search code in lambda for early positive returns.
4596  auto IsLowBitMask = [&]() {
4597    if (match(Op0, m_c_And(m_Specific(Op1), m_Value(M)))) {
4598      X = Op1;
4599      // Look for: x & Mask pred x
4600      if (isMaskOrZero(M, /*Not=*/false, Q)) {
// Signed predicates additionally require the mask be provably non-negative.
4601        return !ICmpInst::isSigned(Pred) ||
4602               (match(M, m_NonNegative()) || isKnownNonNegative(M, Q));
4603      }
4604
4605      // Look for: x & ~Mask pred ~Mask
4606      if (isMaskOrZero(X, /*Not=*/true, Q)) {
4607        return !ICmpInst::isSigned(Pred) || isKnownNonZero(X, Q);
4608      }
4609      return false;
4610    }
4611    if (ICmpInst::isEquality(Pred) && match(Op1, m_AllOnes()) &&
4612        match(Op0, m_OneUse(m_Or(m_Value(X), m_Value(M))))) {
4613
4614      auto Check = [&]() {
4615        // Look for: ~x | Mask == -1
4616        if (isMaskOrZero(M, /*Not=*/false, Q)) {
4617          if (Value *NotX =
4618                  IC.getFreelyInverted(X, X->hasOneUse(), &IC.Builder)) {
4619            X = NotX;
4620            return true;
4621          }
4622        }
4623        return false;
4624      };
// `or` is commutative: retry with the operands swapped.
4625      if (Check())
4626        return true;
4627      std::swap(X, M);
4628      return Check();
4629    }
4630    if (ICmpInst::isEquality(Pred) && match(Op1, m_Zero()) &&
4631        match(Op0, m_OneUse(m_And(m_Value(X), m_Value(M))))) {
4632      auto Check = [&]() {
4633        // Look for: x & ~Mask == 0
4634        if (isMaskOrZero(M, /*Not=*/true, Q)) {
4635          if (Value *NotM =
4636                  IC.getFreelyInverted(M, M->hasOneUse(), &IC.Builder)) {
4637            M = NotM;
4638            return true;
4639          }
4640        }
4641        return false;
4642      };
4643      if (Check())
4644        return true;
4645      std::swap(X, M);
4646      return Check();
4647    }
4648    return false;
4649  };
4650
4651  if (!IsLowBitMask())
4652    return nullptr;
4653
4654  return IC.Builder.CreateICmp(DstPred, X, M);
4655}
4656
4657/// Some comparisons can be simplified.
4658/// In this case, we are looking for comparisons that look like
4659/// a check for a lossy signed truncation.
4660/// Folds:   (MaskedBits is a constant.)
4661///   ((%x << MaskedBits) a>> MaskedBits) SrcPred %x
4662/// Into:
4663///   (add %x, (1 << (KeptBits-1))) DstPred (1 << KeptBits)
4664/// Where KeptBits = bitwidth(%x) - MaskedBits
// NOTE(review): hyperlinked lines were dropped by extraction — the function
// name on the signature (4666), part of the shl/ashr matcher (4673), the
// `case ICmpInst::ICMP_EQ:`/`ICMP_NE:` labels (4692/4698), and the
// `DstPred = ...` assignments (4696/4702).
4665static Value *
4667                                        InstCombiner::BuilderTy &Builder) {
4668  CmpPredicate SrcPred;
4669  Value *X;
4670  const APInt *C0, *C1; // FIXME: non-splats, potentially with undef.
4671  // We are ok with 'shl' having multiple uses, but 'ashr' must be one-use.
4672  if (!match(&I, m_c_ICmp(SrcPred,
4674                                                    m_APInt(C1))),
4675                          m_Deferred(X))))
4676    return nullptr;
4677
4678  // Potential handling of non-splats: for each element:
4679  //  * if both are undef, replace with constant 0.
4680  //    Because (1<<0) is OK and is 1, and ((1<<0)>>1) is also OK and is 0.
4681  //  * if both are not undef, and are different, bailout.
4682  //  * else, only one is undef, then pick the non-undef one.
4683
4684  // The shift amount must be equal.
4685  if (*C0 != *C1)
4686    return nullptr;
4687  const APInt &MaskedBits = *C0;
4688  assert(MaskedBits != 0 && "shift by zero should be folded away already.");
4689
4690  ICmpInst::Predicate DstPred;
4691  switch (SrcPred) {
4693    // ((%x << MaskedBits) a>> MaskedBits) == %x
4694    //   =>
4695    // (add %x, (1 << (KeptBits-1))) u< (1 << KeptBits)
4697    break;
4699    // ((%x << MaskedBits) a>> MaskedBits) != %x
4700    //   =>
4701    // (add %x, (1 << (KeptBits-1))) u>= (1 << KeptBits)
4703    break;
4704  // FIXME: are more folds possible?
4705  default:
4706    return nullptr;
4707  }
4708
4709  auto *XType = X->getType();
4710  const unsigned XBitWidth = XType->getScalarSizeInBits();
4711  const APInt BitWidth = APInt(XBitWidth, XBitWidth);
4712  assert(BitWidth.ugt(MaskedBits) && "shifts should leave some bits untouched");
4713
4714  // KeptBits = bitwidth(%x) - MaskedBits
4715  const APInt KeptBits = BitWidth - MaskedBits;
4716  assert(KeptBits.ugt(0) && KeptBits.ult(BitWidth) && "unreachable");
4717  // ICmpCst = (1 << KeptBits)
4718  const APInt ICmpCst = APInt(XBitWidth, 1).shl(KeptBits);
4719  assert(ICmpCst.isPowerOf2());
4720  // AddCst = (1 << (KeptBits-1))
4721  const APInt AddCst = ICmpCst.lshr(1);
4722  assert(AddCst.ult(ICmpCst) && AddCst.isPowerOf2());
4723
4724  // T0 = add %x, AddCst
4725  Value *T0 = Builder.CreateAdd(X, ConstantInt::get(XType, AddCst));
4726  // T1 = T0 DstPred ICmpCst
4727  Value *T1 = Builder.CreateICmp(DstPred, T0, ConstantInt::get(XType, ICmpCst));
4728
4729  return T1;
4730}
4731
4732// Given pattern:
4733//   icmp eq/ne (and ((x shift Q), (y oppositeshift K))), 0
4734// we should move shifts to the same hand of 'and', i.e. rewrite as
4735//   icmp eq/ne (and (x shift (Q+K)), y), 0  iff (Q+K) u< bitwidth(x)
4736// We are only interested in opposite logical shifts here.
4737// One of the shifts can be truncated.
4738// If we can, we want to end up creating 'lshr' shift.
// NOTE(review): hyperlinked lines were dropped by extraction — the
// signature's first line (4740), part of the trunc-or-self matcher (4754),
// and the max-representable-shift computation (4820) are missing below.
4739static Value *
4741                                       InstCombiner::BuilderTy &Builder) {
4742  if (!I.isEquality() || !match(I.getOperand(1), m_Zero()) ||
4743      !I.getOperand(0)->hasOneUse())
4744    return nullptr;
4745
4746  auto m_AnyLogicalShift = m_LogicalShift(m_Value(), m_Value());
4747
4748  // Look for an 'and' of two logical shifts, one of which may be truncated.
4749  // We use m_TruncOrSelf() on the RHS to correctly handle commutative case.
4750  Instruction *XShift, *MaybeTruncation, *YShift;
4751  if (!match(
4752          I.getOperand(0),
4753          m_c_And(m_CombineAnd(m_AnyLogicalShift, m_Instruction(XShift)),
4755                                   m_AnyLogicalShift, m_Instruction(YShift))),
4756                               m_Instruction(MaybeTruncation)))))
4757    return nullptr;
4758
4759  // We potentially looked past 'trunc', but only when matching YShift,
4760  // therefore YShift must have the widest type.
4761  Instruction *WidestShift = YShift;
4762  // Therefore XShift must have the shallowest type.
4763  // Or they both have identical types if there was no truncation.
4764  Instruction *NarrowestShift = XShift;
4765
4766  Type *WidestTy = WidestShift->getType();
4767  Type *NarrowestTy = NarrowestShift->getType();
4768  assert(NarrowestTy == I.getOperand(0)->getType() &&
4769         "We did not look past any shifts while matching XShift though.");
4770  bool HadTrunc = WidestTy != I.getOperand(0)->getType();
4771
4772  // If YShift is a 'lshr', swap the shifts around.
// This biases the rewrite toward producing an 'lshr' (see header comment).
4773  if (match(YShift, m_LShr(m_Value(), m_Value())))
4774    std::swap(XShift, YShift);
4775
4776  // The shifts must be in opposite directions.
4777  auto XShiftOpcode = XShift->getOpcode();
4778  if (XShiftOpcode == YShift->getOpcode())
4779    return nullptr; // Do not care about same-direction shifts here.
4780
4781  Value *X, *XShAmt, *Y, *YShAmt;
4782  match(XShift, m_BinOp(m_Value(X), m_ZExtOrSelf(m_Value(XShAmt))));
4783  match(YShift, m_BinOp(m_Value(Y), m_ZExtOrSelf(m_Value(YShAmt))));
4784
4785  // If one of the values being shifted is a constant, then we will end with
4786  // and+icmp, and [zext+]shift instrs will be constant-folded. If they are not,
4787  // however, we will need to ensure that we won't increase instruction count.
4788  if (!isa<Constant>(X) && !isa<Constant>(Y)) {
4789    // At least one of the hands of the 'and' should be one-use shift.
4790    if (!match(I.getOperand(0),
4791               m_c_And(m_OneUse(m_AnyLogicalShift), m_Value())))
4792      return nullptr;
4793    if (HadTrunc) {
4794      // Due to the 'trunc', we will need to widen X. For that either the old
4795      // 'trunc' or the shift amt in the non-truncated shift should be one-use.
4796      if (!MaybeTruncation->hasOneUse() &&
4797          !NarrowestShift->getOperand(1)->hasOneUse())
4798        return nullptr;
4799    }
4800  }
4801
4802  // We have two shift amounts from two different shifts. The types of those
4803  // shift amounts may not match. If that's the case let's bailout now.
4804  if (XShAmt->getType() != YShAmt->getType())
4805    return nullptr;
4806
4807  // As input, we have the following pattern:
4808  //   icmp eq/ne (and ((x shift Q), (y oppositeshift K))), 0
4809  // We want to rewrite that as:
4810  //   icmp eq/ne (and (x shift (Q+K)), y), 0  iff (Q+K) u< bitwidth(x)
4811  // While we know that originally (Q+K) would not overflow
4812  // (because 2 * (N-1) u<= iN -1), we have looked past extensions of
4813  // shift amounts. so it may now overflow in smaller bitwidth.
4814  // To ensure that does not happen, we need to ensure that the total maximal
4815  // shift amount is still representable in that smaller bit width.
4816  unsigned MaximalPossibleTotalShiftAmount =
4817      (WidestTy->getScalarSizeInBits() - 1) +
4818      (NarrowestTy->getScalarSizeInBits() - 1);
4819  APInt MaximalRepresentableShiftAmount =
4821  if (MaximalRepresentableShiftAmount.ult(MaximalPossibleTotalShiftAmount))
4822    return nullptr;
4823
4824  // Can we fold (XShAmt+YShAmt) ?
4825  auto *NewShAmt = dyn_cast_or_null<Constant>(
4826      simplifyAddInst(XShAmt, YShAmt, /*isNSW=*/false,
4827                      /*isNUW=*/false, SQ.getWithInstruction(&I)));
4828  if (!NewShAmt)
4829    return nullptr;
4830  if (NewShAmt->getType() != WidestTy) {
4831    NewShAmt =
4832        ConstantFoldCastOperand(Instruction::ZExt, NewShAmt, WidestTy, SQ.DL);
4833    if (!NewShAmt)
4834      return nullptr;
4835  }
4836  unsigned WidestBitWidth = WidestTy->getScalarSizeInBits();
4837
4838  // Is the new shift amount smaller than the bit width?
4839  // FIXME: could also rely on ConstantRange.
4840  if (!match(NewShAmt,
4842                                APInt(WidestBitWidth, WidestBitWidth))))
4843    return nullptr;
4844
4845  // An extra legality check is needed if we had trunc-of-lshr.
4846  if (HadTrunc && match(WidestShift, m_LShr(m_Value(), m_Value()))) {
4847    auto CanFold = [NewShAmt, WidestBitWidth, NarrowestShift, SQ,
4848                    WidestShift]() {
4849      // It isn't obvious whether it's worth it to analyze non-constants here.
4850      // Also, let's basically give up on non-splat cases, pessimizing vectors.
4851      // If *any* of these preconditions matches we can perform the fold.
4852      Constant *NewShAmtSplat = NewShAmt->getType()->isVectorTy()
4853                                    ? NewShAmt->getSplatValue()
4854                                    : NewShAmt;
4855      // If it's edge-case shift (by 0 or by WidestBitWidth-1) we can fold.
4856      if (NewShAmtSplat &&
4857          (NewShAmtSplat->isNullValue() ||
4858           NewShAmtSplat->getUniqueInteger() == WidestBitWidth - 1))
4859        return true;
4860      // We consider *min* leading zeros so a single outlier
4861      // blocks the transform as opposed to allowing it.
4862      if (auto *C = dyn_cast<Constant>(NarrowestShift->getOperand(0))) {
4863        KnownBits Known = computeKnownBits(C, SQ.DL);
4864        unsigned MinLeadZero = Known.countMinLeadingZeros();
4865        // If the value being shifted has at most lowest bit set we can fold.
4866        unsigned MaxActiveBits = Known.getBitWidth() - MinLeadZero;
4867        if (MaxActiveBits <= 1)
4868          return true;
4869        // Precondition:  NewShAmt u<= countLeadingZeros(C)
4870        if (NewShAmtSplat && NewShAmtSplat->getUniqueInteger().ule(MinLeadZero))
4871          return true;
4872      }
4873      if (auto *C = dyn_cast<Constant>(WidestShift->getOperand(0))) {
4874        KnownBits Known = computeKnownBits(C, SQ.DL);
4875        unsigned MinLeadZero = Known.countMinLeadingZeros();
4876        // If the value being shifted has at most lowest bit set we can fold.
4877        unsigned MaxActiveBits = Known.getBitWidth() - MinLeadZero;
4878        if (MaxActiveBits <= 1)
4879          return true;
4880        // Precondition:  ((WidestBitWidth-1)-NewShAmt) u<= countLeadingZeros(C)
4881        if (NewShAmtSplat) {
4882          APInt AdjNewShAmt =
4883              (WidestBitWidth - 1) - NewShAmtSplat->getUniqueInteger();
4884          if (AdjNewShAmt.ule(MinLeadZero))
4885            return true;
4886        }
4887      }
4888      return false; // Can't tell if it's ok.
4889    };
4890    if (!CanFold())
4891      return nullptr;
4892  }
4893
4894  // All good, we can do this fold.
4895  X = Builder.CreateZExt(X, WidestTy);
4896  Y = Builder.CreateZExt(Y, WidestTy);
4897  // The shift is the same that was for X.
4898  Value *T0 = XShiftOpcode == Instruction::BinaryOps::LShr
4899                  ? Builder.CreateLShr(X, NewShAmt)
4900                  : Builder.CreateShl(X, NewShAmt);
4901  Value *T1 = Builder.CreateAnd(T0, Y);
4902  return Builder.CreateICmp(I.getPredicate(), T1,
4903                            Constant::getNullValue(WidestTy));
4904}
4905
4906/// Fold
4907///   (-1 u/ x) u< y
4908///   ((x * y) ?/ x) != y
4909/// to
4910///   @llvm.?mul.with.overflow(x, y) plus extraction of overflow bit
4911/// Note that the comparison is commutative, while inverted (u>=, ==) predicate
4912/// will mean that we are looking for the opposite answer.
// NOTE(review): hyperlinked lines were dropped by extraction — the signature
// (4913), the `Mul` declaration (4916), the u-div matcher line (4922), the
// `case ICmpInst::ICMP_ULT:`/`ICMP_UGE:` labels (4929/4932), the mul matcher
// lines (4941-4944), the insertion-point save (4951), the SetInsertPoint call
// (4956), the CreateIntrinsic line (4958), and eraseInstFromFunction (4976).
4914  CmpPredicate Pred;
4915  Value *X, *Y;
4917  Instruction *Div;
4918  bool NeedNegation;
4919  // Look for: (-1 u/ x) u</u>= y
4920  if (!I.isEquality() &&
4921      match(&I, m_c_ICmp(Pred,
4923                                      m_Instruction(Div)),
4924                         m_Value(Y)))) {
4925    Mul = nullptr;
4926
4927    // Are we checking that overflow does not happen, or does happen?
4928    switch (Pred) {
4930      NeedNegation = false;
4931      break; // OK
4933      NeedNegation = true;
4934      break; // OK
4935    default:
4936      return nullptr; // Wrong predicate.
4937    }
4938  } else // Look for: ((x * y) / x) !=/== y
4939    if (I.isEquality() &&
4940        match(&I, m_c_ICmp(Pred, m_Value(Y),
4943                                                      m_Value(X)),
4945                                                  m_Deferred(X))),
4946                                      m_Instruction(Div))))) {
4947      NeedNegation = Pred == ICmpInst::Predicate::ICMP_EQ;
4948    } else
4949      return nullptr;
4950
4952  // If the pattern included (x * y), we'll want to insert new instructions
4953  // right before that original multiplication so that we can replace it.
4954  bool MulHadOtherUses = Mul && !Mul->hasOneUse();
4955  if (MulHadOtherUses)
4957
4959      Div->getOpcode() == Instruction::UDiv ? Intrinsic::umul_with_overflow
4960                                            : Intrinsic::smul_with_overflow,
4961      X->getType(), {X, Y}, /*FMFSource=*/nullptr, "mul");
4962
4963  // If the multiplication was used elsewhere, to ensure that we don't leave
4964  // "duplicate" instructions, replace uses of that original multiplication
4965  // with the multiplication result from the with.overflow intrinsic.
4966  if (MulHadOtherUses)
4967    replaceInstUsesWith(*Mul, Builder.CreateExtractValue(Call, 0, "mul.val"));
4968
4969  Value *Res = Builder.CreateExtractValue(Call, 1, "mul.ov");
4970  if (NeedNegation) // This technically increases instruction count.
4971    Res = Builder.CreateNot(Res, "mul.not.ov");
4972
4973  // If we replaced the mul, erase it. Do this after all uses of Builder,
4974  // as the mul is used as insertion point.
4975  if (MulHadOtherUses)
4977
4978  return Res;
4979}
4980
// Folds comparisons of a value against its own negation:
//   icmp Pred (sub nsw 0, X), X  -->  icmp Pred' X, 0
//   icmp eq/ne (sub 0, X), X     -->  icmp eq/ne (X & SignedMax), 0
// NOTE(review): the signature's first line (original 4981) was dropped by
// the doxygen extraction; only the trailing Builder parameter remains.
4982                                   InstCombiner::BuilderTy &Builder) {
4983  CmpPredicate Pred;
4984  Value *X;
4985  if (match(&I, m_c_ICmp(Pred, m_NSWNeg(m_Value(X)), m_Deferred(X)))) {
4986
// For -X pred X: signed predicates swap sides; unsigned ones become the
// corresponding signed compare against zero; equality stays as-is.
4987    if (ICmpInst::isSigned(Pred))
4988      Pred = ICmpInst::getSwappedPredicate(Pred);
4989    else if (ICmpInst::isUnsigned(Pred))
4990      Pred = ICmpInst::getSignedPredicate(Pred);
4991    // else for equality-comparisons just keep the predicate.
4992
4993    return ICmpInst::Create(Instruction::ICmp, Pred, X,
4994                            Constant::getNullValue(X->getType()), I.getName());
4995  }
4996
4997  // A value is not equal to its negation unless that value is 0 or
4998  // MinSignedValue, ie: a != -a --> (a & MaxSignedVal) != 0
4999  if (match(&I, m_c_ICmp(Pred, m_OneUse(m_Neg(m_Value(X))), m_Deferred(X))) &&
5000      ICmpInst::isEquality(Pred)) {
5001    Type *Ty = X->getType();
// NOTE(review): the BitWidth initialization line (original 5002) was dropped
// by extraction; it feeds getSignedMaxValue below.
5003    Constant *MaxSignedVal =
5004        ConstantInt::get(Ty, APInt::getSignedMaxValue(BitWidth));
5005    Value *And = Builder.CreateAnd(X, MaxSignedVal);
5006    Constant *Zero = Constant::getNullValue(Ty);
5007    return CmpInst::Create(Instruction::ICmp, Pred, And, Zero);
5008  }
5009
5010  return nullptr;
5011}
5012
// Folds comparisons between (X & Y) and one of its own operands.
// NOTE(review): the signature's first line (original 5013) was dropped by the
// doxygen extraction; only the trailing IC parameter remains.
5014                                  InstCombinerImpl &IC) {
5015  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1), *A;
5016  // Normalize and operand as operand 0.
5017  CmpInst::Predicate Pred = I.getPredicate();
5018  if (match(Op1, m_c_And(m_Specific(Op0), m_Value()))) {
5019    std::swap(Op0, Op1);
5020    Pred = ICmpInst::getSwappedPredicate(Pred);
5021  }
5022
5023  if (!match(Op0, m_c_And(m_Specific(Op1), m_Value(A))))
5024    return nullptr;
5025
// (X & Y) u<= X always holds, so u< / u>= collapse to inequality / equality.
5026  // (icmp (X & Y) u< X --> (X & Y) != X
5027  if (Pred == ICmpInst::ICMP_ULT)
5028    return new ICmpInst(ICmpInst::ICMP_NE, Op0, Op1);
5029
5030  // (icmp (X & Y) u>= X --> (X & Y) == X
5031  if (Pred == ICmpInst::ICMP_UGE)
5032    return new ICmpInst(ICmpInst::ICMP_EQ, Op0, Op1);
5033
5034  if (ICmpInst::isEquality(Pred) && Op0->hasOneUse()) {
5035    // icmp (X & Y) eq/ne Y --> (X | ~Y) eq/ne -1 if Y is freely invertible and
5036    // Y is non-constant. If Y is constant the `X & C == C` form is preferable
5037    // so don't do this fold.
5038    if (!match(Op1, m_ImmConstant()))
5039      if (auto *NotOp1 =
5040              IC.getFreelyInverted(Op1, !Op1->hasNUsesOrMore(3), &IC.Builder))
5041        return new ICmpInst(Pred, IC.Builder.CreateOr(A, NotOp1),
5042                            Constant::getAllOnesValue(Op1->getType()));
5043    // icmp (X & Y) eq/ne Y --> (~X & Y) eq/ne 0 if X is freely invertible.
5044    if (auto *NotA = IC.getFreelyInverted(A, A->hasOneUse(), &IC.Builder))
5045      return new ICmpInst(Pred, IC.Builder.CreateAnd(Op1, NotA),
5046                          Constant::getNullValue(Op1->getType()));
5047  }
5048
5049  if (!ICmpInst::isSigned(Pred))
5050    return nullptr;
5051
5052  KnownBits KnownY = IC.computeKnownBits(A, &I);
5053  // (X & NegY) spred X --> (X & NegY) upred X
5054  if (KnownY.isNegative())
5055    return new ICmpInst(ICmpInst::getUnsignedPredicate(Pred), Op0, Op1);
5056
5057  if (Pred != ICmpInst::ICMP_SLE && Pred != ICmpInst::ICMP_SGT)
5058    return nullptr;
5059
5060  if (KnownY.isNonNegative())
5061    // (X & PosY) s<= X --> X s>= 0
5062    // (X & PosY) s> X --> X s< 0
5063    return new ICmpInst(ICmpInst::getSwappedPredicate(Pred), Op1,
5064                        Constant::getNullValue(Op1->getType()));
5065
// NOTE(review): extraction dropped original lines 5066/5069 here — the
// negativity check on Op1 and the `return new ICmpInst(...)` that this
// getNullValue argument belongs to.
5067    // (NegX & Y) s<= NegX --> Y s< 0
5068    // (NegX & Y) s> NegX --> Y s>= 0
5070                        Constant::getNullValue(A->getType()));
5071
5072  return nullptr;
5073}
5074
// Folds comparisons between (X | Y) and one of its own operands.
// NOTE(review): the signature's first line (original 5075) was dropped by the
// doxygen extraction; only the trailing IC parameter remains.
5076                                 InstCombinerImpl &IC) {
5077  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1), *A;
5078
5079  // Normalize or operand as operand 0.
5080  CmpInst::Predicate Pred = I.getPredicate();
5081  if (match(Op1, m_c_Or(m_Specific(Op0), m_Value(A)))) {
5082    std::swap(Op0, Op1);
5083    Pred = ICmpInst::getSwappedPredicate(Pred);
5084  } else if (!match(Op0, m_c_Or(m_Specific(Op1), m_Value(A)))) {
5085    return nullptr;
5086  }
5087
// (X | Y) u>= X always holds, so u<= / u> collapse to equality / inequality.
5088  // icmp (X | Y) u<= X --> (X | Y) == X
5089  if (Pred == ICmpInst::ICMP_ULE)
5090    return new ICmpInst(ICmpInst::ICMP_EQ, Op0, Op1);
5091
5092  // icmp (X | Y) u> X --> (X | Y) != X
5093  if (Pred == ICmpInst::ICMP_UGT)
5094    return new ICmpInst(ICmpInst::ICMP_NE, Op0, Op1);
5095
5096  if (ICmpInst::isEquality(Pred) && Op0->hasOneUse()) {
5097    // icmp (X | Y) eq/ne Y --> (X & ~Y) eq/ne 0 if Y is freely invertible
5098    if (Value *NotOp1 = IC.getFreelyInverted(
5099            Op1, !isa<Constant>(Op1) && !Op1->hasNUsesOrMore(3), &IC.Builder))
5100      return new ICmpInst(Pred, IC.Builder.CreateAnd(A, NotOp1),
5101                          Constant::getNullValue(Op1->getType()));
5102    // icmp (X | Y) eq/ne Y --> (~X | Y) eq/ne -1 if X is freely invertible.
5103    if (Value *NotA = IC.getFreelyInverted(A, A->hasOneUse(), &IC.Builder))
5104      return new ICmpInst(Pred, IC.Builder.CreateOr(Op1, NotA),
5105                          Constant::getAllOnesValue(Op1->getType()));
5106  }
5107  return nullptr;
5108}
5109
// Folds comparisons between (X ^ Y) and one of its own operands.
// NOTE(review): the signature's first line (original 5110) was dropped by the
// doxygen extraction, as was line 5126 (the computation of PredOut, by the
// surrounding code a strict-predicate variant of Pred) used below.
5111                                  InstCombinerImpl &IC) {
5112  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1), *A;
5113  // Normalize xor operand as operand 0.
5114  CmpInst::Predicate Pred = I.getPredicate();
5115  if (match(Op1, m_c_Xor(m_Specific(Op0), m_Value()))) {
5116    std::swap(Op0, Op1);
5117    Pred = ICmpInst::getSwappedPredicate(Pred);
5118  }
5119  if (!match(Op0, m_c_Xor(m_Specific(Op1), m_Value(A))))
5120    return nullptr;
5121
// X ^ A can only equal X when A == 0, so a nonzero A tightens non-strict
// predicates to their strict forms.
5122  // icmp (X ^ Y_NonZero) u>= X --> icmp (X ^ Y_NonZero) u> X
5123  // icmp (X ^ Y_NonZero) u<= X --> icmp (X ^ Y_NonZero) u< X
5124  // icmp (X ^ Y_NonZero) s>= X --> icmp (X ^ Y_NonZero) s> X
5125  // icmp (X ^ Y_NonZero) s<= X --> icmp (X ^ Y_NonZero) s< X
5127  if (PredOut != Pred && isKnownNonZero(A, Q))
5128    return new ICmpInst(PredOut, Op0, Op1);
5129
5130  // These transform work when A is negative.
5131  // X s< X^A, X s<= X^A, X u> X^A, X u>= X^A --> X s< 0
5132  // X s> X^A, X s>= X^A, X u< X^A, X u<= X^A --> X s>= 0
5133  if (match(A, m_Negative())) {
5134    CmpInst::Predicate NewPred;
5135    switch (ICmpInst::getStrictPredicate(Pred)) {
5136    default:
5137      return nullptr;
5138    case ICmpInst::ICMP_SLT:
5139    case ICmpInst::ICMP_UGT:
5140      NewPred = ICmpInst::ICMP_SLT;
5141      break;
5142    case ICmpInst::ICMP_SGT:
5143    case ICmpInst::ICMP_ULT:
5144      NewPred = ICmpInst::ICMP_SGE;
5145      break;
5146    }
5147    Constant *Const = Constant::getNullValue(Op0->getType());
5148    return new ICmpInst(NewPred, Op0, Const);
5149  }
5150
5151  return nullptr;
5152}
5153
5154/// Return true if X is a multiple of C.
5155/// TODO: Handle non-power-of-2 factors.
5156static bool isMultipleOf(Value *X, const APInt &C, const SimplifyQuery &Q) {
5157 if (C.isOne())
5158 return true;
5159
5160 if (!C.isPowerOf2())
5161 return false;
5162
5163 return MaskedValueIsZero(X, C - 1, Q);
5164}
5165
5166/// Try to fold icmp (binop), X or icmp X, (binop).
5167/// TODO: A large part of this logic is duplicated in InstSimplify's
5168/// simplifyICmpWithBinOp(). We should be able to share that and avoid the code
5169/// duplication.
// NOTE(review): this listing elides some original source lines (gaps in the
// embedded numbering, e.g. 5170/5172 around the signature and 5203/5210 in the
// add+constant folds below); all visible tokens are preserved verbatim.
5171 const SimplifyQuery &SQ) {
5173 Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
5174
5175 // Special logic for binary operators.
5176 BinaryOperator *BO0 = dyn_cast<BinaryOperator>(Op0);
5177 BinaryOperator *BO1 = dyn_cast<BinaryOperator>(Op1);
// Bail out early: every fold below needs at least one side to be a binop.
5178 if (!BO0 && !BO1)
5179 return nullptr;
5180
5181 if (Instruction *NewICmp = foldICmpXNegX(I, Builder))
5182 return NewICmp;
5183
5184 const CmpInst::Predicate Pred = I.getPredicate();
5185 Value *X;
5186
5187 // Convert add-with-unsigned-overflow comparisons into a 'not' with compare.
5188 // (Op1 + X) u</u>= Op1 --> ~Op1 u</u>= X
5189 if (match(Op0, m_OneUse(m_c_Add(m_Specific(Op1), m_Value(X)))) &&
5190 (Pred == ICmpInst::ICMP_ULT || Pred == ICmpInst::ICMP_UGE))
5191 return new ICmpInst(Pred, Builder.CreateNot(Op1), X);
5192 // Op0 u>/u<= (Op0 + X) --> X u>/u<= ~Op0
5193 if (match(Op1, m_OneUse(m_c_Add(m_Specific(Op0), m_Value(X)))) &&
5194 (Pred == ICmpInst::ICMP_UGT || Pred == ICmpInst::ICMP_ULE))
5195 return new ICmpInst(Pred, X, Builder.CreateNot(Op0));
5196
5197 {
5198 // (Op1 + X) + C u</u>= Op1 --> ~C - X u</u>= Op1
5199 Constant *C;
5200 if (match(Op0, m_OneUse(m_Add(m_c_Add(m_Specific(Op1), m_Value(X)),
5201 m_ImmConstant(C)))) &&
5202 (Pred == ICmpInst::ICMP_ULT || Pred == ICmpInst::ICMP_UGE)) {
// NOTE(review): line 5203 (presumably computing C2 = ~C) is elided here.
5204 return new ICmpInst(Pred, Builder.CreateSub(C2, X), Op1);
5205 }
5206 // Op0 u>/u<= (Op0 + X) + C --> Op0 u>/u<= ~C - X
5207 if (match(Op1, m_OneUse(m_Add(m_c_Add(m_Specific(Op0), m_Value(X)),
5208 m_ImmConstant(C)))) &&
5209 (Pred == ICmpInst::ICMP_UGT || Pred == ICmpInst::ICMP_ULE)) {
// NOTE(review): line 5210 (presumably computing C2 = ~C) is elided here.
5211 return new ICmpInst(Pred, Op0, Builder.CreateSub(C2, X));
5212 }
5213 }
5214
5215 // (icmp eq/ne (X, -P2), INT_MIN)
5216 // -> (icmp slt/sge X, INT_MIN + P2)
5217 if (ICmpInst::isEquality(Pred) && BO0 &&
5218 match(I.getOperand(1), m_SignMask()) &&
// NOTE(review): line 5219 (rest of the match condition) is elided here.
5220 // Will Constant fold.
5221 Value *NewC = Builder.CreateSub(I.getOperand(1), BO0->getOperand(1));
5222 return new ICmpInst(Pred == ICmpInst::ICMP_EQ ? ICmpInst::ICMP_SLT
5224 BO0->getOperand(0), NewC);
5225 }
5226
5227 {
5228 // Similar to above: an unsigned overflow comparison may use offset + mask:
5229 // ((Op1 + C) & C) u< Op1 --> Op1 != 0
5230 // ((Op1 + C) & C) u>= Op1 --> Op1 == 0
5231 // Op0 u> ((Op0 + C) & C) --> Op0 != 0
5232 // Op0 u<= ((Op0 + C) & C) --> Op0 == 0
5233 BinaryOperator *BO;
5234 const APInt *C;
5235 if ((Pred == ICmpInst::ICMP_ULT || Pred == ICmpInst::ICMP_UGE) &&
5236 match(Op0, m_And(m_BinOp(BO), m_LowBitMask(C))) &&
5238 CmpInst::Predicate NewPred =
5240 Constant *Zero = ConstantInt::getNullValue(Op1->getType());
5241 return new ICmpInst(NewPred, Op1, Zero);
5242 }
5243
5244 if ((Pred == ICmpInst::ICMP_UGT || Pred == ICmpInst::ICMP_ULE) &&
5245 match(Op1, m_And(m_BinOp(BO), m_LowBitMask(C))) &&
5247 CmpInst::Predicate NewPred =
5249 Constant *Zero = ConstantInt::getNullValue(Op1->getType());
5250 return new ICmpInst(NewPred, Op0, Zero);
5251 }
5252 }
5253
5254 bool NoOp0WrapProblem = false, NoOp1WrapProblem = false;
5255 bool Op0HasNUW = false, Op1HasNUW = false;
5256 bool Op0HasNSW = false, Op1HasNSW = false;
5257 // Analyze the case when either Op0 or Op1 is an add instruction.
5258 // Op0 = A + B (or A and B are null); Op1 = C + D (or C and D are null).
// True iff BO's wrap behavior cannot change this comparison: equality preds
// are always fine; unsigned preds need nuw, signed preds need nsw. 'or' is
// treated as an add that never wraps in either sense (both flags set),
// matching the m_AddLike decomposition used just below.
5259 auto hasNoWrapProblem = [](const BinaryOperator &BO, CmpInst::Predicate Pred,
5260 bool &HasNSW, bool &HasNUW) -> bool {
5261 if (isa<OverflowingBinaryOperator>(BO)) {
5262 HasNUW = BO.hasNoUnsignedWrap();
5263 HasNSW = BO.hasNoSignedWrap();
5264 return ICmpInst::isEquality(Pred) ||
5265 (CmpInst::isUnsigned(Pred) && HasNUW) ||
5266 (CmpInst::isSigned(Pred) && HasNSW);
5267 } else if (BO.getOpcode() == Instruction::Or) {
5268 HasNUW = true;
5269 HasNSW = true;
5270 return true;
5271 } else {
5272 return false;
5273 }
5274 };
5275 Value *A = nullptr, *B = nullptr, *C = nullptr, *D = nullptr;
5276
5277 if (BO0) {
5278 match(BO0, m_AddLike(m_Value(A), m_Value(B)));
5279 NoOp0WrapProblem = hasNoWrapProblem(*BO0, Pred, Op0HasNSW, Op0HasNUW);
5280 }
5281 if (BO1) {
5282 match(BO1, m_AddLike(m_Value(C), m_Value(D)));
5283 NoOp1WrapProblem = hasNoWrapProblem(*BO1, Pred, Op1HasNSW, Op1HasNUW);
5284 }
5285
5286 // icmp (A+B), A -> icmp B, 0 for equalities or if there is no overflow.
5287 // icmp (A+B), B -> icmp A, 0 for equalities or if there is no overflow.
5288 if ((A == Op1 || B == Op1) && NoOp0WrapProblem)
5289 return new ICmpInst(Pred, A == Op1 ? B : A,
5290 Constant::getNullValue(Op1->getType()));
5291
5292 // icmp C, (C+D) -> icmp 0, D for equalities or if there is no overflow.
5293 // icmp D, (C+D) -> icmp 0, C for equalities or if there is no overflow.
5294 if ((C == Op0 || D == Op0) && NoOp1WrapProblem)
5295 return new ICmpInst(Pred, Constant::getNullValue(Op0->getType()),
5296 C == Op0 ? D : C);
5297
5298 // icmp (A+B), (A+D) -> icmp B, D for equalities or if there is no overflow.
5299 if (A && C && (A == C || A == D || B == C || B == D) && NoOp0WrapProblem &&
5300 NoOp1WrapProblem) {
5301 // Determine Y and Z in the form icmp (X+Y), (X+Z).
5302 Value *Y, *Z;
5303 if (A == C) {
5304 // C + B == C + D -> B == D
5305 Y = B;
5306 Z = D;
5307 } else if (A == D) {
5308 // D + B == C + D -> B == C
5309 Y = B;
5310 Z = C;
5311 } else if (B == C) {
5312 // A + C == C + D -> A == D
5313 Y = A;
5314 Z = D;
5315 } else {
5316 assert(B == D);
5317 // A + D == C + D -> A == C
5318 Y = A;
5319 Z = C;
5320 }
5321 return new ICmpInst(Pred, Y, Z);
5322 }
5323
5324 if (ICmpInst::isRelational(Pred)) {
5325 // Return if both X and Y is divisible by Z/-Z.
5326 // TODO: Generalize to check if (X - Y) is divisible by Z/-Z.
5327 auto ShareCommonDivisor = [&Q](Value *X, Value *Y, Value *Z,
5328 bool IsNegative) -> bool {
5329 const APInt *OffsetC;
5330 if (!match(Z, m_APInt(OffsetC)))
5331 return false;
5332
5333 // Fast path for Z == 1/-1.
5334 if (IsNegative ? OffsetC->isAllOnes() : OffsetC->isOne())
5335 return true;
5336
5337 APInt C = *OffsetC;
5338 if (IsNegative)
5339 C.negate();
5340 // Note: -INT_MIN is also negative.
5341 if (!C.isStrictlyPositive())
5342 return false;
5343
5344 return isMultipleOf(X, C, Q) && isMultipleOf(Y, C, Q);
5345 };
5346
5347 // TODO: The subtraction-related identities shown below also hold, but
5348 // canonicalization from (X -nuw 1) to (X + -1) means that the combinations
5349 // wouldn't happen even if they were implemented.
5350 //
5351 // icmp ult (A - 1), Op1 -> icmp ule A, Op1
5352 // icmp uge (A - 1), Op1 -> icmp ugt A, Op1
5353 // icmp ugt Op0, (C - 1) -> icmp uge Op0, C
5354 // icmp ule Op0, (C - 1) -> icmp ult Op0, C
5355
5356 // icmp slt (A + -1), Op1 -> icmp sle A, Op1
5357 // icmp sge (A + -1), Op1 -> icmp sgt A, Op1
5358 // icmp sle (A + 1), Op1 -> icmp slt A, Op1
5359 // icmp sgt (A + 1), Op1 -> icmp sge A, Op1
5360 // icmp ule (A + 1), Op0 -> icmp ult A, Op1
5361 // icmp ugt (A + 1), Op0 -> icmp uge A, Op1
5362 if (A && NoOp0WrapProblem &&
5363 ShareCommonDivisor(A, Op1, B,
5364 ICmpInst::isLT(Pred) || ICmpInst::isGE(Pred)))
// NOTE(review): line 5365 (the `return new ICmpInst(...)` head) is elided.
5366 Op1);
5367
5368 // icmp sgt Op0, (C + -1) -> icmp sge Op0, C
5369 // icmp sle Op0, (C + -1) -> icmp slt Op0, C
5370 // icmp sge Op0, (C + 1) -> icmp sgt Op0, C
5371 // icmp slt Op0, (C + 1) -> icmp sle Op0, C
5372 // icmp uge Op0, (C + 1) -> icmp ugt Op0, C
5373 // icmp ult Op0, (C + 1) -> icmp ule Op0, C
5374 if (C && NoOp1WrapProblem &&
5375 ShareCommonDivisor(Op0, C, D,
5376 ICmpInst::isGT(Pred) || ICmpInst::isLE(Pred)))
// NOTE(review): line 5377 (the `return new ICmpInst(...)` head) is elided.
5378 C);
5379 }
5380
5381 // if C1 has greater magnitude than C2:
5382 // icmp (A + C1), (C + C2) -> icmp (A + C3), C
5383 // s.t. C3 = C1 - C2
5384 //
5385 // if C2 has greater magnitude than C1:
5386 // icmp (A + C1), (C + C2) -> icmp A, (C + C3)
5387 // s.t. C3 = C2 - C1
5388 if (A && C && NoOp0WrapProblem && NoOp1WrapProblem &&
5389 (BO0->hasOneUse() || BO1->hasOneUse()) && !I.isUnsigned()) {
5390 const APInt *AP1, *AP2;
5391 // TODO: Support non-uniform vectors.
5392 // TODO: Allow poison passthrough if B or D's element is poison.
5393 if (match(B, m_APIntAllowPoison(AP1)) &&
5394 match(D, m_APIntAllowPoison(AP2)) &&
5395 AP1->isNegative() == AP2->isNegative()) {
5396 APInt AP1Abs = AP1->abs();
5397 APInt AP2Abs = AP2->abs();
5398 if (AP1Abs.uge(AP2Abs)) {
5399 APInt Diff = *AP1 - *AP2;
5400 Constant *C3 = Constant::getIntegerValue(BO0->getType(), Diff);
5401 Value *NewAdd = Builder.CreateAdd(
5402 A, C3, "", Op0HasNUW && Diff.ule(*AP1), Op0HasNSW);
5403 return new ICmpInst(Pred, NewAdd, C);
5404 } else {
5405 APInt Diff = *AP2 - *AP1;
5406 Constant *C3 = Constant::getIntegerValue(BO0->getType(), Diff);
5407 Value *NewAdd = Builder.CreateAdd(
5408 C, C3, "", Op1HasNUW && Diff.ule(*AP2), Op1HasNSW);
5409 return new ICmpInst(Pred, A, NewAdd);
5410 }
5411 }
5412 Constant *Cst1, *Cst2;
5413 if (match(B, m_ImmConstant(Cst1)) && match(D, m_ImmConstant(Cst2)) &&
5414 ICmpInst::isEquality(Pred)) {
5415 Constant *Diff = ConstantExpr::getSub(Cst2, Cst1);
5416 Value *NewAdd = Builder.CreateAdd(C, Diff);
5417 return new ICmpInst(Pred, A, NewAdd);
5418 }
5419 }
5420
5421 // Analyze the case when either Op0 or Op1 is a sub instruction.
5422 // Op0 = A - B (or A and B are null); Op1 = C - D (or C and D are null).
5423 A = nullptr;
5424 B = nullptr;
5425 C = nullptr;
5426 D = nullptr;
5427 if (BO0 && BO0->getOpcode() == Instruction::Sub) {
5428 A = BO0->getOperand(0);
5429 B = BO0->getOperand(1);
5430 }
5431 if (BO1 && BO1->getOpcode() == Instruction::Sub) {
5432 C = BO1->getOperand(0);
5433 D = BO1->getOperand(1);
5434 }
5435
5436 // icmp (A-B), A -> icmp 0, B for equalities or if there is no overflow.
5437 if (A == Op1 && NoOp0WrapProblem)
5438 return new ICmpInst(Pred, Constant::getNullValue(Op1->getType()), B);
5439 // icmp C, (C-D) -> icmp D, 0 for equalities or if there is no overflow.
5440 if (C == Op0 && NoOp1WrapProblem)
5441 return new ICmpInst(Pred, D, Constant::getNullValue(Op0->getType()));
5442
5443 // Convert sub-with-unsigned-overflow comparisons into a comparison of args.
5444 // (A - B) u>/u<= A --> B u>/u<= A
5445 if (A == Op1 && (Pred == ICmpInst::ICMP_UGT || Pred == ICmpInst::ICMP_ULE))
5446 return new ICmpInst(Pred, B, A);
5447 // C u</u>= (C - D) --> C u</u>= D
5448 if (C == Op0 && (Pred == ICmpInst::ICMP_ULT || Pred == ICmpInst::ICMP_UGE))
5449 return new ICmpInst(Pred, C, D);
5450 // (A - B) u>=/u< A --> B u>/u<= A iff B != 0
5451 if (A == Op1 && (Pred == ICmpInst::ICMP_UGE || Pred == ICmpInst::ICMP_ULT) &&
5452 isKnownNonZero(B, Q))
// NOTE(review): line 5453 (the return for this fold) is elided here.
5454 // C u<=/u> (C - D) --> C u</u>= D iff B != 0
5455 if (C == Op0 && (Pred == ICmpInst::ICMP_ULE || Pred == ICmpInst::ICMP_UGT) &&
5456 isKnownNonZero(D, Q))
// NOTE(review): line 5457 (the return for this fold) is elided here.
5458
5459 // icmp (A-B), (C-B) -> icmp A, C for equalities or if there is no overflow.
5460 if (B && D && B == D && NoOp0WrapProblem && NoOp1WrapProblem)
5461 return new ICmpInst(Pred, A, C);
5462
5463 // icmp (A-B), (A-D) -> icmp D, B for equalities or if there is no overflow.
5464 if (A && C && A == C && NoOp0WrapProblem && NoOp1WrapProblem)
5465 return new ICmpInst(Pred, D, B);
5466
5467 // icmp (0-X) < cst --> x > -cst
5468 if (NoOp0WrapProblem && ICmpInst::isSigned(Pred)) {
5469 Value *X;
5470 if (match(BO0, m_Neg(m_Value(X))))
5471 if (Constant *RHSC = dyn_cast<Constant>(Op1))
5472 if (RHSC->isNotMinSignedValue())
5473 return new ICmpInst(I.getSwappedPredicate(), X,
5474 ConstantExpr::getNeg(RHSC));
5475 }
5476
5477 if (Instruction *R = foldICmpXorXX(I, Q, *this))
5478 return R;
5479 if (Instruction *R = foldICmpOrXX(I, Q, *this))
5480 return R;
5481
5482 {
5483 // Try to remove shared multiplier from comparison:
5484 // X * Z pred Y * Z
5485 Value *X, *Y, *Z;
5486 if ((match(Op0, m_Mul(m_Value(X), m_Value(Z))) &&
5487 match(Op1, m_c_Mul(m_Specific(Z), m_Value(Y)))) ||
5488 (match(Op0, m_Mul(m_Value(Z), m_Value(X))) &&
5489 match(Op1, m_c_Mul(m_Specific(Z), m_Value(Y))))) {
5490 if (ICmpInst::isSigned(Pred)) {
5491 if (Op0HasNSW && Op1HasNSW) {
5492 KnownBits ZKnown = computeKnownBits(Z, &I);
5493 if (ZKnown.isStrictlyPositive())
5494 return new ICmpInst(Pred, X, Y);
5495 if (ZKnown.isNegative())
5496 return new ICmpInst(ICmpInst::getSwappedPredicate(Pred), X, Y);
// NOTE(review): lines 5497-5498 (computing `LessThan` via
// simplifyICmpInst, by analogy with `GreaterThan` below) are elided.
5499 if (LessThan && match(LessThan, m_One()))
5500 return new ICmpInst(ICmpInst::getSwappedPredicate(Pred), Z,
5501 Constant::getNullValue(Z->getType()));
5502 Value *GreaterThan = simplifyICmpInst(ICmpInst::ICMP_SGT, X, Y,
5504 if (GreaterThan && match(GreaterThan, m_One()))
5505 return new ICmpInst(Pred, Z, Constant::getNullValue(Z->getType()));
5506 }
5507 } else {
5508 bool NonZero;
5509 if (ICmpInst::isEquality(Pred)) {
5510 // If X != Y, fold (X *nw Z) eq/ne (Y *nw Z) -> Z eq/ne 0
5511 if (((Op0HasNSW && Op1HasNSW) || (Op0HasNUW && Op1HasNUW)) &&
5512 isKnownNonEqual(X, Y, SQ))
5513 return new ICmpInst(Pred, Z, Constant::getNullValue(Z->getType()));
5514
5515 KnownBits ZKnown = computeKnownBits(Z, &I);
5516 // if Z % 2 != 0
5517 // X * Z eq/ne Y * Z -> X eq/ne Y
5518 if (ZKnown.countMaxTrailingZeros() == 0)
5519 return new ICmpInst(Pred, X, Y);
5520 NonZero = !ZKnown.One.isZero() || isKnownNonZero(Z, Q);
5521 // if Z != 0 and nsw(X * Z) and nsw(Y * Z)
5522 // X * Z eq/ne Y * Z -> X eq/ne Y
5523 if (NonZero && BO0 && BO1 && Op0HasNSW && Op1HasNSW)
5524 return new ICmpInst(Pred, X, Y);
5525 } else
5526 NonZero = isKnownNonZero(Z, Q);
5527
5528 // If Z != 0 and nuw(X * Z) and nuw(Y * Z)
5529 // X * Z u{lt/le/gt/ge}/eq/ne Y * Z -> X u{lt/le/gt/ge}/eq/ne Y
5530 if (NonZero && BO0 && BO1 && Op0HasNUW && Op1HasNUW)
5531 return new ICmpInst(Pred, X, Y);
5532 }
5533 }
5534 }
5535
// Fold comparisons of an srem result against the srem's own divisor.
5536 BinaryOperator *SRem = nullptr;
5537 // icmp (srem X, Y), Y
5538 if (BO0 && BO0->getOpcode() == Instruction::SRem && Op1 == BO0->getOperand(1))
5539 SRem = BO0;
5540 // icmp Y, (srem X, Y)
5541 else if (BO1 && BO1->getOpcode() == Instruction::SRem &&
5542 Op0 == BO1->getOperand(1))
5543 SRem = BO1;
5544 if (SRem) {
5545 // We don't check hasOneUse to avoid increasing register pressure because
5546 // the value we use is the same value this instruction was already using.
5547 switch (SRem == BO0 ? ICmpInst::getSwappedPredicate(Pred) : Pred) {
5548 default:
5549 break;
5550 case ICmpInst::ICMP_EQ:
5551 return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
5552 case ICmpInst::ICMP_NE:
5553 return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));
5554 case ICmpInst::ICMP_SGT:
5555 case ICmpInst::ICMP_SGE:
5556 return new ICmpInst(ICmpInst::ICMP_SGT, SRem->getOperand(1),
5558 case ICmpInst::ICMP_SLT:
5559 case ICmpInst::ICMP_SLE:
5560 return new ICmpInst(ICmpInst::ICMP_SLT, SRem->getOperand(1),
5562 }
5563 }
5564
// Both sides are the same binop kind with an identical RHS operand: try to
// strip the shared operation and compare the LHS operands directly.
5565 if (BO0 && BO1 && BO0->getOpcode() == BO1->getOpcode() &&
5566 (BO0->hasOneUse() || BO1->hasOneUse()) &&
5567 BO0->getOperand(1) == BO1->getOperand(1)) {
5568 switch (BO0->getOpcode()) {
5569 default:
5570 break;
5571 case Instruction::Add:
5572 case Instruction::Sub:
5573 case Instruction::Xor: {
5574 if (I.isEquality()) // a+x icmp eq/ne b+x --> a icmp b
5575 return new ICmpInst(Pred, BO0->getOperand(0), BO1->getOperand(0));
5576
5577 const APInt *C;
5578 if (match(BO0->getOperand(1), m_APInt(C))) {
5579 // icmp u/s (a ^ signmask), (b ^ signmask) --> icmp s/u a, b
5580 if (C->isSignMask()) {
5581 ICmpInst::Predicate NewPred = I.getFlippedSignednessPredicate();
5582 return new ICmpInst(NewPred, BO0->getOperand(0), BO1->getOperand(0));
5583 }
5584
5585 // icmp u/s (a ^ maxsignval), (b ^ maxsignval) --> icmp s/u' a, b
5586 if (BO0->getOpcode() == Instruction::Xor && C->isMaxSignedValue()) {
5587 ICmpInst::Predicate NewPred = I.getFlippedSignednessPredicate();
5588 NewPred = I.getSwappedPredicate(NewPred);
5589 return new ICmpInst(NewPred, BO0->getOperand(0), BO1->getOperand(0));
5590 }
5591 }
5592 break;
5593 }
5594 case Instruction::Mul: {
5595 if (!I.isEquality())
5596 break;
5597
5598 const APInt *C;
5599 if (match(BO0->getOperand(1), m_APInt(C)) && !C->isZero() &&
5600 !C->isOne()) {
5601 // icmp eq/ne (X * C), (Y * C) --> icmp (X & Mask), (Y & Mask)
5602 // Mask = -1 >> count-trailing-zeros(C).
5603 if (unsigned TZs = C->countr_zero()) {
5604 Constant *Mask = ConstantInt::get(
5605 BO0->getType(),
5606 APInt::getLowBitsSet(C->getBitWidth(), C->getBitWidth() - TZs));
5607 Value *And1 = Builder.CreateAnd(BO0->getOperand(0), Mask);
5608 Value *And2 = Builder.CreateAnd(BO1->getOperand(0), Mask);
5609 return new ICmpInst(Pred, And1, And2);
5610 }
5611 }
5612 break;
5613 }
5614 case Instruction::UDiv:
5615 case Instruction::LShr:
5616 if (I.isSigned() || !BO0->isExact() || !BO1->isExact())
5617 break;
5618 return new ICmpInst(Pred, BO0->getOperand(0), BO1->getOperand(0));
5619
5620 case Instruction::SDiv:
5621 if (!(I.isEquality() || match(BO0->getOperand(1), m_NonNegative())) ||
5622 !BO0->isExact() || !BO1->isExact())
5623 break;
5624 return new ICmpInst(Pred, BO0->getOperand(0), BO1->getOperand(0));
5625
5626 case Instruction::AShr:
5627 if (!BO0->isExact() || !BO1->isExact())
5628 break;
5629 return new ICmpInst(Pred, BO0->getOperand(0), BO1->getOperand(0));
5630
5631 case Instruction::Shl: {
5632 bool NUW = Op0HasNUW && Op1HasNUW;
5633 bool NSW = Op0HasNSW && Op1HasNSW;
5634 if (!NUW && !NSW)
5635 break;
5636 if (!NSW && I.isSigned())
5637 break;
5638 return new ICmpInst(Pred, BO0->getOperand(0), BO1->getOperand(0));
5639 }
5640 }
5641 }
5642
5643 if (BO0) {
5644 // Transform A & (L - 1) `ult` L --> L != 0
5645 auto LSubOne = m_Add(m_Specific(Op1), m_AllOnes());
5646 auto BitwiseAnd = m_c_And(m_Value(), LSubOne);
5647
5648 if (match(BO0, BitwiseAnd) && Pred == ICmpInst::ICMP_ULT) {
5649 auto *Zero = Constant::getNullValue(BO0->getType());
5650 return new ICmpInst(ICmpInst::ICMP_NE, Op1, Zero);
5651 }
5652 }
5653
5654 // For unsigned predicates / eq / ne:
5655 // icmp pred (x << 1), x --> icmp getSignedPredicate(pred) x, 0
5656 // icmp pred x, (x << 1) --> icmp getSignedPredicate(pred) 0, x
5657 if (!ICmpInst::isSigned(Pred)) {
5658 if (match(Op0, m_Shl(m_Specific(Op1), m_One())))
5659 return new ICmpInst(ICmpInst::getSignedPredicate(Pred), Op1,
5660 Constant::getNullValue(Op1->getType()));
5661 else if (match(Op1, m_Shl(m_Specific(Op0), m_One())))
5662 return new ICmpInst(ICmpInst::getSignedPredicate(Pred),
5663 Constant::getNullValue(Op0->getType()), Op0);
5664 }
5665
// NOTE(review): lines 5666/5672/5675 (the `if (Value *V = ...)` heads for the
// three trailing simplification attempts) are elided from this listing.
5667 return replaceInstUsesWith(I, V);
5668
5669 if (Instruction *R = foldICmpAndXX(I, Q, *this))
5670 return R;
5671
5673 return replaceInstUsesWith(I, V);
5674
5676 return replaceInstUsesWith(I, V);
5677
5678 return nullptr;
5679}
5680
5681/// Fold icmp Pred min|max(X, Y), Z.
/// Decides the fold by asking InstSimplify how each intrinsic operand (X, Y)
/// compares against Z, then reasoning case-by-case per the truth tables below.
/// NOTE(review): this listing elides some original lines (e.g. 5682-5683 of
/// the signature and 5693-5695 inside the signedness-revert branch); visible
/// tokens are preserved verbatim.
5684 Value *Z, CmpPredicate Pred) {
5685 Value *X = MinMax->getLHS();
5686 Value *Y = MinMax->getRHS();
// A signed predicate against an unsigned min/max (or vice versa, below)
// cannot be reasoned about operand-wise; bail out.
5687 if (ICmpInst::isSigned(Pred) && !MinMax->isSigned())
5688 return nullptr;
5689 if (ICmpInst::isUnsigned(Pred) && MinMax->isSigned()) {
5690 // Revert the transform signed pred -> unsigned pred
5691 // TODO: We can flip the signedness of predicate if both operands of icmp
5692 // are negative.
5696 } else
5697 return nullptr;
5698 }
// Tri-state view of a simplification result: true/false when it folded to a
// constant i1, nullopt when unknown (or when simplification failed).
5700 auto IsCondKnownTrue = [](Value *Val) -> std::optional<bool> {
5701 if (!Val)
5702 return std::nullopt;
5703 if (match(Val, m_One()))
5704 return true;
5705 if (match(Val, m_Zero()))
5706 return false;
5707 return std::nullopt;
5708 };
5709 // Remove samesign here since it is illegal to keep it when we speculatively
5710 // execute comparisons. For example, `icmp samesign ult umax(X, -46), -32`
5711 // cannot be decomposed into `(icmp samesign ult X, -46) or (icmp samesign ult
5712 // -46, -32)`. `X` is allowed to be non-negative here.
5713 Pred = Pred.dropSameSign();
5714 auto CmpXZ = IsCondKnownTrue(simplifyICmpInst(Pred, X, Z, Q));
5715 auto CmpYZ = IsCondKnownTrue(simplifyICmpInst(Pred, Y, Z, Q));
5716 if (!CmpXZ.has_value() && !CmpYZ.has_value())
5717 return nullptr;
// Canonicalize so that the side with a known comparison result is (X, CmpXZ).
5718 if (!CmpXZ.has_value()) {
5719 std::swap(X, Y);
5720 std::swap(CmpXZ, CmpYZ);
5721 }
5722
// Replace with the Y-vs-Z comparison, folding it to a constant when its
// result is already known.
5723 auto FoldIntoCmpYZ = [&]() -> Instruction * {
5724 if (CmpYZ.has_value())
5725 return replaceInstUsesWith(I, ConstantInt::getBool(I.getType(), *CmpYZ));
5726 return ICmpInst::Create(Instruction::ICmp, Pred, Y, Z);
5727 };
5728
5729 switch (Pred) {
5730 case ICmpInst::ICMP_EQ:
5731 case ICmpInst::ICMP_NE: {
5732 // If X == Z:
5733 // Expr Result
5734 // min(X, Y) == Z X <= Y
5735 // max(X, Y) == Z X >= Y
5736 // min(X, Y) != Z X > Y
5737 // max(X, Y) != Z X < Y
5738 if ((Pred == ICmpInst::ICMP_EQ) == *CmpXZ) {
5739 ICmpInst::Predicate NewPred =
5740 ICmpInst::getNonStrictPredicate(MinMax->getPredicate());
5741 if (Pred == ICmpInst::ICMP_NE)
5742 NewPred = ICmpInst::getInversePredicate(NewPred);
5743 return ICmpInst::Create(Instruction::ICmp, NewPred, X, Y);
5744 }
5745 // Otherwise (X != Z):
5746 ICmpInst::Predicate NewPred = MinMax->getPredicate();
5747 auto MinMaxCmpXZ = IsCondKnownTrue(simplifyICmpInst(NewPred, X, Z, Q));
5748 if (!MinMaxCmpXZ.has_value()) {
5749 std::swap(X, Y);
5750 std::swap(CmpXZ, CmpYZ);
5751 // Re-check pre-condition X != Z
5752 if (!CmpXZ.has_value() || (Pred == ICmpInst::ICMP_EQ) == *CmpXZ)
5753 break;
5754 MinMaxCmpXZ = IsCondKnownTrue(simplifyICmpInst(NewPred, X, Z, Q));
5755 }
5756 if (!MinMaxCmpXZ.has_value())
5757 break;
5758 if (*MinMaxCmpXZ) {
5759 // Expr Fact Result
5760 // min(X, Y) == Z X < Z false
5761 // max(X, Y) == Z X > Z false
5762 // min(X, Y) != Z X < Z true
5763 // max(X, Y) != Z X > Z true
5764 return replaceInstUsesWith(
5765 I, ConstantInt::getBool(I.getType(), Pred == ICmpInst::ICMP_NE));
5766 } else {
5767 // Expr Fact Result
5768 // min(X, Y) == Z X > Z Y == Z
5769 // max(X, Y) == Z X < Z Y == Z
5770 // min(X, Y) != Z X > Z Y != Z
5771 // max(X, Y) != Z X < Z Y != Z
5772 return FoldIntoCmpYZ();
5773 }
5774 break;
5775 }
5776 case ICmpInst::ICMP_SLT:
5777 case ICmpInst::ICMP_ULT:
5778 case ICmpInst::ICMP_SLE:
5779 case ICmpInst::ICMP_ULE:
5780 case ICmpInst::ICMP_SGT:
5781 case ICmpInst::ICMP_UGT:
5782 case ICmpInst::ICMP_SGE:
5783 case ICmpInst::ICMP_UGE: {
// IsSame: the icmp "points the same direction" as the min/max itself
// (e.g. ult/ule against a umin), which decides which table applies.
5784 bool IsSame = MinMax->getPredicate() == ICmpInst::getStrictPredicate(Pred);
5785 if (*CmpXZ) {
5786 if (IsSame) {
5787 // Expr Fact Result
5788 // min(X, Y) < Z X < Z true
5789 // min(X, Y) <= Z X <= Z true
5790 // max(X, Y) > Z X > Z true
5791 // max(X, Y) >= Z X >= Z true
5792 return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));
5793 } else {
5794 // Expr Fact Result
5795 // max(X, Y) < Z X < Z Y < Z
5796 // max(X, Y) <= Z X <= Z Y <= Z
5797 // min(X, Y) > Z X > Z Y > Z
5798 // min(X, Y) >= Z X >= Z Y >= Z
5799 return FoldIntoCmpYZ();
5800 }
5801 } else {
5802 if (IsSame) {
5803 // Expr Fact Result
5804 // min(X, Y) < Z X >= Z Y < Z
5805 // min(X, Y) <= Z X > Z Y <= Z
5806 // max(X, Y) > Z X <= Z Y > Z
5807 // max(X, Y) >= Z X < Z Y >= Z
5808 return FoldIntoCmpYZ();
5809 } else {
5810 // Expr Fact Result
5811 // max(X, Y) < Z X >= Z false
5812 // max(X, Y) <= Z X > Z false
5813 // min(X, Y) > Z X <= Z false
5814 // min(X, Y) >= Z X < Z false
5815 return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
5816 }
5817 }
5818 break;
5819 }
5820 default:
5821 break;
5822 }
5823
5824 return nullptr;
5825}
5826
5827// Canonicalize checking for a power-of-2-or-zero value:
// Patterns like (A & (A-1)) == 0 and (A ^ (A-1)) u>= A become
// ctpop(A) u< 2 ("power of 2 or zero"); the inverted forms become
// ctpop(A) u> 1 ("has more than one bit set").
// NOTE(review): this listing elides several original lines (numbering gaps,
// e.g. 5828 signature and matcher lines 5847/5856/5861); visible tokens are
// preserved verbatim.
5829 InstCombiner::BuilderTy &Builder) {
5830 Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
5831 const CmpInst::Predicate Pred = I.getPredicate();
// A: the value whose popcount is tested; stays null if no pattern matches.
5832 Value *A = nullptr;
// CheckIs: true -> emit ctpop(A) u< 2; false -> emit ctpop(A) u> 1.
5833 bool CheckIs;
5834 if (I.isEquality()) {
5835 // (A & (A-1)) == 0 --> ctpop(A) < 2 (two commuted variants)
5836 // ((A-1) & A) != 0 --> ctpop(A) > 1 (two commuted variants)
5837 if (!match(Op0, m_OneUse(m_c_And(m_Add(m_Value(A), m_AllOnes()),
5838 m_Deferred(A)))) ||
5839 !match(Op1, m_ZeroInt()))
5840 A = nullptr;
5841
5842 // (A & -A) == A --> ctpop(A) < 2 (four commuted variants)
5843 // (-A & A) != A --> ctpop(A) > 1 (four commuted variants)
5844 if (match(Op0, m_OneUse(m_c_And(m_Neg(m_Specific(Op1)), m_Specific(Op1)))))
5845 A = Op1;
5846 else if (match(Op1,
5848 A = Op0;
5849
5850 CheckIs = Pred == ICmpInst::ICMP_EQ;
5851 } else if (ICmpInst::isUnsigned(Pred)) {
5852 // (A ^ (A-1)) u>= A --> ctpop(A) < 2 (two commuted variants)
5853 // ((A-1) ^ A) u< A --> ctpop(A) > 1 (two commuted variants)
5854
5855 if ((Pred == ICmpInst::ICMP_UGE || Pred == ICmpInst::ICMP_ULT) &&
5857 m_Specific(Op1))))) {
5858 A = Op1;
5859 CheckIs = Pred == ICmpInst::ICMP_UGE;
5860 } else if ((Pred == ICmpInst::ICMP_UGT || Pred == ICmpInst::ICMP_ULE) &&
5862 m_Specific(Op0))))) {
5863 A = Op0;
5864 CheckIs = Pred == ICmpInst::ICMP_ULE;
5865 }
5866 }
5867
5868 if (A) {
5869 Type *Ty = A->getType();
5870 CallInst *CtPop = Builder.CreateUnaryIntrinsic(Intrinsic::ctpop, A);
5871 return CheckIs ? new ICmpInst(ICmpInst::ICMP_ULT, CtPop,
5872 ConstantInt::get(Ty, 2))
5873 : new ICmpInst(ICmpInst::ICMP_UGT, CtPop,
5874 ConstantInt::get(Ty, 1));
5875 }
5876
5877 return nullptr;
5878}
5879
5880/// Find all possible pairs (BinOp, RHS) that BinOp V, RHS can be simplified.
/// Appends candidate (opcode, operand) pairs that would cancel part of V:
/// adds yield subtractions of either operand, subs yield an add of the RHS,
/// xors yield xors of either operand. Only single-use instructions are
/// considered, and select arms are explored exactly one level deep
/// (AllowRecursion is passed as false on the recursive calls).
/// NOTE(review): the function's signature line (original 5882) is elided
/// from this listing; visible tokens are preserved verbatim.
5881using OffsetOp = std::pair<Instruction::BinaryOps, Value *>;
5883 bool AllowRecursion) {
5884 Instruction *Inst = dyn_cast<Instruction>(V);
5885 if (!Inst || !Inst->hasOneUse())
5886 return;
5887
5888 switch (Inst->getOpcode()) {
5889 case Instruction::Add:
5890 Offsets.emplace_back(Instruction::Sub, Inst->getOperand(1));
5891 Offsets.emplace_back(Instruction::Sub, Inst->getOperand(0));
5892 break;
5893 case Instruction::Sub:
5894 Offsets.emplace_back(Instruction::Add, Inst->getOperand(1));
5895 break;
5896 case Instruction::Xor:
5897 Offsets.emplace_back(Instruction::Xor, Inst->getOperand(1));
5898 Offsets.emplace_back(Instruction::Xor, Inst->getOperand(0));
5899 break;
5900 case Instruction::Select:
5901 if (AllowRecursion) {
5902 collectOffsetOp(Inst->getOperand(1), Offsets, /*AllowRecursion=*/false);
5903 collectOffsetOp(Inst->getOperand(2), Offsets, /*AllowRecursion=*/false);
5904 }
5905 break;
5906 default:
5907 break;
5908 }
5909}
5910
5912
// Result of offsetting one side of an equality icmp: either nothing
// (Invalid), a plain value (Value kind, stored in V0), or a select whose
// condition/true-arm/false-arm are V0/V1/V2 (Select kind).
// NOTE(review): the enum and struct header lines (original ~5910-5914,
// including the OffsetKind declaration and the Kind member) plus the
// invalid()/value()/materialize() signature lines (5917, 5920, 5927) are
// elided from this listing; visible tokens are preserved verbatim.
5915 Value *V0, *V1, *V2;
5916
5918 return {OffsetKind::Invalid, nullptr, nullptr, nullptr};
5919 }
5921 return {OffsetKind::Value, V, nullptr, nullptr};
5922 }
5923 static OffsetResult select(Value *Cond, Value *TrueV, Value *FalseV) {
5924 return {OffsetKind::Select, Cond, TrueV, FalseV};
5925 }
5926 bool isValid() const { return Kind != OffsetKind::Invalid; }
// materialize(): emit the IR for this result (a CreateSelect for the Select
// kind, the stored value otherwise) — header line 5927 elided above.
5928 switch (Kind) {
5929 case OffsetKind::Invalid:
5930 llvm_unreachable("Invalid offset result");
5931 case OffsetKind::Value:
5932 return V0;
5933 case OffsetKind::Select:
5934 return Builder.CreateSelect(V0, V1, V2);
5935 }
5936 llvm_unreachable("Unknown OffsetKind enum");
5937 }
5938};
5939
5940/// Offset both sides of an equality icmp to see if we can save some
5941/// instructions: icmp eq/ne X, Y -> icmp eq/ne X op Z, Y op Z.
5942/// Note: This operation should not introduce poison.
/// NOTE(review): the function's signature line (original 5943) is elided
/// from this listing; visible tokens are preserved verbatim.
5944 InstCombiner::BuilderTy &Builder,
5945 const SimplifyQuery &SQ) {
5946 assert(I.isEquality() && "Expected an equality icmp");
5947 Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
5948 if (!Op0->getType()->isIntOrIntVectorTy())
5949 return nullptr;
5950
// Gather candidate (opcode, RHS) offsets that could cancel part of either
// side (see collectOffsetOp above).
5951 SmallVector<OffsetOp, 4> OffsetOps;
5952 collectOffsetOp(Op0, OffsetOps, /*AllowRecursion=*/true);
5953 collectOffsetOp(Op1, OffsetOps, /*AllowRecursion=*/true);
5954
// Apply one offset to a single value; returns null unless the offsetted
// form strictly simplifies without introducing poison.
5955 auto ApplyOffsetImpl = [&](Value *V, unsigned BinOpc, Value *RHS) -> Value * {
5956 Value *Simplified = simplifyBinOp(BinOpc, V, RHS, SQ);
5957 // Avoid infinite loops by checking if RHS is an identity for the BinOp.
5958 if (!Simplified || Simplified == V)
5959 return nullptr;
5960 // Reject constant expressions as they don't simplify things.
5961 if (isa<Constant>(Simplified) && !match(Simplified, m_ImmConstant()))
5962 return nullptr;
5963 // Check if the transformation introduces poison.
5964 return impliesPoison(RHS, V) ? Simplified : nullptr;
5965 };
5966
// Like ApplyOffsetImpl, but distributes over a single-use select: both arms
// must simplify or the whole attempt is invalid.
5967 auto ApplyOffset = [&](Value *V, unsigned BinOpc,
5968 Value *RHS) -> OffsetResult {
5969 if (auto *Sel = dyn_cast<SelectInst>(V)) {
5970 if (!Sel->hasOneUse())
5971 return OffsetResult::invalid();
5972 Value *TrueVal = ApplyOffsetImpl(Sel->getTrueValue(), BinOpc, RHS);
5973 if (!TrueVal)
5974 return OffsetResult::invalid();
5975 Value *FalseVal = ApplyOffsetImpl(Sel->getFalseValue(), BinOpc, RHS);
5976 if (!FalseVal)
5977 return OffsetResult::invalid();
5978 return OffsetResult::select(Sel->getCondition(), TrueVal, FalseVal);
5979 }
5980 if (Value *Simplified = ApplyOffsetImpl(V, BinOpc, RHS))
5981 return OffsetResult::value(Simplified);
5982 return OffsetResult::invalid();
5983 };
5984
// Try each candidate offset; the first one that simplifies BOTH sides wins.
5985 for (auto [BinOp, RHS] : OffsetOps) {
5986 auto BinOpc = static_cast<unsigned>(BinOp);
5987
5988 auto Op0Result = ApplyOffset(Op0, BinOpc, RHS);
5989 if (!Op0Result.isValid())
5990 continue;
5991 auto Op1Result = ApplyOffset(Op1, BinOpc, RHS);
5992 if (!Op1Result.isValid())
5993 continue;
5994
5995 Value *NewLHS = Op0Result.materialize(Builder);
5996 Value *NewRHS = Op1Result.materialize(Builder);
5997 return new ICmpInst(I.getPredicate(), NewLHS, NewRHS);
5998 }
5999
6000 return nullptr;
6001}
6002
6004 if (!I.isEquality())
6005 return nullptr;
6006
6007 Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
6008 const CmpInst::Predicate Pred = I.getPredicate();
6009 Value *A, *B, *C, *D;
6010 if (match(Op0, m_Xor(m_Value(A), m_Value(B)))) {
6011 if (A == Op1 || B == Op1) { // (A^B) == A -> B == 0
6012 Value *OtherVal = A == Op1 ? B : A;
6013 return new ICmpInst(Pred, OtherVal, Constant::getNullValue(A->getType()));
6014 }
6015
6016 if (match(Op1, m_Xor(m_Value(C), m_Value(D)))) {
6017 // A^c1 == C^c2 --> A == C^(c1^c2)
6018 ConstantInt *C1, *C2;
6019 if (match(B, m_ConstantInt(C1)) && match(D, m_ConstantInt(C2)) &&
6020 Op1->hasOneUse()) {
6021 Constant *NC = Builder.getInt(C1->getValue() ^ C2->getValue());
6023 return new ICmpInst(Pred, A, Xor);
6024 }
6025
6026 // A^B == A^D -> B == D
6027 if (A == C)
6028 return new ICmpInst(Pred, B, D);
6029 if (A == D)
6030 return new ICmpInst(Pred, B, C);
6031 if (B == C)
6032 return new ICmpInst(Pred, A, D);
6033 if (B == D)
6034 return new ICmpInst(Pred, A, C);
6035 }
6036 }
6037
6038 if (match(Op1, m_Xor(m_Value(A), m_Value(B))) && (A == Op0 || B == Op0)) {
6039 // A == (A^B) -> B == 0
6040 Value *OtherVal = A == Op0 ? B : A;
6041 return new ICmpInst(Pred, OtherVal, Constant::getNullValue(A->getType()));
6042 }
6043
6044 // (X&Z) == (Y&Z) -> (X^Y) & Z == 0
6045 if (match(Op0, m_And(m_Value(A), m_Value(B))) &&
6046 match(Op1, m_And(m_Value(C), m_Value(D)))) {
6047 Value *X = nullptr, *Y = nullptr, *Z = nullptr;
6048
6049 if (A == C) {
6050 X = B;
6051 Y = D;
6052 Z = A;
6053 } else if (A == D) {
6054 X = B;
6055 Y = C;
6056 Z = A;
6057 } else if (B == C) {
6058 X = A;
6059 Y = D;
6060 Z = B;
6061 } else if (B == D) {
6062 X = A;
6063 Y = C;
6064 Z = B;
6065 }
6066
6067 if (X) {
6068 // If X^Y is a negative power of two, then `icmp eq/ne (Z & NegP2), 0`
6069 // will fold to `icmp ult/uge Z, -NegP2` incurringb no additional
6070 // instructions.
6071 const APInt *C0, *C1;
6072 bool XorIsNegP2 = match(X, m_APInt(C0)) && match(Y, m_APInt(C1)) &&
6073 (*C0 ^ *C1).isNegatedPowerOf2();
6074
6075 // If either Op0/Op1 are both one use or X^Y will constant fold and one of
6076 // Op0/Op1 are one use, proceed. In those cases we are instruction neutral
6077 // but `icmp eq/ne A, 0` is easier to analyze than `icmp eq/ne A, B`.
6078 int UseCnt =
6079 int(Op0->hasOneUse()) + int(Op1->hasOneUse()) +
6080 (int(match(X, m_ImmConstant()) && match(Y, m_ImmConstant())));
6081 if (XorIsNegP2 || UseCnt >= 2) {
6082 // Build (X^Y) & Z
6083 Op1 = Builder.CreateXor(X, Y);
6084 Op1 = Builder.CreateAnd(Op1, Z);
6085 return new ICmpInst(Pred, Op1, Constant::getNullValue(Op1->getType()));
6086 }
6087 }
6088 }
6089
6090 {
6091 // Similar to above, but specialized for constant because invert is needed:
6092 // (X | C) == (Y | C) --> (X ^ Y) & ~C == 0
6093 Value *X, *Y;
6094 Constant *C;
6095 if (match(Op0, m_OneUse(m_Or(m_Value(X), m_Constant(C)))) &&
6096 match(Op1, m_OneUse(m_Or(m_Value(Y), m_Specific(C))))) {
6099 return new ICmpInst(Pred, And, Constant::getNullValue(And->getType()));
6100 }
6101 }
6102
6103 if (match(Op1, m_ZExt(m_Value(A))) &&
6104 (Op0->hasOneUse() || Op1->hasOneUse())) {
6105 // (B & (Pow2C-1)) == zext A --> A == trunc B
6106 // (B & (Pow2C-1)) != zext A --> A != trunc B
6107 const APInt *MaskC;
6108 if (match(Op0, m_And(m_Value(B), m_LowBitMask(MaskC))) &&
6109 MaskC->countr_one() == A->getType()->getScalarSizeInBits())
6110 return new ICmpInst(Pred, A, Builder.CreateTrunc(B, A->getType()));
6111 }
6112
6113 // (A >> C) == (B >> C) --> (A^B) u< (1 << C)
6114 // For lshr and ashr pairs.
6115 const APInt *AP1, *AP2;
6116 if ((match(Op0, m_OneUse(m_LShr(m_Value(A), m_APIntAllowPoison(AP1)))) &&
6117 match(Op1, m_OneUse(m_LShr(m_Value(B), m_APIntAllowPoison(AP2))))) ||
6118 (match(Op0, m_OneUse(m_AShr(m_Value(A), m_APIntAllowPoison(AP1)))) &&
6119 match(Op1, m_OneUse(m_AShr(m_Value(B), m_APIntAllowPoison(AP2)))))) {
6120 if (*AP1 != *AP2)
6121 return nullptr;
6122 unsigned TypeBits = AP1->getBitWidth();
6123 unsigned ShAmt = AP1->getLimitedValue(TypeBits);
6124 if (ShAmt < TypeBits && ShAmt != 0) {
6125 ICmpInst::Predicate NewPred =
6127 Value *Xor = Builder.CreateXor(A, B, I.getName() + ".unshifted");
6128 APInt CmpVal = APInt::getOneBitSet(TypeBits, ShAmt);
6129 return new ICmpInst(NewPred, Xor, ConstantInt::get(A->getType(), CmpVal));
6130 }
6131 }
6132
6133 // (A << C) == (B << C) --> ((A^B) & (~0U >> C)) == 0
6134 ConstantInt *Cst1;
6135 if (match(Op0, m_OneUse(m_Shl(m_Value(A), m_ConstantInt(Cst1)))) &&
6136 match(Op1, m_OneUse(m_Shl(m_Value(B), m_Specific(Cst1))))) {
6137 unsigned TypeBits = Cst1->getBitWidth();
6138 unsigned ShAmt = (unsigned)Cst1->getLimitedValue(TypeBits);
6139 if (ShAmt < TypeBits && ShAmt != 0) {
6140 Value *Xor = Builder.CreateXor(A, B, I.getName() + ".unshifted");
6141 APInt AndVal = APInt::getLowBitsSet(TypeBits, TypeBits - ShAmt);
6142 Value *And =
6143 Builder.CreateAnd(Xor, Builder.getInt(AndVal), I.getName() + ".mask");
6144 return new ICmpInst(Pred, And, Constant::getNullValue(Cst1->getType()));
6145 }
6146 }
6147
6148 // Transform "icmp eq (trunc (lshr(X, cst1)), cst" to
6149 // "icmp (and X, mask), cst"
6150 uint64_t ShAmt = 0;
6151 if (Op0->hasOneUse() &&
6152 match(Op0, m_Trunc(m_OneUse(m_LShr(m_Value(A), m_ConstantInt(ShAmt))))) &&
6153 match(Op1, m_ConstantInt(Cst1)) &&
6154 // Only do this when A has multiple uses. This is most important to do
6155 // when it exposes other optimizations.
6156 !A->hasOneUse()) {
6157 unsigned ASize = cast<IntegerType>(A->getType())->getPrimitiveSizeInBits();
6158
6159 if (ShAmt < ASize) {
6160 APInt MaskV =
6162 MaskV <<= ShAmt;
6163
6164 APInt CmpV = Cst1->getValue().zext(ASize);
6165 CmpV <<= ShAmt;
6166
6167 Value *Mask = Builder.CreateAnd(A, Builder.getInt(MaskV));
6168 return new ICmpInst(Pred, Mask, Builder.getInt(CmpV));
6169 }
6170 }
6171
6173 return ICmp;
6174
6175 // Match icmp eq (trunc (lshr A, BW), (ashr (trunc A), BW-1)), which checks
6176 // the top BW/2 + 1 bits are all the same. Create "A >=s INT_MIN && A <=s
6177 // INT_MAX", which we generate as "icmp ult (add A, 2^(BW-1)), 2^BW" to skip a
6178 // few steps of instcombine.
6179 unsigned BitWidth = Op0->getType()->getScalarSizeInBits();
6180 if (match(Op0, m_AShr(m_Trunc(m_Value(A)), m_SpecificInt(BitWidth - 1))) &&
6182 A->getType()->getScalarSizeInBits() == BitWidth * 2 &&
6183 (I.getOperand(0)->hasOneUse() || I.getOperand(1)->hasOneUse())) {
6185 Value *Add = Builder.CreateAdd(A, ConstantInt::get(A->getType(), C));
6186 return new ICmpInst(Pred == ICmpInst::ICMP_EQ ? ICmpInst::ICMP_ULT
6188 Add, ConstantInt::get(A->getType(), C.shl(1)));
6189 }
6190
6191 // Canonicalize:
6192 // Assume B_Pow2 != 0
6193 // 1. A & B_Pow2 != B_Pow2 -> A & B_Pow2 == 0
6194 // 2. A & B_Pow2 == B_Pow2 -> A & B_Pow2 != 0
6195 if (match(Op0, m_c_And(m_Specific(Op1), m_Value())) &&
6196 isKnownToBeAPowerOfTwo(Op1, /* OrZero */ false, &I))
6197 return new ICmpInst(CmpInst::getInversePredicate(Pred), Op0,
6199
6200 if (match(Op1, m_c_And(m_Specific(Op0), m_Value())) &&
6201 isKnownToBeAPowerOfTwo(Op0, /* OrZero */ false, &I))
6202 return new ICmpInst(CmpInst::getInversePredicate(Pred), Op1,
6203 ConstantInt::getNullValue(Op1->getType()));
6204
6205 // Canonicalize:
6206 // icmp eq/ne X, OneUse(rotate-right(X))
6207 // -> icmp eq/ne X, rotate-left(X)
6208 // We generally try to convert rotate-right -> rotate-left, this just
6209 // canonicalizes another case.
6210 if (match(&I, m_c_ICmp(m_Value(A),
6211 m_OneUse(m_Intrinsic<Intrinsic::fshr>(
6212 m_Deferred(A), m_Deferred(A), m_Value(B))))))
6213 return new ICmpInst(
6214 Pred, A,
6215 Builder.CreateIntrinsic(Op0->getType(), Intrinsic::fshl, {A, A, B}));
6216
6217 // Canonicalize:
6218 // icmp eq/ne OneUse(A ^ Cst), B --> icmp eq/ne (A ^ B), Cst
6219 Constant *Cst;
6222 return new ICmpInst(Pred, Builder.CreateXor(A, B), Cst);
6223
6224 {
6225 // (icmp eq/ne (and (add/sub/xor X, P2), P2), P2)
6226 auto m_Matcher =
6229 m_Sub(m_Value(B), m_Deferred(A)));
6230 std::optional<bool> IsZero = std::nullopt;
6231 if (match(&I, m_c_ICmp(m_OneUse(m_c_And(m_Value(A), m_Matcher)),
6232 m_Deferred(A))))
6233 IsZero = false;
6234 // (icmp eq/ne (and (add/sub/xor X, P2), P2), 0)
6235 else if (match(&I,
6236 m_ICmp(m_OneUse(m_c_And(m_Value(A), m_Matcher)), m_Zero())))
6237 IsZero = true;
6238
6239 if (IsZero && isKnownToBeAPowerOfTwo(A, /* OrZero */ true, &I))
6240 // (icmp eq/ne (and (add/sub/xor X, P2), P2), P2)
6241 // -> (icmp eq/ne (and X, P2), 0)
6242 // (icmp eq/ne (and (add/sub/xor X, P2), P2), 0)
6243 // -> (icmp eq/ne (and X, P2), P2)
6244 return new ICmpInst(Pred, Builder.CreateAnd(B, A),
6245 *IsZero ? A
6246 : ConstantInt::getNullValue(A->getType()));
6247 }
6248
6249 if (auto *Res = foldICmpEqualityWithOffset(
6250 I, Builder, getSimplifyQuery().getWithInstruction(&I)))
6251 return Res;
6252
6253 return nullptr;
6254}
6255
// (Visible body of) foldICmpWithTrunc: folds 'icmp (trunc X), C' patterns.
// NOTE(review): the defining signature line is elided in this listing;
// presumably 'Instruction *InstCombinerImpl::foldICmpWithTrunc(ICmpInst &ICmp)'
// -- confirm against the full file.
6257 ICmpInst::Predicate Pred = ICmp.getPredicate();
6258 Value *Op0 = ICmp.getOperand(0), *Op1 = ICmp.getOperand(1);
6259
6260 // Try to canonicalize trunc + compare-to-constant into a mask + cmp.
6261 // The trunc masks high bits while the compare may effectively mask low bits.
6262 Value *X;
6263 const APInt *C;
// Only a one-use trunc compared against an integer (or splat) constant.
6264 if (!match(Op0, m_OneUse(m_Trunc(m_Value(X)))) || !match(Op1, m_APInt(C)))
6265 return nullptr;
6266
6267 // This matches patterns corresponding to tests of the signbit as well as:
6268 // (trunc X) pred C2 --> (X & Mask) == C
6269 if (auto Res = decomposeBitTestICmp(Op0, Op1, Pred, /*WithTrunc=*/true,
6270 /*AllowNonZeroC=*/true)) {
6271 Value *And = Builder.CreateAnd(Res->X, Res->Mask);
// This inner 'C' intentionally shadows the outer one: it is the rewritten
// constant for the decomposed bit-test compare.
6272 Constant *C = ConstantInt::get(Res->X->getType(), Res->C);
6273 return new ICmpInst(Res->Pred, And, C);
6274 }
6275
6276 unsigned SrcBits = X->getType()->getScalarSizeInBits();
// (trunc (cttz/ctlz Y)) cmp C: the intrinsic's result is bounded by the
// source bit width, so the compare may be folded in the wider type provided
// the truncated destination can still represent the largest possible result.
6277 if (auto *II = dyn_cast<IntrinsicInst>(X)) {
6278 if (II->getIntrinsicID() == Intrinsic::cttz ||
6279 II->getIntrinsicID() == Intrinsic::ctlz) {
6280 unsigned MaxRet = SrcBits;
6281 // If the "is_zero_poison" argument is set, then we know at least
6282 // one bit is set in the input, so the result is always at least one
6283 // less than the full bitwidth of that input.
6284 if (match(II->getArgOperand(1), m_One()))
6285 MaxRet--;
6286
6287 // Make sure the destination is wide enough to hold the largest output of
6288 // the intrinsic.
6289 if (llvm::Log2_32(MaxRet) + 1 <= Op0->getType()->getScalarSizeInBits())
6290 if (Instruction *I =
6291 foldICmpIntrinsicWithConstant(ICmp, II, C->zext(SrcBits)))
6292 return I;
6293 }
6294 }
6295
6296 return nullptr;
6297}
6298
// (Visible body of) foldICmpWithZextOrSext: folds 'icmp (zext/sext X), Y'
// where Y is another extension or a constant.
// NOTE(review): the defining signature line is elided in this listing.
6300 assert(isa<CastInst>(ICmp.getOperand(0)) && "Expected cast for operand 0");
6301 auto *CastOp0 = cast<CastInst>(ICmp.getOperand(0));
6302 Value *X;
6303 if (!match(CastOp0, m_ZExtOrSExt(m_Value(X))))
6304 return nullptr;
6305
6306 bool IsSignedExt = CastOp0->getOpcode() == Instruction::SExt;
6307 bool IsSignedCmp = ICmp.isSigned();
6308
6309 // icmp Pred (ext X), (ext Y)
6310 Value *Y;
6311 if (match(ICmp.getOperand(1), m_ZExtOrSExt(m_Value(Y)))) {
6312 bool IsZext0 = isa<ZExtInst>(ICmp.getOperand(0));
6313 bool IsZext1 = isa<ZExtInst>(ICmp.getOperand(1));
6314
// Mismatched zext/sext operands are only foldable in the special cases below.
6315 if (IsZext0 != IsZext1) {
6316 // If X and Y and both i1
6317 // (icmp eq/ne (zext X) (sext Y))
6318 // eq -> (icmp eq (or X, Y), 0)
6319 // ne -> (icmp ne (or X, Y), 0)
6320 if (ICmp.isEquality() && X->getType()->isIntOrIntVectorTy(1) &&
6321 Y->getType()->isIntOrIntVectorTy(1))
6322 return new ICmpInst(ICmp.getPredicate(), Builder.CreateOr(X, Y),
6323 Constant::getNullValue(X->getType()));
6324
6325 // If we have mismatched casts and zext has the nneg flag, we can
6326 // treat the "zext nneg" as "sext". Otherwise, we cannot fold and quit.
6327
6328 auto *NonNegInst0 = dyn_cast<PossiblyNonNegInst>(ICmp.getOperand(0));
6329 auto *NonNegInst1 = dyn_cast<PossiblyNonNegInst>(ICmp.getOperand(1));
6330
6331 bool IsNonNeg0 = NonNegInst0 && NonNegInst0->hasNonNeg();
6332 bool IsNonNeg1 = NonNegInst1 && NonNegInst1->hasNonNeg();
6333
6334 if ((IsZext0 && IsNonNeg0) || (IsZext1 && IsNonNeg1))
6335 IsSignedExt = true;
6336 else
6337 return nullptr;
6338 }
6339
6340 // Not an extension from the same type?
6341 Type *XTy = X->getType(), *YTy = Y->getType();
6342 if (XTy != YTy) {
6343 // One of the casts must have one use because we are creating a new cast.
6344 if (!ICmp.getOperand(0)->hasOneUse() && !ICmp.getOperand(1)->hasOneUse())
6345 return nullptr;
6346 // Extend the narrower operand to the type of the wider operand.
6347 CastInst::CastOps CastOpcode =
6348 IsSignedExt ? Instruction::SExt : Instruction::ZExt;
6349 if (XTy->getScalarSizeInBits() < YTy->getScalarSizeInBits())
6350 X = Builder.CreateCast(CastOpcode, X, YTy);
6351 else if (YTy->getScalarSizeInBits() < XTy->getScalarSizeInBits())
6352 Y = Builder.CreateCast(CastOpcode, Y, XTy);
6353 else
// Same scalar width but different types: nothing sensible to do.
6354 return nullptr;
6355 }
6356
6357 // (zext X) == (zext Y) --> X == Y
6358 // (sext X) == (sext Y) --> X == Y
6359 if (ICmp.isEquality())
6360 return new ICmpInst(ICmp.getPredicate(), X, Y);
6361
6362 // A signed comparison of sign extended values simplifies into a
6363 // signed comparison.
6364 if (IsSignedCmp && IsSignedExt)
6365 return new ICmpInst(ICmp.getPredicate(), X, Y);
6366
6367 // The other three cases all fold into an unsigned comparison.
6368 return new ICmpInst(ICmp.getUnsignedPredicate(), X, Y);
6369 }
6370
6371 // Below here, we are only folding a compare with constant.
6372 auto *C = dyn_cast<Constant>(ICmp.getOperand(1));
6373 if (!C)
6374 return nullptr;
6375
6376 // If a lossless truncate is possible...
6377 Type *SrcTy = CastOp0->getSrcTy();
6378 Constant *Res = getLosslessTrunc(C, SrcTy, CastOp0->getOpcode());
6379 if (Res) {
6380 if (ICmp.isEquality())
6381 return new ICmpInst(ICmp.getPredicate(), X, Res);
6382
6383 // A signed comparison of sign extended values simplifies into a
6384 // signed comparison.
6385 if (IsSignedExt && IsSignedCmp)
6386 return new ICmpInst(ICmp.getPredicate(), X, Res);
6387
6388 // The other three cases all fold into an unsigned comparison.
6389 return new ICmpInst(ICmp.getUnsignedPredicate(), X, Res);
6390 }
6391
6392 // The re-extended constant changed, partly changed (in the case of a vector),
6393 // or could not be determined to be equal (in the case of a constant
6394 // expression), so the constant cannot be represented in the shorter type.
6395 // All the cases that fold to true or false will have already been handled
6396 // by simplifyICmpInst, so only deal with the tricky case.
6397 if (IsSignedCmp || !IsSignedExt || !isa<ConstantInt>(C))
6398 return nullptr;
6399
6400 // Is source op positive?
6401 // icmp ult (sext X), C --> icmp sgt X, -1
6402 if (ICmp.getPredicate() == ICmpInst::ICMP_ULT)
// NOTE(review): the return statement for this branch is elided in this
// listing -- confirm against the full file.
6404
6405 // Is source op negative?
6406 // icmp ugt (sext X), C --> icmp slt X, 0
6407 assert(ICmp.getPredicate() == ICmpInst::ICMP_UGT && "ICmp should be folded!");
// NOTE(review): the final return statement is elided in this listing.
6409}
6410
6411/// Handle icmp (cast x), (cast or constant).
// NOTE(review): the defining signature line (foldICmpWithCastOp) is elided in
// this listing.
6413 // If any operand of ICmp is a inttoptr roundtrip cast then remove it as
6414 // icmp compares only pointer's value.
6415 // icmp (inttoptr (ptrtoint p1)), p2 --> icmp p1, p2.
6416 Value *SimplifiedOp0 = simplifyIntToPtrRoundTripCast(ICmp.getOperand(0));
6417 Value *SimplifiedOp1 = simplifyIntToPtrRoundTripCast(ICmp.getOperand(1));
6418 if (SimplifiedOp0 || SimplifiedOp1)
6419 return new ICmpInst(ICmp.getPredicate(),
6420 SimplifiedOp0 ? SimplifiedOp0 : ICmp.getOperand(0),
6421 SimplifiedOp1 ? SimplifiedOp1 : ICmp.getOperand(1));
6422
6423 auto *CastOp0 = dyn_cast<CastInst>(ICmp.getOperand(0));
6424 if (!CastOp0)
6425 return nullptr;
6426 if (!isa<Constant>(ICmp.getOperand(1)) && !isa<CastInst>(ICmp.getOperand(1)))
6427 return nullptr;
6428
6429 Value *Op0Src = CastOp0->getOperand(0);
6430 Type *SrcTy = CastOp0->getSrcTy();
6431 Type *DestTy = CastOp0->getDestTy();
6432
6433 // Turn icmp (ptrtoint x), (ptrtoint/c) into a compare of the input if the
6434 // integer type is the same size as the pointer type.
6435 auto CompatibleSizes = [&](Type *PtrTy, Type *IntTy) {
// For vector compares the size check is made on the element types.
6436 if (isa<VectorType>(PtrTy)) {
6437 PtrTy = cast<VectorType>(PtrTy)->getElementType();
6438 IntTy = cast<VectorType>(IntTy)->getElementType();
6439 }
6440 return DL.getPointerTypeSizeInBits(PtrTy) == IntTy->getIntegerBitWidth();
6441 };
6442 if (CastOp0->getOpcode() == Instruction::PtrToInt &&
6443 CompatibleSizes(SrcTy, DestTy)) {
6444 Value *NewOp1 = nullptr;
6445 if (auto *PtrToIntOp1 = dyn_cast<PtrToIntOperator>(ICmp.getOperand(1))) {
6446 Value *PtrSrc = PtrToIntOp1->getOperand(0);
6447 if (PtrSrc->getType() == Op0Src->getType())
6448 NewOp1 = PtrToIntOp1->getOperand(0);
6449 } else if (auto *RHSC = dyn_cast<Constant>(ICmp.getOperand(1))) {
// Constant RHS: move the constant into the pointer domain instead.
6450 NewOp1 = ConstantExpr::getIntToPtr(RHSC, SrcTy);
6451 }
6452
6453 if (NewOp1)
6454 return new ICmpInst(ICmp.getPredicate(), Op0Src, NewOp1);
6455 }
6456
6457 // Do the same in the other direction for icmp (inttoptr x), (inttoptr/c).
6458 if (CastOp0->getOpcode() == Instruction::IntToPtr &&
6459 CompatibleSizes(DestTy, SrcTy)) {
6460 Value *NewOp1 = nullptr;
6461 if (auto *IntToPtrOp1 = dyn_cast<IntToPtrInst>(ICmp.getOperand(1))) {
6462 Value *IntSrc = IntToPtrOp1->getOperand(0);
6463 if (IntSrc->getType() == Op0Src->getType())
6464 NewOp1 = IntToPtrOp1->getOperand(0);
6465 } else if (auto *RHSC = dyn_cast<Constant>(ICmp.getOperand(1))) {
6466 NewOp1 = ConstantFoldConstant(ConstantExpr::getPtrToInt(RHSC, SrcTy), DL);
6467 }
6468
6469 if (NewOp1)
6470 return new ICmpInst(ICmp.getPredicate(), Op0Src, NewOp1);
6471 }
6472
// Fall back to the trunc fold, then the zext/sext fold.
6473 if (Instruction *R = foldICmpWithTrunc(ICmp))
6474 return R;
6475
6476 return foldICmpWithZextOrSext(ICmp);
6477}
6478
// isNeutralValue: returns true when RHS is the identity element for BinaryOp,
// i.e. op(LHS, RHS) == LHS for every LHS (add/sub: 0; mul: 1).
// NOTE(review): the first half of the signature is elided in this listing.
6480 bool IsSigned) {
6481 switch (BinaryOp) {
6482 default:
6483 llvm_unreachable("Unsupported binary op");
6484 case Instruction::Add:
6485 case Instruction::Sub:
// x + 0 == x and x - 0 == x.
6486 return match(RHS, m_Zero());
6487 case Instruction::Mul:
// x * 1 == x, except signed i1, where the all-ones "1" is -1.
6488 return !(RHS->getType()->isIntOrIntVectorTy(1) && IsSigned) &&
6489 match(RHS, m_One());
6490 }
6491}
6492
// computeOverflow: dispatches to the signed/unsigned overflow analysis for the
// given binary opcode, using CxtI as the context instruction.
// NOTE(review): the leading line(s) of the signature are elided in this
// listing.
6495 bool IsSigned, Value *LHS, Value *RHS,
6496 Instruction *CxtI) const {
6497 switch (BinaryOp) {
6498 default:
6499 llvm_unreachable("Unsupported binary op");
6500 case Instruction::Add:
6501 if (IsSigned)
6502 return computeOverflowForSignedAdd(LHS, RHS, CxtI);
6503 else
6504 return computeOverflowForUnsignedAdd(LHS, RHS, CxtI);
6505 case Instruction::Sub:
6506 if (IsSigned)
6507 return computeOverflowForSignedSub(LHS, RHS, CxtI);
6508 else
6509 return computeOverflowForUnsignedSub(LHS, RHS, CxtI);
6510 case Instruction::Mul:
6511 if (IsSigned)
6512 return computeOverflowForSignedMul(LHS, RHS, CxtI);
6513 else
6514 return computeOverflowForUnsignedMul(LHS, RHS, CxtI);
6515 }
6516}
6517
// OptimizeOverflowCheck: given an op.with.overflow-style check on
// (LHS BinaryOp RHS), try to prove the overflow outcome statically.
// On success, sets Result to the value to use for the arithmetic result and
// Overflow to a constant i1 (possibly a vector of i1), and returns true.
6518bool InstCombinerImpl::OptimizeOverflowCheck(Instruction::BinaryOps BinaryOp,
6519 bool IsSigned, Value *LHS,
6520 Value *RHS, Instruction &OrigI,
6521 Value *&Result,
6522 Constant *&Overflow) {
// Canonicalize a constant to the RHS for commutative ops.
6523 if (OrigI.isCommutative() && isa<Constant>(LHS) && !isa<Constant>(RHS))
6524 std::swap(LHS, RHS);
6525
6526 // If the overflow check was an add followed by a compare, the insertion point
6527 // may be pointing to the compare. We want to insert the new instructions
6528 // before the add in case there are uses of the add between the add and the
6529 // compare.
6530 Builder.SetInsertPoint(&OrigI);
6531
// Overflow flag type: i1, or a vector of i1 matching the operand count.
6532 Type *OverflowTy = Type::getInt1Ty(LHS->getContext());
6533 if (auto *LHSTy = dyn_cast<VectorType>(LHS->getType()))
6534 OverflowTy = VectorType::get(OverflowTy, LHSTy->getElementCount());
6535
// op(LHS, identity) never overflows; the result is just LHS.
6536 if (isNeutralValue(BinaryOp, RHS, IsSigned)) {
6537 Result = LHS;
6538 Overflow = ConstantInt::getFalse(OverflowTy);
6539 return true;
6540 }
6541
// NOTE(review): the 'case OverflowResult::...' labels of this switch are
// elided in this listing; the three arms below are, in order: may-overflow
// (give up), always-overflows (Overflow = true), never-overflows
// (Overflow = false, and the op can carry nsw/nuw).
6542 switch (computeOverflow(BinaryOp, IsSigned, LHS, RHS, &OrigI)) {
6544 return false;
6547 Result = Builder.CreateBinOp(BinaryOp, LHS, RHS);
6548 Result->takeName(&OrigI);
6549 Overflow = ConstantInt::getTrue(OverflowTy);
6550 return true;
6552 Result = Builder.CreateBinOp(BinaryOp, LHS, RHS);
6553 Result->takeName(&OrigI);
6554 Overflow = ConstantInt::getFalse(OverflowTy);
6555 if (auto *Inst = dyn_cast<Instruction>(Result)) {
6556 if (IsSigned)
6557 Inst->setHasNoSignedWrap();
6558 else
6559 Inst->setHasNoUnsignedWrap();
6560 }
6561 return true;
6562 }
6563
6564 llvm_unreachable("Unexpected overflow result");
6565}
6566
6567/// Recognize and process idiom involving test for multiplication
6568/// overflow.
6569///
6570/// The caller has matched a pattern of the form:
6571/// I = cmp u (mul(zext A, zext B), V
6572/// The function checks if this is a test for overflow and if so replaces
6573/// multiplication with call to 'mul.with.overflow' intrinsic.
6574///
6575/// \param I Compare instruction.
6576/// \param MulVal Result of 'mult' instruction. It is one of the arguments of
6577/// the compare instruction. Must be of integer type.
6578/// \param OtherVal The other argument of compare instruction.
6579/// \returns Instruction which must replace the compare instruction, NULL if no
6580/// replacement required.
// NOTE(review): the first line of the signature (processUMulZExtIdiom) is
// elided in this listing.
6582 const APInt *OtherVal,
6583 InstCombinerImpl &IC) {
6584 // Don't bother doing this transformation for pointers, don't do it for
6585 // vectors.
6586 if (!isa<IntegerType>(MulVal->getType()))
6587 return nullptr;
6588
6589 auto *MulInstr = dyn_cast<Instruction>(MulVal);
6590 if (!MulInstr)
6591 return nullptr;
6592 assert(MulInstr->getOpcode() == Instruction::Mul);
6593
6594 auto *LHS = cast<ZExtInst>(MulInstr->getOperand(0)),
6595 *RHS = cast<ZExtInst>(MulInstr->getOperand(1));
6596 assert(LHS->getOpcode() == Instruction::ZExt);
6597 assert(RHS->getOpcode() == Instruction::ZExt);
6598 Value *A = LHS->getOperand(0), *B = RHS->getOperand(0);
6599
6600 // Calculate type and width of the result produced by mul.with.overflow.
// The intrinsic is emitted at the width of the wider pre-extension operand.
6601 Type *TyA = A->getType(), *TyB = B->getType();
6602 unsigned WidthA = TyA->getPrimitiveSizeInBits(),
6603 WidthB = TyB->getPrimitiveSizeInBits();
6604 unsigned MulWidth;
6605 Type *MulType;
6606 if (WidthB > WidthA) {
6607 MulWidth = WidthB;
6608 MulType = TyB;
6609 } else {
6610 MulWidth = WidthA;
6611 MulType = TyA;
6612 }
6613
6614 // In order to replace the original mul with a narrower mul.with.overflow,
6615 // all uses must ignore upper bits of the product. The number of used low
6616 // bits must be not greater than the width of mul.with.overflow.
6617 if (MulVal->hasNUsesOrMore(2))
6618 for (User *U : MulVal->users()) {
6619 if (U == &I)
6620 continue;
6621 if (TruncInst *TI = dyn_cast<TruncInst>(U)) {
6622 // Check if truncation ignores bits above MulWidth.
6623 unsigned TruncWidth = TI->getType()->getPrimitiveSizeInBits();
6624 if (TruncWidth > MulWidth)
6625 return nullptr;
6626 } else if (BinaryOperator *BO = dyn_cast<BinaryOperator>(U)) {
6627 // Check if AND ignores bits above MulWidth.
6628 if (BO->getOpcode() != Instruction::And)
6629 return nullptr;
6630 if (ConstantInt *CI = dyn_cast<ConstantInt>(BO->getOperand(1))) {
6631 const APInt &CVal = CI->getValue();
// The mask's highest set bit must lie within the narrow mul width.
6632 if (CVal.getBitWidth() - CVal.countl_zero() > MulWidth)
6633 return nullptr;
6634 } else {
6635 // In this case we could have the operand of the binary operation
6636 // being defined in another block, and performing the replacement
6637 // could break the dominance relation.
6638 return nullptr;
6639 }
6640 } else {
6641 // Other uses prohibit this transformation.
6642 return nullptr;
6643 }
6644 }
6645
6646 // Recognize patterns
6647 switch (I.getPredicate()) {
6648 case ICmpInst::ICMP_UGT: {
6649 // Recognize pattern:
6650 // mulval = mul(zext A, zext B)
6651 // cmp ugt mulval, max
6652 APInt MaxVal = APInt::getMaxValue(MulWidth);
6653 MaxVal = MaxVal.zext(OtherVal->getBitWidth());
6654 if (MaxVal.eq(*OtherVal))
6655 break; // Recognized
6656 return nullptr;
6657 }
6658
6659 case ICmpInst::ICMP_ULT: {
6660 // Recognize pattern:
6661 // mulval = mul(zext A, zext B)
6662 // cmp ule mulval, max + 1
6663 APInt MaxVal = APInt::getOneBitSet(OtherVal->getBitWidth(), MulWidth);
6664 if (MaxVal.eq(*OtherVal))
6665 break; // Recognized
6666 return nullptr;
6667 }
6668
6669 default:
6670 return nullptr;
6671 }
6672
6673 InstCombiner::BuilderTy &Builder = IC.Builder;
6674 Builder.SetInsertPoint(MulInstr);
6675
6676 // Replace: mul(zext A, zext B) --> mul.with.overflow(A, B)
6677 Value *MulA = A, *MulB = B;
6678 if (WidthA < MulWidth)
6679 MulA = Builder.CreateZExt(A, MulType);
6680 if (WidthB < MulWidth)
6681 MulB = Builder.CreateZExt(B, MulType);
6682 CallInst *Call =
6683 Builder.CreateIntrinsic(Intrinsic::umul_with_overflow, MulType,
6684 {MulA, MulB}, /*FMFSource=*/nullptr, "umul");
6685 IC.addToWorklist(MulInstr);
6686
6687 // If there are uses of mul result other than the comparison, we know that
6688 // they are truncation or binary AND. Change them to use result of
6689 // mul.with.overflow and adjust properly mask/size.
6690 if (MulVal->hasNUsesOrMore(2)) {
6691 Value *Mul = Builder.CreateExtractValue(Call, 0, "umul.value");
6692 for (User *U : make_early_inc_range(MulVal->users())) {
6693 if (U == &I)
6694 continue;
6695 if (TruncInst *TI = dyn_cast<TruncInst>(U)) {
6696 if (TI->getType()->getPrimitiveSizeInBits() == MulWidth)
6697 IC.replaceInstUsesWith(*TI, Mul);
6698 else
6699 TI->setOperand(0, Mul);
6700 } else if (BinaryOperator *BO = dyn_cast<BinaryOperator>(U)) {
6701 assert(BO->getOpcode() == Instruction::And);
6702 // Replace (mul & mask) --> zext (mul.with.overflow & short_mask)
6703 ConstantInt *CI = cast<ConstantInt>(BO->getOperand(1));
6704 APInt ShortMask = CI->getValue().trunc(MulWidth);
6705 Value *ShortAnd = Builder.CreateAnd(Mul, ShortMask);
6706 Value *Zext = Builder.CreateZExt(ShortAnd, BO->getType());
6707 IC.replaceInstUsesWith(*BO, Zext);
6708 } else {
6709 llvm_unreachable("Unexpected Binary operation");
6710 }
6711 IC.addToWorklist(cast<Instruction>(U));
6712 }
6713 }
6714
6715 // The original icmp gets replaced with the overflow value, maybe inverted
6716 // depending on predicate.
// ult was "no overflow", so the extracted overflow bit must be negated.
6717 if (I.getPredicate() == ICmpInst::ICMP_ULT) {
6718 Value *Res = Builder.CreateExtractValue(Call, 1);
6719 return BinaryOperator::CreateNot(Res);
6720 }
6721
6722 return ExtractValueInst::Create(Call, 1);
6723}
6724
6725/// When performing a comparison against a constant, it is possible that not all
6726/// the bits in the LHS are demanded. This helper method computes the mask that
6727/// IS demanded.
// NOTE(review): the defining signature line (getDemandedBitsLHSMask) is elided
// in this listing.
6729 const APInt *RHS;
6730 if (!match(I.getOperand(1), m_APInt(RHS)))
// NOTE(review): the return statement for the non-constant-RHS path is elided
// here (presumably all bits demanded) -- confirm against the full file.
6732
6733 // If this is a normal comparison, it demands all bits. If it is a sign bit
6734 // comparison, it only demands the sign bit.
6735 bool UnusedBit;
6736 if (isSignBitCheck(I.getPredicate(), *RHS, UnusedBit))
// NOTE(review): the sign-bit-only return statement is elided here.
6738
6739 switch (I.getPredicate()) {
6740 // For a UGT comparison, we don't care about any bits that
6741 // correspond to the trailing ones of the comparand. The value of these
6742 // bits doesn't impact the outcome of the comparison, because any value
6743 // greater than the RHS must differ in a bit higher than these due to carry.
6744 case ICmpInst::ICMP_UGT:
6745 return APInt::getBitsSetFrom(BitWidth, RHS->countr_one());
6746
6747 // Similarly, for a ULT comparison, we don't care about the trailing zeros.
6748 // Any value less than the RHS must differ in a higher bit because of carries.
6749 case ICmpInst::ICMP_ULT:
6750 return APInt::getBitsSetFrom(BitWidth, RHS->countr_zero());
6751
6752 default:
// NOTE(review): the default return statement is elided in this listing.
6754 }
6755}
6756
6757/// Check that one use is in the same block as the definition and all
6758/// other uses are in blocks dominated by a given block.
6759///
6760/// \param DI Definition
6761/// \param UI Use
6762/// \param DB Block that must dominate all uses of \p DI outside
6763/// the parent block
6764/// \return true when \p UI is the only use of \p DI in the parent block
6765/// and all other uses of \p DI are in blocks dominated by \p DB.
6766///
// NOTE(review): the first line of the signature
// (InstCombinerImpl::dominatesAllUses(const Instruction *DI, ...)) is elided
// in this listing.
6768 const Instruction *UI,
6769 const BasicBlock *DB) const {
6770 assert(DI && UI && "Instruction not defined\n");
6771 // Ignore incomplete definitions.
6772 if (!DI->getParent())
6773 return false;
6774 // DI and UI must be in the same block.
6775 if (DI->getParent() != UI->getParent())
6776 return false;
6777 // Protect from self-referencing blocks.
6778 if (DI->getParent() == DB)
6779 return false;
// Every user other than UI must live in a block dominated by DB.
6780 for (const User *U : DI->users()) {
6781 auto *Usr = cast<Instruction>(U);
6782 if (Usr != UI && !DT.dominates(DB, Usr->getParent()))
6783 return false;
6784 }
6785 return true;
6786}
6787
6788/// Return true when the instruction sequence within a block is select-cmp-br.
6789static bool isChainSelectCmpBranch(const SelectInst *SI) {
6790 const BasicBlock *BB = SI->getParent();
6791 if (!BB)
6792 return false;
6793 auto *BI = dyn_cast_or_null<BranchInst>(BB->getTerminator());
6794 if (!BI || BI->getNumSuccessors() != 2)
6795 return false;
6796 auto *IC = dyn_cast<ICmpInst>(BI->getCondition());
6797 if (!IC || (IC->getOperand(0) != SI && IC->getOperand(1) != SI))
6798 return false;
6799 return true;
6800}
6801
6802/// True when a select result is replaced by one of its operands
6803/// in select-icmp sequence. This will eventually result in the elimination
6804/// of the select.
6805///
6806/// \param SI Select instruction
6807/// \param Icmp Compare instruction
6808/// \param SIOpd Operand that replaces the select
6809///
6810/// Notes:
6811/// - The replacement is global and requires dominator information
6812/// - The caller is responsible for the actual replacement
6813///
6814/// Example:
6815///
6816/// entry:
6817/// %4 = select i1 %3, %C* %0, %C* null
6818/// %5 = icmp eq %C* %4, null
6819/// br i1 %5, label %9, label %7
6820/// ...
6821/// ; <label>:7 ; preds = %entry
6822/// %8 = getelementptr inbounds %C* %4, i64 0, i32 0
6823/// ...
6824///
6825/// can be transformed to
6826///
6827/// %5 = icmp eq %C* %0, null
6828/// %6 = select i1 %3, i1 %5, i1 true
6829/// br i1 %6, label %9, label %7
6830/// ...
6831/// ; <label>:7 ; preds = %entry
6832/// %8 = getelementptr inbounds %C* %0, i64 0, i32 0 // replace by %0!
6833///
6834/// Similar when the first operand of the select is a constant or/and
6835/// the compare is for not equal rather than equal.
6836///
6837/// NOTE: The function is only called when the select and compare constants
6838/// are equal, the optimization can work only for EQ predicates. This is not a
6839/// major restriction since a NE compare should be 'normalized' to an equal
6840/// compare, which usually happens in the combiner and test case
6841/// select-cmp-br.ll checks for it.
// NOTE(review): the first line of the signature
// (InstCombinerImpl::replacedSelectWithOperand(SelectInst *SI, ...)) is
// elided in this listing.
6843 const ICmpInst *Icmp,
6844 const unsigned SIOpd) {
6845 assert((SIOpd == 1 || SIOpd == 2) && "Invalid select operand!");
// NOTE(review): the guard condition opening this scope (presumably checking
// isChainSelectCmpBranch and the EQ predicate) is elided in this listing.
6847 BasicBlock *Succ = SI->getParent()->getTerminator()->getSuccessor(1);
6848 // The check for the single predecessor is not the best that can be
6849 // done. But it protects efficiently against cases like when SI's
6850 // home block has two successors, Succ and Succ1, and Succ1 predecessor
6851 // of Succ. Then SI can't be replaced by SIOpd because the use that gets
6852 // replaced can be reached on either path. So the uniqueness check
6853 // guarantees that the path all uses of SI (outside SI's parent) are on
6854 // is disjoint from all other paths out of SI. But that information
6855 // is more expensive to compute, and the trade-off here is in favor
6856 // of compile-time. It should also be noticed that we check for a single
6857 // predecessor and not only uniqueness. This to handle the situation when
6858 // Succ and Succ1 points to the same basic block.
6859 if (Succ->getSinglePredecessor() && dominatesAllUses(SI, Icmp, Succ)) {
// NumSel statistic: counts selects replaced by one of their operands.
6860 NumSel++;
6861 SI->replaceUsesOutsideBlock(SI->getOperand(SIOpd), SI->getParent());
6862 return true;
6863 }
6864 }
6865 return false;
6866}
6867
6868/// Try to fold the comparison based on range information we can get by checking
6869/// whether bits are known to be zero or one in the inputs.
6871 Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
6872 Type *Ty = Op0->getType();
6873 ICmpInst::Predicate Pred = I.getPredicate();
6874
6875 // Get scalar or pointer size.
6876 unsigned BitWidth = Ty->isIntOrIntVectorTy()
6877 ? Ty->getScalarSizeInBits()
6879
6880 if (!BitWidth)
6881 return nullptr;
6882
6883 KnownBits Op0Known(BitWidth);
6884 KnownBits Op1Known(BitWidth);
6885
6886 {
6887 // Don't use dominating conditions when folding icmp using known bits. This
6888 // may convert signed into unsigned predicates in ways that other passes
6889 // (especially IndVarSimplify) may not be able to reliably undo.
6892 Op0Known, Q))
6893 return &I;
6894
6895 if (SimplifyDemandedBits(&I, 1, APInt::getAllOnes(BitWidth), Op1Known, Q))
6896 return &I;
6897 }
6898
6899 if (!isa<Constant>(Op0) && Op0Known.isConstant())
6900 return new ICmpInst(
6901 Pred, ConstantExpr::getIntegerValue(Ty, Op0Known.getConstant()), Op1);
6902 if (!isa<Constant>(Op1) && Op1Known.isConstant())
6903 return new ICmpInst(
6904 Pred, Op0, ConstantExpr::getIntegerValue(Ty, Op1Known.getConstant()));
6905
6906 if (std::optional<bool> Res = ICmpInst::compare(Op0Known, Op1Known, Pred))
6907 return replaceInstUsesWith(I, ConstantInt::getBool(I.getType(), *Res));
6908
6909 // Given the known and unknown bits, compute a range that the LHS could be
6910 // in. Compute the Min, Max and RHS values based on the known bits. For the
6911 // EQ and NE we use unsigned values.
6912 APInt Op0Min(BitWidth, 0), Op0Max(BitWidth, 0);
6913 APInt Op1Min(BitWidth, 0), Op1Max(BitWidth, 0);
6914 if (I.isSigned()) {
6915 Op0Min = Op0Known.getSignedMinValue();
6916 Op0Max = Op0Known.getSignedMaxValue();
6917 Op1Min = Op1Known.getSignedMinValue();
6918 Op1Max = Op1Known.getSignedMaxValue();
6919 } else {
6920 Op0Min = Op0Known.getMinValue();
6921 Op0Max = Op0Known.getMaxValue();
6922 Op1Min = Op1Known.getMinValue();
6923 Op1Max = Op1Known.getMaxValue();
6924 }
6925
6926 // Don't break up a clamp pattern -- (min(max X, Y), Z) -- by replacing a
6927 // min/max canonical compare with some other compare. That could lead to
6928 // conflict with select canonicalization and infinite looping.
6929 // FIXME: This constraint may go away if min/max intrinsics are canonical.
6930 auto isMinMaxCmp = [&](Instruction &Cmp) {
6931 if (!Cmp.hasOneUse())
6932 return false;
6933 Value *A, *B;
6934 SelectPatternFlavor SPF = matchSelectPattern(Cmp.user_back(), A, B).Flavor;
6936 return false;
6937 return match(Op0, m_MaxOrMin(m_Value(), m_Value())) ||
6938 match(Op1, m_MaxOrMin(m_Value(), m_Value()));
6939 };
6940 if (!isMinMaxCmp(I)) {
6941 switch (Pred) {
6942 default:
6943 break;
6944 case ICmpInst::ICMP_ULT: {
6945 if (Op1Min == Op0Max) // A <u B -> A != B if max(A) == min(B)
6946 return new ICmpInst(ICmpInst::ICMP_NE, Op0, Op1);
6947 const APInt *CmpC;
6948 if (match(Op1, m_APInt(CmpC))) {
6949 // A <u C -> A == C-1 if min(A)+1 == C
6950 if (*CmpC == Op0Min + 1)
6951 return new ICmpInst(ICmpInst::ICMP_EQ, Op0,
6952 ConstantInt::get(Op1->getType(), *CmpC - 1));
6953 // X <u C --> X == 0, if the number of zero bits in the bottom of X
6954 // exceeds the log2 of C.
6955 if (Op0Known.countMinTrailingZeros() >= CmpC->ceilLogBase2())
6956 return new ICmpInst(ICmpInst::ICMP_EQ, Op0,
6957 Constant::getNullValue(Op1->getType()));
6958 }
6959 break;
6960 }
6961 case ICmpInst::ICMP_UGT: {
6962 if (Op1Max == Op0Min) // A >u B -> A != B if min(A) == max(B)
6963 return new ICmpInst(ICmpInst::ICMP_NE, Op0, Op1);
6964 const APInt *CmpC;
6965 if (match(Op1, m_APInt(CmpC))) {
6966 // A >u C -> A == C+1 if max(a)-1 == C
6967 if (*CmpC == Op0Max - 1)
6968 return new ICmpInst(ICmpInst::ICMP_EQ, Op0,
6969 ConstantInt::get(Op1->getType(), *CmpC + 1));
6970 // X >u C --> X != 0, if the number of zero bits in the bottom of X
6971 // exceeds the log2 of C.
6972 if (Op0Known.countMinTrailingZeros() >= CmpC->getActiveBits())
6973 return new ICmpInst(ICmpInst::ICMP_NE, Op0,
6974 Constant::getNullValue(Op1->getType()));
6975 }
6976 break;
6977 }
6978 case ICmpInst::ICMP_SLT: {
6979 if (Op1Min == Op0Max) // A <s B -> A != B if max(A) == min(B)
6980 return new ICmpInst(ICmpInst::ICMP_NE, Op0, Op1);
6981 const APInt *CmpC;
6982 if (match(Op1, m_APInt(CmpC))) {
6983 if (*CmpC == Op0Min + 1) // A <s C -> A == C-1 if min(A)+1 == C
6984 return new ICmpInst(ICmpInst::ICMP_EQ, Op0,
6985 ConstantInt::get(Op1->getType(), *CmpC - 1));
6986 }
6987 break;
6988 }
6989 case ICmpInst::ICMP_SGT: {
6990 if (Op1Max == Op0Min) // A >s B -> A != B if min(A) == max(B)
6991 return new ICmpInst(ICmpInst::ICMP_NE, Op0, Op1);
6992 const APInt *CmpC;
6993 if (match(Op1, m_APInt(CmpC))) {
6994 if (*CmpC == Op0Max - 1) // A >s C -> A == C+1 if max(A)-1 == C
6995 return new ICmpInst(ICmpInst::ICMP_EQ, Op0,
6996 ConstantInt::get(Op1->getType(), *CmpC + 1));
6997 }
6998 break;
6999 }
7000 }
7001 }
7002
7003 // Based on the range information we know about the LHS, see if we can
7004 // simplify this comparison. For example, (x&4) < 8 is always true.
7005 switch (Pred) {
7006 default:
7007 break;
7008 case ICmpInst::ICMP_EQ:
7009 case ICmpInst::ICMP_NE: {
7010 // If all bits are known zero except for one, then we know at most one bit
7011 // is set. If the comparison is against zero, then this is a check to see if
7012 // *that* bit is set.
7013 APInt Op0KnownZeroInverted = ~Op0Known.Zero;
7014 if (Op1Known.isZero()) {
7015 // If the LHS is an AND with the same constant, look through it.
7016 Value *LHS = nullptr;
7017 const APInt *LHSC;
7018 if (!match(Op0, m_And(m_Value(LHS), m_APInt(LHSC))) ||
7019 *LHSC != Op0KnownZeroInverted)
7020 LHS = Op0;
7021
7022 Value *X;
7023 const APInt *C1;
7024 if (match(LHS, m_Shl(m_Power2(C1), m_Value(X)))) {
7025 Type *XTy = X->getType();
7026 unsigned Log2C1 = C1->countr_zero();
7027 APInt C2 = Op0KnownZeroInverted;
7028 APInt C2Pow2 = (C2 & ~(*C1 - 1)) + *C1;
7029 if (C2Pow2.isPowerOf2()) {
7030 // iff (C1 is pow2) & ((C2 & ~(C1-1)) + C1) is pow2):
7031 // ((C1 << X) & C2) == 0 -> X >= (Log2(C2+C1) - Log2(C1))
7032 // ((C1 << X) & C2) != 0 -> X < (Log2(C2+C1) - Log2(C1))
7033 unsigned Log2C2 = C2Pow2.countr_zero();
7034 auto *CmpC = ConstantInt::get(XTy, Log2C2 - Log2C1);
7035 auto NewPred =
7037 return new ICmpInst(NewPred, X, CmpC);
7038 }
7039 }
7040 }
7041
7042 // Op0 eq C_Pow2 -> Op0 ne 0 if Op0 is known to be C_Pow2 or zero.
7043 if (Op1Known.isConstant() && Op1Known.getConstant().isPowerOf2() &&
7044 (Op0Known & Op1Known) == Op0Known)
7045 return new ICmpInst(CmpInst::getInversePredicate(Pred), Op0,
7046 ConstantInt::getNullValue(Op1->getType()));
7047 break;
7048 }
7049 case ICmpInst::ICMP_SGE:
7050 if (Op1Min == Op0Max) // A >=s B -> A == B if max(A) == min(B)
7051 return new ICmpInst(ICmpInst::ICMP_EQ, Op0, Op1);
7052 break;
7053 case ICmpInst::ICMP_SLE:
7054 if (Op1Max == Op0Min) // A <=s B -> A == B if min(A) == max(B)
7055 return new ICmpInst(ICmpInst::ICMP_EQ, Op0, Op1);
7056 break;
7057 case ICmpInst::ICMP_UGE:
7058 if (Op1Min == Op0Max) // A >=u B -> A == B if max(A) == min(B)
7059 return new ICmpInst(ICmpInst::ICMP_EQ, Op0, Op1);
7060 break;
7061 case ICmpInst::ICMP_ULE:
7062 if (Op1Max == Op0Min) // A <=u B -> A == B if min(A) == max(B)
7063 return new ICmpInst(ICmpInst::ICMP_EQ, Op0, Op1);
7064 break;
7065 }
7066
7067 // Turn a signed comparison into an unsigned one if both operands are known to
7068 // have the same sign. Set samesign if possible (except for equality
7069 // predicates).
7070 if ((I.isSigned() || (I.isUnsigned() && !I.hasSameSign())) &&
7071 ((Op0Known.Zero.isNegative() && Op1Known.Zero.isNegative()) ||
7072 (Op0Known.One.isNegative() && Op1Known.One.isNegative()))) {
7073 I.setPredicate(I.getUnsignedPredicate());
7074 I.setSameSign();
7075 return &I;
7076 }
7077
7078 return nullptr;
7079}
7080
7081/// If one operand of an icmp is effectively a bool (value range of {0,1}),
7082/// then try to reduce patterns based on that limit.
// NOTE(review): the function signature (original line 7083) is elided in this
// extraction of the listing.
7084  Value *X, *Y;
7085  CmpPredicate Pred;
7086
7087  // X must be 0 and bool must be true for "ULT":
7088  // X <u (zext i1 Y) --> (X == 0) & Y
7089  if (match(&I, m_c_ICmp(Pred, m_Value(X), m_OneUse(m_ZExt(m_Value(Y))))) &&
7090      Y->getType()->isIntOrIntVectorTy(1) && Pred == ICmpInst::ICMP_ULT)
7091    return BinaryOperator::CreateAnd(Builder.CreateIsNull(X), Y);
7092
7093  // X must be 0 or bool must be true for "ULE":
7094  // X <=u (sext i1 Y) --> (X == 0) | Y
7095  if (match(&I, m_c_ICmp(Pred, m_Value(X), m_OneUse(m_SExt(m_Value(Y))))) &&
7096      Y->getType()->isIntOrIntVectorTy(1) && Pred == ICmpInst::ICMP_ULE)
7097    return BinaryOperator::CreateOr(Builder.CreateIsNull(X), Y);
7098
7099  // icmp eq/ne X, (zext/sext (icmp eq/ne X, C))
7100  CmpPredicate Pred1, Pred2;
7101  const APInt *C;
7102  Instruction *ExtI;
7103  if (match(&I, m_c_ICmp(Pred1, m_Value(X),
  // NOTE(review): two continuation lines of this matcher (original lines
  // 7104-7105 — presumably the zext/sext-wrapped inner icmp that binds ExtI
  // and Pred2) are elided in this extraction.
7106                                        m_APInt(C)))))) &&
7107      ICmpInst::isEquality(Pred1) && ICmpInst::isEquality(Pred2)) {
7108    bool IsSExt = ExtI->getOpcode() == Instruction::SExt;
7109    bool HasOneUse = ExtI->hasOneUse() && ExtI->getOperand(0)->hasOneUse();
    // Emits the two-sided check "X cmp 0 <or/and> X cmp (+-1)"; Or for eq,
    // And for ne, and the second bound is -1 for sext, 1 for zext.
7110    auto CreateRangeCheck = [&] {
7111      Value *CmpV1 =
7112          Builder.CreateICmp(Pred1, X, Constant::getNullValue(X->getType()));
7113      Value *CmpV2 = Builder.CreateICmp(
7114          Pred1, X, ConstantInt::getSigned(X->getType(), IsSExt ? -1 : 1));
      // NOTE(review): original line 7115 (presumably the head of a
      // BinaryOperator create call combining CmpV1/CmpV2) is elided here.
7116          Pred1 == ICmpInst::ICMP_EQ ? Instruction::Or : Instruction::And,
7117          CmpV1, CmpV2);
7118    };
7119    if (C->isZero()) {
7120      if (Pred2 == ICmpInst::ICMP_EQ) {
7121        // icmp eq X, (zext/sext (icmp eq X, 0)) --> false
7122        // icmp ne X, (zext/sext (icmp eq X, 0)) --> true
7123        return replaceInstUsesWith(
7124            I, ConstantInt::getBool(I.getType(), Pred1 == ICmpInst::ICMP_NE));
7125      } else if (!IsSExt || HasOneUse) {
7126        // icmp eq X, (zext (icmp ne X, 0)) --> X == 0 || X == 1
7127        // icmp ne X, (zext (icmp ne X, 0)) --> X != 0 && X != 1
7128        // icmp eq X, (sext (icmp ne X, 0)) --> X == 0 || X == -1
7129        // icmp ne X, (sext (icmp ne X, 0)) --> X != 0 && X != -1
7130        return CreateRangeCheck();
7131      }
7132    } else if (IsSExt ? C->isAllOnes() : C->isOne()) {
7133      if (Pred2 == ICmpInst::ICMP_NE) {
7134        // icmp eq X, (zext (icmp ne X, 1)) --> false
7135        // icmp ne X, (zext (icmp ne X, 1)) --> true
7136        // icmp eq X, (sext (icmp ne X, -1)) --> false
7137        // icmp ne X, (sext (icmp ne X, -1)) --> true
7138        return replaceInstUsesWith(
7139            I, ConstantInt::getBool(I.getType(), Pred1 == ICmpInst::ICMP_NE));
7140      } else if (!IsSExt || HasOneUse) {
7141        // icmp eq X, (zext (icmp eq X, 1)) --> X == 0 || X == 1
7142        // icmp ne X, (zext (icmp eq X, 1)) --> X != 0 && X != 1
7143        // icmp eq X, (sext (icmp eq X, -1)) --> X == 0 || X == -1
7144        // icmp ne X, (sext (icmp eq X, -1)) --> X != 0 && X != -1
7145        return CreateRangeCheck();
7146      }
7147    } else {
7148      // when C != 0 && C != 1:
7149      // icmp eq X, (zext (icmp eq X, C)) --> icmp eq X, 0
7150      // icmp eq X, (zext (icmp ne X, C)) --> icmp eq X, 1
7151      // icmp ne X, (zext (icmp eq X, C)) --> icmp ne X, 0
7152      // icmp ne X, (zext (icmp ne X, C)) --> icmp ne X, 1
7153      // when C != 0 && C != -1:
7154      // icmp eq X, (sext (icmp eq X, C)) --> icmp eq X, 0
7155      // icmp eq X, (sext (icmp ne X, C)) --> icmp eq X, -1
7156      // icmp ne X, (sext (icmp eq X, C)) --> icmp ne X, 0
7157      // icmp ne X, (sext (icmp ne X, C)) --> icmp ne X, -1
7158      return ICmpInst::Create(
7159          Instruction::ICmp, Pred1, X,
7160          ConstantInt::getSigned(X->getType(), Pred2 == ICmpInst::ICMP_NE
7161                                                   ? (IsSExt ? -1 : 1)
7162                                                   : 0));
7163    }
7164  }
7165
7166  return nullptr;
7167}
7168
7169/// If we have an icmp le or icmp ge instruction with a constant operand, turn
7170/// it into the appropriate icmp lt or icmp gt instruction. This transform
7171/// allows them to be folded in visitICmpInst.
// NOTE(review): the function signature (original line 7172) is elided in this
// extraction.
7173  ICmpInst::Predicate Pred = I.getPredicate();
  // Only relational integer predicates have a strictness to flip; the tail of
  // this bail-out condition (original line 7175) is elided in this extraction.
7174  if (ICmpInst::isEquality(Pred) || !ICmpInst::isIntPredicate(Pred) ||
7176    return nullptr;
7177
7178  Value *Op0 = I.getOperand(0);
7179  Value *Op1 = I.getOperand(1);
  // Only fold when the RHS is a constant; flipping strictness requires
  // adjusting the constant (C -> C+1 or C-1).
7180  auto *Op1C = dyn_cast<Constant>(Op1);
7181  if (!Op1C)
7182    return nullptr;
7183
  // The helper returns the equivalent strict predicate plus the adjusted
  // constant, or no value when the fold does not apply (presumably when the
  // adjusted constant would wrap — verify in the helper).
7184  auto FlippedStrictness = getFlippedStrictnessPredicateAndConstant(Pred, Op1C);
7185  if (!FlippedStrictness)
7186    return nullptr;
7187
7188  return new ICmpInst(FlippedStrictness->first, Op0, FlippedStrictness->second);
7189}
7190
7191/// If we have a comparison with a non-canonical predicate, if we can update
7192/// all the users, invert the predicate and adjust all the users.
// NOTE(review): the function signature (original line 7193) is elided in this
// extraction.
7194  // Is the predicate already canonical?
7195  CmpInst::Predicate Pred = I.getPredicate();
  // NOTE(review): original line 7196 (the early-exit test that the predicate
  // is already canonical) is elided in this extraction.
7197    return nullptr;
7198
7199  // Can all users be adjusted to predicate inversion?
7200  if (!InstCombiner::canFreelyInvertAllUsersOf(&I, /*IgnoredUser=*/nullptr))
7201    return nullptr;
7202
7203  // Ok, we can canonicalize comparison!
7204  // Let's first invert the comparison's predicate.
7205  I.setPredicate(CmpInst::getInversePredicate(Pred));
  // Rename so the inverted value is recognizable when reading the IR.
7206  I.setName(I.getName() + ".not");
7207
7208  // And, adapt users.
  // NOTE(review): original line 7209 (the call that rewrites all users to
  // consume the inverted compare) is elided in this extraction.
7210
7211  return &I;
7212}
7213
7214/// Integer compare with boolean values can always be turned into bitwise ops.
// NOTE(review): the first line of the signature (original line 7215, carrying
// the ICmpInst parameter) is elided in this extraction.
7216                                         InstCombiner::BuilderTy &Builder) {
7217  Value *A = I.getOperand(0), *B = I.getOperand(1);
7218  assert(A->getType()->isIntOrIntVectorTy(1) && "Bools only");
7219
7220  // A boolean compared to true/false can be simplified to Op0/true/false in
7221  // 14 out of the 20 (10 predicates * 2 constants) possible combinations.
7222  // Cases not handled by InstSimplify are always 'not' of Op0.
7223  if (match(B, m_Zero())) {
7224    switch (I.getPredicate()) {
7225    case CmpInst::ICMP_EQ: // A == 0 -> !A
7226    case CmpInst::ICMP_ULE: // A <=u 0 -> !A
7227    case CmpInst::ICMP_SGE: // A >=s 0 -> !A
      // NOTE(review): original line 7228 (the shared return for these three
      // cases — presumably a 'not' of A) is elided in this extraction.
7229    default:
7230      llvm_unreachable("ICmp i1 X, C not simplified as expected.");
7231    }
7232  } else if (match(B, m_One())) {
7233    switch (I.getPredicate()) {
7234    case CmpInst::ICMP_NE: // A != 1 -> !A
7235    case CmpInst::ICMP_ULT: // A <u 1 -> !A
7236    case CmpInst::ICMP_SGT: // A >s -1 -> !A
      // NOTE(review): original line 7237 (the shared return for these three
      // cases) is elided in this extraction.
7238    default:
7239      llvm_unreachable("ICmp i1 X, C not simplified as expected.");
7240    }
7241  }
7242
  // Variable-vs-variable i1 compares: each predicate maps to a short bitwise
  // form; the ugt/sgt/uge/sge cases swap operands and fall through to their
  // dual (ult/slt/ule/sle).
7243  switch (I.getPredicate()) {
7244  default:
7245    llvm_unreachable("Invalid icmp instruction!");
7246  case ICmpInst::ICMP_EQ:
7247    // icmp eq i1 A, B -> ~(A ^ B)
7248    return BinaryOperator::CreateNot(Builder.CreateXor(A, B));
7249
7250  case ICmpInst::ICMP_NE:
7251    // icmp ne i1 A, B -> A ^ B
7252    return BinaryOperator::CreateXor(A, B);
7253
7254  case ICmpInst::ICMP_UGT:
7255    // icmp ugt -> icmp ult
7256    std::swap(A, B);
7257    [[fallthrough]];
7258  case ICmpInst::ICMP_ULT:
7259    // icmp ult i1 A, B -> ~A & B
7260    return BinaryOperator::CreateAnd(Builder.CreateNot(A), B);
7261
7262  case ICmpInst::ICMP_SGT:
7263    // icmp sgt -> icmp slt
7264    std::swap(A, B);
7265    [[fallthrough]];
7266  case ICmpInst::ICMP_SLT:
7267    // icmp slt i1 A, B -> A & ~B
7268    return BinaryOperator::CreateAnd(Builder.CreateNot(B), A);
7269
7270  case ICmpInst::ICMP_UGE:
7271    // icmp uge -> icmp ule
7272    std::swap(A, B);
7273    [[fallthrough]];
7274  case ICmpInst::ICMP_ULE:
7275    // icmp ule i1 A, B -> ~A | B
7276    return BinaryOperator::CreateOr(Builder.CreateNot(A), B);
7277
7278  case ICmpInst::ICMP_SGE:
7279    // icmp sge -> icmp sle
7280    std::swap(A, B);
7281    [[fallthrough]];
7282  case ICmpInst::ICMP_SLE:
7283    // icmp sle i1 A, B -> A | ~B
7284    return BinaryOperator::CreateOr(Builder.CreateNot(B), A);
7285  }
7286}
7287
7288// Transform pattern like:
7289// (1 << Y) u<= X or ~(-1 << Y) u< X or ((1 << Y)+(-1)) u< X
7290// (1 << Y) u> X or ~(-1 << Y) u>= X or ((1 << Y)+(-1)) u>= X
7291// Into:
7292// (X l>> Y) != 0
7293// (X l>> Y) == 0
// NOTE(review): the first line of the signature (original line 7294, carrying
// the ICmpInst parameter) is elided in this extraction.
7295                                              InstCombiner::BuilderTy &Builder) {
7296  CmpPredicate Pred, NewPred;
7297  Value *X, *Y;
  // Form 1: compare against (1 << Y) itself; ule/ugt bound the value by the
  // single set bit, so the compare reduces to a shifted-zero test.
7298  if (match(&Cmp,
7299            m_c_ICmp(Pred, m_OneUse(m_Shl(m_One(), m_Value(Y))), m_Value(X)))) {
7300    switch (Pred) {
7301    case ICmpInst::ICMP_ULE:
7302      NewPred = ICmpInst::ICMP_NE;
7303      break;
7304    case ICmpInst::ICMP_UGT:
7305      NewPred = ICmpInst::ICMP_EQ;
7306      break;
7307    default:
7308      return nullptr;
7309    }
  // Form 2: compare against the low-bit mask. NOTE(review): two continuation
  // lines of this matcher (original lines 7311-7312 — presumably the
  // not-of-shl alternative) are elided in this extraction.
7310  } else if (match(&Cmp, m_c_ICmp(Pred,
7313                                      m_Add(m_Shl(m_One(), m_Value(Y)),
7314                                          m_AllOnes()))),
7315                                  m_Value(X)))) {
7316    // The variant with 'add' is not canonical, (the variant with 'not' is)
7317    // we only get it because it has extra uses, and can't be canonicalized,
7318
7319    switch (Pred) {
7320    case ICmpInst::ICMP_ULT:
7321      NewPred = ICmpInst::ICMP_NE;
7322      break;
7323    case ICmpInst::ICMP_UGE:
7324      NewPred = ICmpInst::ICMP_EQ;
7325      break;
7326    default:
7327      return nullptr;
7328    }
7329  } else
7330    return nullptr;
7331
  // Both forms reduce to testing whether X has any bit set at position Y or
  // above: (X l>> Y) ==/!= 0.
7332  Value *NewX = Builder.CreateLShr(X, Y, X->getName() + ".highbits");
7333  Constant *Zero = Constant::getNullValue(NewX->getType());
7334  return CmpInst::Create(Instruction::ICmp, NewPred, NewX, Zero);
7335}
7336
// Move a compare past vector-reverse or identity shuffles when that lets the
// shuffle be performed once on the compare result instead of on each operand.
// NOTE(review): the first line of the signature (original line 7337) is
// elided in this extraction.
7338                                      InstCombiner::BuilderTy &Builder) {
7339  const CmpInst::Predicate Pred = Cmp.getPredicate();
7340  Value *LHS = Cmp.getOperand(0), *RHS = Cmp.getOperand(1);
7341  Value *V1, *V2;
7342
  // Helper: emit 'cmp X, Y' (copying IR flags from the original compare) and
  // wrap the result in a vector_reverse call.
7343  auto createCmpReverse = [&](CmpInst::Predicate Pred, Value *X, Value *Y) {
7344    Value *V = Builder.CreateCmp(Pred, X, Y, Cmp.getName());
7345    if (auto *I = dyn_cast<Instruction>(V))
7346      I->copyIRFlags(&Cmp);
7347    Module *M = Cmp.getModule();
    // NOTE(review): original line 7348 (presumably obtaining the
    // vector_reverse intrinsic declaration 'F') is elided in this extraction.
7349        M, Intrinsic::vector_reverse, V->getType());
7350    return CallInst::Create(F, V);
7351  };
7352
7353  if (match(LHS, m_VecReverse(m_Value(V1)))) {
7354    // cmp Pred, rev(V1), rev(V2) --> rev(cmp Pred, V1, V2)
7355    if (match(RHS, m_VecReverse(m_Value(V2))) &&
7356        (LHS->hasOneUse() || RHS->hasOneUse()))
7357      return createCmpReverse(Pred, V1, V2);
7358
7359    // cmp Pred, rev(V1), RHSSplat --> rev(cmp Pred, V1, RHSSplat)
7360    if (LHS->hasOneUse() && isSplatValue(RHS))
7361      return createCmpReverse(Pred, V1, RHS);
7362  }
7363  // cmp Pred, LHSSplat, rev(V2) --> rev(cmp Pred, LHSSplat, V2)
7364  else if (isSplatValue(LHS) && match(RHS, m_OneUse(m_VecReverse(m_Value(V2)))))
7365    return createCmpReverse(Pred, LHS, V2);
7366
7367  ArrayRef<int> M;
7368  if (!match(LHS, m_Shuffle(m_Value(V1), m_Undef(), m_Mask(M))))
7369    return nullptr;
7370
7371  // If both arguments of the cmp are shuffles that use the same mask and
7372  // shuffle within a single vector, move the shuffle after the cmp:
7373  // cmp (shuffle V1, M), (shuffle V2, M) --> shuffle (cmp V1, V2), M
7374  Type *V1Ty = V1->getType();
7375  if (match(RHS, m_Shuffle(m_Value(V2), m_Undef(), m_SpecificMask(M))) &&
7376      V1Ty == V2->getType() && (LHS->hasOneUse() || RHS->hasOneUse())) {
7377    Value *NewCmp = Builder.CreateCmp(Pred, V1, V2);
7378    return new ShuffleVectorInst(NewCmp, M);
7379  }
7380
7381  // Try to canonicalize compare with splatted operand and splat constant.
7382  // TODO: We could generalize this for more than splats. See/use the code in
7383  // InstCombiner::foldVectorBinop().
7384  Constant *C;
7385  if (!LHS->hasOneUse() || !match(RHS, m_Constant(C)))
7386    return nullptr;
7387
7388  // Length-changing splats are ok, so adjust the constants as needed:
7389  // cmp (shuffle V1, M), C --> shuffle (cmp V1, C'), M
7390  Constant *ScalarC = C->getSplatValue(/* AllowPoison */ true);
7391  int MaskSplatIndex;
7392  if (ScalarC && match(M, m_SplatOrPoisonMask(MaskSplatIndex))) {
7393    // We allow poison in matching, but this transform removes it for safety.
7394    // Demanded elements analysis should be able to recover some/all of that.
7395    C = ConstantVector::getSplat(cast<VectorType>(V1Ty)->getElementCount(),
7396                                 ScalarC);
7397    SmallVector<int, 8> NewM(M.size(), MaskSplatIndex);
7398    Value *NewCmp = Builder.CreateCmp(Pred, V1, C);
7399    return new ShuffleVectorInst(NewCmp, NewM);
7400  }
7401
7402  return nullptr;
7403}
7404
7405// extract(uadd.with.overflow(A, B), 0) ult A
7406// -> extract(uadd.with.overflow(A, B), 1)
// Replaces a manual unsigned-overflow check on the sum with the intrinsic's
// own overflow bit (element 1 of the result aggregate).
// NOTE(review): the function signature (original line 7407) is elided in this
// extraction.
7408  CmpInst::Predicate Pred = I.getPredicate();
7409  Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
7410
7411  Value *UAddOv;
7412  Value *A, *B;
  // Matches the value half (index 0) of a uadd.with.overflow result.
7413  auto UAddOvResultPat = m_ExtractValue<0>(
7414      m_Intrinsic<Intrinsic::uadd_with_overflow>(m_Value(A), m_Value(B)));
7415  if (match(Op0, UAddOvResultPat) &&
7416      ((Pred == ICmpInst::ICMP_ULT && (Op1 == A || Op1 == B)) ||
7417       (Pred == ICmpInst::ICMP_EQ && match(Op1, m_ZeroInt()) &&
7418        (match(A, m_One()) || match(B, m_One()))) ||
7419       (Pred == ICmpInst::ICMP_NE && match(Op1, m_AllOnes()) &&
7420        (match(A, m_AllOnes()) || match(B, m_AllOnes())))))
7421    // extract(uadd.with.overflow(A, B), 0) < A
7422    // extract(uadd.with.overflow(A, 1), 0) == 0
7423    // extract(uadd.with.overflow(A, -1), 0) != -1
7424    UAddOv = cast<ExtractValueInst>(Op0)->getAggregateOperand();
7425  else if (match(Op1, UAddOvResultPat) && Pred == ICmpInst::ICMP_UGT &&
7426           (Op0 == A || Op0 == B))
7427    // A > extract(uadd.with.overflow(A, B), 0)
7428    UAddOv = cast<ExtractValueInst>(Op1)->getAggregateOperand();
7429  else
7430    return nullptr;
7431
  // Return the overflow flag (index 1) of the matched intrinsic call.
7432  return ExtractValueInst::Create(UAddOv, 1);
7433}
7434
// Fold 'icmp (launder/strip.invariant.group P), 0' --> 'icmp P, 0': the
// launder/strip intrinsics do not change pointer null-ness.
// NOTE(review): the function signature (original line 7435) and the head of
// the call on lines 7438-7439 (original line 7437 — presumably a
// NullPointerIsDefined check on this address space) are elided in this
// extraction; confirm against upstream before relying on the exact guard.
7436  if (!I.getOperand(0)->getType()->isPointerTy() ||
7438          I.getParent()->getParent(),
7439          I.getOperand(0)->getType()->getPointerAddressSpace())) {
7440    return nullptr;
7441  }
7442  Instruction *Op;
7443  if (match(I.getOperand(0), m_Instruction(Op)) &&
7444      match(I.getOperand(1), m_Zero()) &&
7445      Op->isLaunderOrStripInvariantGroup()) {
    // Compare the intrinsic's pointer operand directly against null.
7446    return ICmpInst::Create(Instruction::ICmp, I.getPredicate(),
7447                            Op->getOperand(0), I.getOperand(1));
7448  }
7449  return nullptr;
7450}
7451
7452/// This function folds patterns produced by lowering of reduce idioms, such as
7453/// llvm.vector.reduce.and which are lowered into instruction chains. This code
7454/// attempts to generate fewer number of scalar comparisons instead of vector
7455/// comparisons when possible.
// NOTE(review): the first line of the signature (original line 7456) is
// elided in this extraction.
7457                                      InstCombiner::BuilderTy &Builder,
7458                                      const DataLayout &DL) {
  // Only the scalar (i1) compare at the root of the idiom is handled.
7459  if (I.getType()->isVectorTy())
7460    return nullptr;
7461  CmpPredicate OuterPred, InnerPred;
7462  Value *LHS, *RHS;
7463
7464  // Match lowering of @llvm.vector.reduce.and. Turn
7465  /// %vec_ne = icmp ne <8 x i8> %lhs, %rhs
7466  /// %scalar_ne = bitcast <8 x i1> %vec_ne to i8
7467  /// %res = icmp <pred> i8 %scalar_ne, 0
7468  ///
7469  /// into
7470  ///
7471  /// %lhs.scalar = bitcast <8 x i8> %lhs to i64
7472  /// %rhs.scalar = bitcast <8 x i8> %rhs to i64
7473  /// %res = icmp <pred> i64 %lhs.scalar, %rhs.scalar
7474  ///
7475  /// for <pred> in {ne, eq}.
7476  if (!match(&I, m_ICmp(OuterPred,
  // NOTE(review): one continuation line of this matcher (original line 7477 —
  // presumably the one-use bitcast wrapping the inner icmp) is elided in this
  // extraction.
7478                            m_ICmp(InnerPred, m_Value(LHS), m_Value(RHS))))),
7479                        m_Zero())))
7480    return nullptr;
  // Restrict to fixed-width integer element vectors so the whole operand can
  // be reinterpreted as one integer.
7481  auto *LHSTy = dyn_cast<FixedVectorType>(LHS->getType());
7482  if (!LHSTy || !LHSTy->getElementType()->isIntegerTy())
7483    return nullptr;
7484  unsigned NumBits =
7485      LHSTy->getNumElements() * LHSTy->getElementType()->getIntegerBitWidth();
7486  // TODO: Relax this to "not wider than max legal integer type"?
7487  if (!DL.isLegalInteger(NumBits))
7488    return nullptr;
7489
7490  if (ICmpInst::isEquality(OuterPred) && InnerPred == ICmpInst::ICMP_NE) {
7491    auto *ScalarTy = Builder.getIntNTy(NumBits);
7492    LHS = Builder.CreateBitCast(LHS, ScalarTy, LHS->getName() + ".scalar");
7493    RHS = Builder.CreateBitCast(RHS, ScalarTy, RHS->getName() + ".scalar");
7494    return ICmpInst::Create(Instruction::ICmp, OuterPred, LHS, RHS,
7495                            I.getName());
7496  }
7497
7498  return nullptr;
7499}
7500
7501// This helper will be called with icmp operands in both orders.
// Folds that only need to consider one operand position; visitICmpInst calls
// it once with (Pred, Op0, Op1) and once with the swapped predicate/operands.
// NOTE(review): the first line of the signature (original line 7502) is
// elided in this extraction.
7503                                                 Value *Op0, Value *Op1,
7504                                                 ICmpInst &CxtI) {
7505  // Try to optimize 'icmp GEP, P' or 'icmp P, GEP'.
7506  if (auto *GEP = dyn_cast<GEPOperator>(Op0))
7507    if (Instruction *NI = foldGEPICmp(GEP, Op1, Pred, CxtI))
7508      return NI;
7509
7510  if (auto *SI = dyn_cast<SelectInst>(Op0))
7511    if (Instruction *NI = foldSelectICmp(Pred, SI, Op1, CxtI))
7512      return NI;
7513
7514  if (auto *MinMax = dyn_cast<MinMaxIntrinsic>(Op0))
7515    if (Instruction *Res = foldICmpWithMinMax(CxtI, MinMax, Op1, Pred))
7516      return Res;
7517
7518  {
7519    Value *X;
7520    const APInt *C;
7521    // icmp X+Cst, X
7522    if (match(Op0, m_Add(m_Value(X), m_APInt(C))) && Op1 == X)
7523      return foldICmpAddOpConst(X, *C, Pred);
7524  }
7525
7526  // abs(X) >= X --> true
7527  // abs(X) u<= X --> true
7528  // abs(X) < X --> false
7529  // abs(X) u> X --> false
7530  // abs(X) u>= X --> IsIntMinPosion ? `X > -1`: `X u<= INTMIN`
7531  // abs(X) <= X --> IsIntMinPosion ? `X > -1`: `X u<= INTMIN`
7532  // abs(X) == X --> IsIntMinPosion ? `X > -1`: `X u<= INTMIN`
7533  // abs(X) u< X --> IsIntMinPosion ? `X < 0` : `X > INTMIN`
7534  // abs(X) > X --> IsIntMinPosion ? `X < 0` : `X > INTMIN`
7535  // abs(X) != X --> IsIntMinPosion ? `X < 0` : `X > INTMIN`
7536  {
7537    Value *X;
7538    Constant *C;
7539    if (match(Op0, m_Intrinsic<Intrinsic::abs>(m_Value(X), m_Constant(C))) &&
7540        match(Op1, m_Specific(X))) {
7541      Value *NullValue = Constant::getNullValue(X->getType());
7542      Value *AllOnesValue = Constant::getAllOnesValue(X->getType());
7543      const APInt SMin =
7544          APInt::getSignedMinValue(X->getType()->getScalarSizeInBits());
      // Second abs() operand: true means INT_MIN input is poison. (Note the
      // existing 'Posion' spelling is kept — it is the variable's name.)
7545      bool IsIntMinPosion = C->isAllOnesValue();
7546      switch (Pred) {
7547      case CmpInst::ICMP_ULE:
7548      case CmpInst::ICMP_SGE:
7549        return replaceInstUsesWith(CxtI, ConstantInt::getTrue(CxtI.getType()));
7550      case CmpInst::ICMP_UGT:
7551      case CmpInst::ICMP_SLT:
        // NOTE(review): original line 7552 (the 'false' return for these two
        // cases) is elided in this extraction.
7553      case CmpInst::ICMP_UGE:
7554      case CmpInst::ICMP_SLE:
7555      case CmpInst::ICMP_EQ: {
7556        return replaceInstUsesWith(
7557            CxtI, IsIntMinPosion
7558                      ? Builder.CreateICmpSGT(X, AllOnesValue)
                      // NOTE(review): original line 7559 (the alternative
                      // builder call, presumably an unsigned compare) is
                      // elided in this extraction.
7560                            X, ConstantInt::get(X->getType(), SMin + 1)));
7561      }
7562      case CmpInst::ICMP_ULT:
7563      case CmpInst::ICMP_SGT:
7564      case CmpInst::ICMP_NE: {
7565        return replaceInstUsesWith(
7566            CxtI, IsIntMinPosion
7567                      ? Builder.CreateICmpSLT(X, NullValue)
                      // NOTE(review): original line 7568 (the alternative
                      // builder call) is elided in this extraction.
7569                            X, ConstantInt::get(X->getType(), SMin)));
7570      }
7571      default:
7572        llvm_unreachable("Invalid predicate!");
7573      }
7574    }
7575  }
7576
7577  const SimplifyQuery Q = SQ.getWithInstruction(&CxtI);
7578  if (Value *V = foldICmpWithLowBitMaskedVal(Pred, Op0, Op1, Q, *this))
7579    return replaceInstUsesWith(CxtI, V);
7580
7581  // Folding (X / Y) pred X => X swap(pred) 0 for constant Y other than 0 or 1
7582  auto CheckUGT1 = [](const APInt &Divisor) { return Divisor.ugt(1); };
7583  {
7584    if (match(Op0, m_UDiv(m_Specific(Op1), m_CheckedInt(CheckUGT1)))) {
7585      return new ICmpInst(ICmpInst::getSwappedPredicate(Pred), Op1,
                          // NOTE(review): original line 7586 (the zero
                          // constant operand) is elided in this extraction.
7587    }
7588
    // Signed division can flip the sign, so only non-unsigned predicates.
7589    if (!ICmpInst::isUnsigned(Pred) &&
7590        match(Op0, m_SDiv(m_Specific(Op1), m_CheckedInt(CheckUGT1)))) {
7591      return new ICmpInst(ICmpInst::getSwappedPredicate(Pred), Op1,
                          // NOTE(review): original line 7592 elided.
7593    }
7594  }
7595
7596  // Another case of this fold is (X >> Y) pred X => X swap(pred) 0 if Y != 0
7597  auto CheckNE0 = [](const APInt &Shift) { return !Shift.isZero(); };
7598  {
7599    if (match(Op0, m_LShr(m_Specific(Op1), m_CheckedInt(CheckNE0)))) {
7600      return new ICmpInst(ICmpInst::getSwappedPredicate(Pred), Op1,
                          // NOTE(review): original line 7601 elided.
7602    }
7603
    // Arithmetic shift preserves the sign, so only the sign-test predicates.
7604    if ((Pred == CmpInst::ICMP_SLT || Pred == CmpInst::ICMP_SGE) &&
7605        match(Op0, m_AShr(m_Specific(Op1), m_CheckedInt(CheckNE0)))) {
7606      return new ICmpInst(ICmpInst::getSwappedPredicate(Pred), Op1,
                          // NOTE(review): original line 7607 elided.
7608    }
7609  }
7610
7611  return nullptr;
7612}
7613
7615 bool Changed = false;
7617 Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
7618 unsigned Op0Cplxity = getComplexity(Op0);
7619 unsigned Op1Cplxity = getComplexity(Op1);
7620
7621 /// Orders the operands of the compare so that they are listed from most
7622 /// complex to least complex. This puts constants before unary operators,
7623 /// before binary operators.
7624 if (Op0Cplxity < Op1Cplxity) {
7625 I.swapOperands();
7626 std::swap(Op0, Op1);
7627 Changed = true;
7628 }
7629
7630 if (Value *V = simplifyICmpInst(I.getCmpPredicate(), Op0, Op1, Q))
7631 return replaceInstUsesWith(I, V);
7632
7633 // Comparing -val or val with non-zero is the same as just comparing val
7634 // ie, abs(val) != 0 -> val != 0
7635 if (I.getPredicate() == ICmpInst::ICMP_NE && match(Op1, m_Zero())) {
7636 Value *Cond, *SelectTrue, *SelectFalse;
7637 if (match(Op0, m_Select(m_Value(Cond), m_Value(SelectTrue),
7638 m_Value(SelectFalse)))) {
7639 if (Value *V = dyn_castNegVal(SelectTrue)) {
7640 if (V == SelectFalse)
7641 return CmpInst::Create(Instruction::ICmp, I.getPredicate(), V, Op1);
7642 } else if (Value *V = dyn_castNegVal(SelectFalse)) {
7643 if (V == SelectTrue)
7644 return CmpInst::Create(Instruction::ICmp, I.getPredicate(), V, Op1);
7645 }
7646 }
7647 }
7648
7650 return Res;
7651
7652 if (Op0->getType()->isIntOrIntVectorTy(1))
7654 return Res;
7655
7657 return Res;
7658
7660 return Res;
7661
7663 return Res;
7664
7666 return Res;
7667
7669 return Res;
7670
7672 return Res;
7673
7675 return Res;
7676
7677 // Test if the ICmpInst instruction is used exclusively by a select as
7678 // part of a minimum or maximum operation. If so, refrain from doing
7679 // any other folding. This helps out other analyses which understand
7680 // non-obfuscated minimum and maximum idioms, such as ScalarEvolution
7681 // and CodeGen. And in this case, at least one of the comparison
7682 // operands has at least one user besides the compare (the select),
7683 // which would often largely negate the benefit of folding anyway.
7684 //
7685 // Do the same for the other patterns recognized by matchSelectPattern.
7686 if (I.hasOneUse())
7687 if (SelectInst *SI = dyn_cast<SelectInst>(I.user_back())) {
7688 Value *A, *B;
7690 if (SPR.Flavor != SPF_UNKNOWN)
7691 return nullptr;
7692 }
7693
7694 // Do this after checking for min/max to prevent infinite looping.
7695 if (Instruction *Res = foldICmpWithZero(I))
7696 return Res;
7697
7698 // FIXME: We only do this after checking for min/max to prevent infinite
7699 // looping caused by a reverse canonicalization of these patterns for min/max.
7700 // FIXME: The organization of folds is a mess. These would naturally go into
7701 // canonicalizeCmpWithConstant(), but we can't move all of the above folds
7702 // down here after the min/max restriction.
7703 ICmpInst::Predicate Pred = I.getPredicate();
7704 const APInt *C;
7705 if (match(Op1, m_APInt(C))) {
7706 // For i32: x >u 2147483647 -> x <s 0 -> true if sign bit set
7707 if (Pred == ICmpInst::ICMP_UGT && C->isMaxSignedValue()) {
7708 Constant *Zero = Constant::getNullValue(Op0->getType());
7709 return new ICmpInst(ICmpInst::ICMP_SLT, Op0, Zero);
7710 }
7711
7712 // For i32: x <u 2147483648 -> x >s -1 -> true if sign bit clear
7713 if (Pred == ICmpInst::ICMP_ULT && C->isMinSignedValue()) {
7715 return new ICmpInst(ICmpInst::ICMP_SGT, Op0, AllOnes);
7716 }
7717 }
7718
7719 // The folds in here may rely on wrapping flags and special constants, so
7720 // they can break up min/max idioms in some cases but not seemingly similar
7721 // patterns.
7722 // FIXME: It may be possible to enhance select folding to make this
7723 // unnecessary. It may also be moot if we canonicalize to min/max
7724 // intrinsics.
7725 if (Instruction *Res = foldICmpBinOp(I, Q))
7726 return Res;
7727
7729 return Res;
7730
7731 // Try to match comparison as a sign bit test. Intentionally do this after
7732 // foldICmpInstWithConstant() to potentially let other folds to happen first.
7733 if (Instruction *New = foldSignBitTest(I))
7734 return New;
7735
7736 if (auto *PN = dyn_cast<PHINode>(Op0))
7737 if (Instruction *NV = foldOpIntoPhi(I, PN))
7738 return NV;
7739 if (auto *PN = dyn_cast<PHINode>(Op1))
7740 if (Instruction *NV = foldOpIntoPhi(I, PN))
7741 return NV;
7742
7744 return Res;
7745
7746 if (Instruction *Res = foldICmpCommutative(I.getCmpPredicate(), Op0, Op1, I))
7747 return Res;
7748 if (Instruction *Res =
7749 foldICmpCommutative(I.getSwappedCmpPredicate(), Op1, Op0, I))
7750 return Res;
7751
7752 if (I.isCommutative()) {
7753 if (auto Pair = matchSymmetricPair(I.getOperand(0), I.getOperand(1))) {
7754 replaceOperand(I, 0, Pair->first);
7755 replaceOperand(I, 1, Pair->second);
7756 return &I;
7757 }
7758 }
7759
7760 // In case of a comparison with two select instructions having the same
7761 // condition, check whether one of the resulting branches can be simplified.
7762 // If so, just compare the other branch and select the appropriate result.
7763 // For example:
7764 // %tmp1 = select i1 %cmp, i32 %y, i32 %x
7765 // %tmp2 = select i1 %cmp, i32 %z, i32 %x
7766 // %cmp2 = icmp slt i32 %tmp2, %tmp1
7767 // The icmp will result false for the false value of selects and the result
7768 // will depend upon the comparison of true values of selects if %cmp is
7769 // true. Thus, transform this into:
7770 // %cmp = icmp slt i32 %y, %z
7771 // %sel = select i1 %cond, i1 %cmp, i1 false
7772 // This handles similar cases to transform.
7773 {
7774 Value *Cond, *A, *B, *C, *D;
7775 if (match(Op0, m_Select(m_Value(Cond), m_Value(A), m_Value(B))) &&
7777 (Op0->hasOneUse() || Op1->hasOneUse())) {
7778 // Check whether comparison of TrueValues can be simplified
7779 if (Value *Res = simplifyICmpInst(Pred, A, C, SQ)) {
7780 Value *NewICMP = Builder.CreateICmp(Pred, B, D);
7781 return SelectInst::Create(Cond, Res, NewICMP);
7782 }
7783 // Check whether comparison of FalseValues can be simplified
7784 if (Value *Res = simplifyICmpInst(Pred, B, D, SQ)) {
7785 Value *NewICMP = Builder.CreateICmp(Pred, A, C);
7786 return SelectInst::Create(Cond, NewICMP, Res);
7787 }
7788 }
7789 }
7790
7791 // icmp slt (sub nsw x, y), (add nsw x, y) --> icmp sgt y, 0
7792 // icmp ult (sub nuw x, y), (add nuw x, y) --> icmp ugt y, 0
7793 // icmp eq (sub nsw/nuw x, y), (add nsw/nuw x, y) --> icmp eq y, 0
7794 {
7795 Value *A, *B;
7796 CmpPredicate CmpPred;
7797 if (match(&I, m_c_ICmp(CmpPred, m_Sub(m_Value(A), m_Value(B)),
7799 auto *I0 = cast<OverflowingBinaryOperator>(Op0);
7800 auto *I1 = cast<OverflowingBinaryOperator>(Op1);
7801 bool I0NUW = I0->hasNoUnsignedWrap();
7802 bool I1NUW = I1->hasNoUnsignedWrap();
7803 bool I0NSW = I0->hasNoSignedWrap();
7804 bool I1NSW = I1->hasNoSignedWrap();
7805 if ((ICmpInst::isUnsigned(Pred) && I0NUW && I1NUW) ||
7806 (ICmpInst::isSigned(Pred) && I0NSW && I1NSW) ||
7807 (ICmpInst::isEquality(Pred) &&
7808 ((I0NUW || I0NSW) && (I1NUW || I1NSW)))) {
7809 return new ICmpInst(CmpPredicate::getSwapped(CmpPred), B,
7810 ConstantInt::get(Op0->getType(), 0));
7811 }
7812 }
7813 }
7814
7815 // Try to optimize equality comparisons against alloca-based pointers.
7816 if (Op0->getType()->isPointerTy() && I.isEquality()) {
7817 assert(Op1->getType()->isPointerTy() &&
7818 "Comparing pointer with non-pointer?");
7819 if (auto *Alloca = dyn_cast<AllocaInst>(getUnderlyingObject(Op0)))
7820 if (foldAllocaCmp(Alloca))
7821 return nullptr;
7822 if (auto *Alloca = dyn_cast<AllocaInst>(getUnderlyingObject(Op1)))
7823 if (foldAllocaCmp(Alloca))
7824 return nullptr;
7825 }
7826
7827 if (Instruction *Res = foldICmpBitCast(I))
7828 return Res;
7829
7830 // TODO: Hoist this above the min/max bailout.
7832 return R;
7833
7834 {
7835 Value *X, *Y;
7836 // Transform (X & ~Y) == 0 --> (X & Y) != 0
7837 // and (X & ~Y) != 0 --> (X & Y) == 0
7838 // if A is a power of 2.
7839 if (match(Op0, m_And(m_Value(X), m_Not(m_Value(Y)))) &&
7840 match(Op1, m_Zero()) && isKnownToBeAPowerOfTwo(X, false, &I) &&
7841 I.isEquality())
7842 return new ICmpInst(I.getInversePredicate(), Builder.CreateAnd(X, Y),
7843 Op1);
7844
7845 // Op0 pred Op1 -> ~Op1 pred ~Op0, if this allows us to drop an instruction.
7846 if (Op0->getType()->isIntOrIntVectorTy()) {
7847 bool ConsumesOp0, ConsumesOp1;
7848 if (isFreeToInvert(Op0, Op0->hasOneUse(), ConsumesOp0) &&
7849 isFreeToInvert(Op1, Op1->hasOneUse(), ConsumesOp1) &&
7850 (ConsumesOp0 || ConsumesOp1)) {
7851 Value *InvOp0 = getFreelyInverted(Op0, Op0->hasOneUse(), &Builder);
7852 Value *InvOp1 = getFreelyInverted(Op1, Op1->hasOneUse(), &Builder);
7853 assert(InvOp0 && InvOp1 &&
7854 "Mismatch between isFreeToInvert and getFreelyInverted");
7855 return new ICmpInst(I.getSwappedPredicate(), InvOp0, InvOp1);
7856 }
7857 }
7858
7859 Instruction *AddI = nullptr;
7861 m_Instruction(AddI))) &&
7862 isa<IntegerType>(X->getType())) {
7863 Value *Result;
7864 Constant *Overflow;
7865 // m_UAddWithOverflow can match patterns that do not include an explicit
7866 // "add" instruction, so check the opcode of the matched op.
7867 if (AddI->getOpcode() == Instruction::Add &&
7868 OptimizeOverflowCheck(Instruction::Add, /*Signed*/ false, X, Y, *AddI,
7869 Result, Overflow)) {
7870 replaceInstUsesWith(*AddI, Result);
7871 eraseInstFromFunction(*AddI);
7872 return replaceInstUsesWith(I, Overflow);
7873 }
7874 }
7875
7876 // (zext X) * (zext Y) --> llvm.umul.with.overflow.
7877 if (match(Op0, m_NUWMul(m_ZExt(m_Value(X)), m_ZExt(m_Value(Y)))) &&
7878 match(Op1, m_APInt(C))) {
7879 if (Instruction *R = processUMulZExtIdiom(I, Op0, C, *this))
7880 return R;
7881 }
7882
7883 // Signbit test folds
7884 // Fold (X u>> BitWidth - 1 Pred ZExt(i1)) --> X s< 0 Pred i1
7885 // Fold (X s>> BitWidth - 1 Pred SExt(i1)) --> X s< 0 Pred i1
7886 Instruction *ExtI;
7887 if ((I.isUnsigned() || I.isEquality()) &&
7888 match(Op1,
7890 Y->getType()->getScalarSizeInBits() == 1 &&
7891 (Op0->hasOneUse() || Op1->hasOneUse())) {
7892 unsigned OpWidth = Op0->getType()->getScalarSizeInBits();
7893 Instruction *ShiftI;
7894 if (match(Op0, m_CombineAnd(m_Instruction(ShiftI),
7896 OpWidth - 1))))) {
7897 unsigned ExtOpc = ExtI->getOpcode();
7898 unsigned ShiftOpc = ShiftI->getOpcode();
7899 if ((ExtOpc == Instruction::ZExt && ShiftOpc == Instruction::LShr) ||
7900 (ExtOpc == Instruction::SExt && ShiftOpc == Instruction::AShr)) {
7901 Value *SLTZero =
7903 Value *Cmp = Builder.CreateICmp(Pred, SLTZero, Y, I.getName());
7904 return replaceInstUsesWith(I, Cmp);
7905 }
7906 }
7907 }
7908 }
7909
7910 if (Instruction *Res = foldICmpEquality(I))
7911 return Res;
7912
7914 return Res;
7915
7916 if (Instruction *Res = foldICmpOfUAddOv(I))
7917 return Res;
7918
7919 // The 'cmpxchg' instruction returns an aggregate containing the old value and
7920 // an i1 which indicates whether or not we successfully did the swap.
7921 //
7922 // Replace comparisons between the old value and the expected value with the
7923 // indicator that 'cmpxchg' returns.
7924 //
7925 // N.B. This transform is only valid when the 'cmpxchg' is not permitted to
7926 // spuriously fail. In those cases, the old value may equal the expected
7927 // value but it is possible for the swap to not occur.
7928 if (I.getPredicate() == ICmpInst::ICMP_EQ)
7929 if (auto *EVI = dyn_cast<ExtractValueInst>(Op0))
7930 if (auto *ACXI = dyn_cast<AtomicCmpXchgInst>(EVI->getAggregateOperand()))
7931 if (EVI->getIndices()[0] == 0 && ACXI->getCompareOperand() == Op1 &&
7932 !ACXI->isWeak())
7933 return ExtractValueInst::Create(ACXI, 1);
7934
7936 return Res;
7937
7938 if (I.getType()->isVectorTy())
7939 if (Instruction *Res = foldVectorCmp(I, Builder))
7940 return Res;
7941
7943 return Res;
7944
7946 return Res;
7947
7948 {
7949 Value *A;
7950 const APInt *C1, *C2;
7951 ICmpInst::Predicate Pred = I.getPredicate();
7952 if (ICmpInst::isEquality(Pred)) {
7953 // sext(a) & c1 == c2 --> a & c3 == trunc(c2)
7954 // sext(a) & c1 != c2 --> a & c3 != trunc(c2)
7955 if (match(Op0, m_And(m_SExt(m_Value(A)), m_APInt(C1))) &&
7956 match(Op1, m_APInt(C2))) {
7957 Type *InputTy = A->getType();
7958 unsigned InputBitWidth = InputTy->getScalarSizeInBits();
7959 // c2 must be non-negative at the bitwidth of a.
7960 if (C2->getActiveBits() < InputBitWidth) {
7961 APInt TruncC1 = C1->trunc(InputBitWidth);
7962 // Check if there are 1s in C1 high bits of size InputBitWidth.
7963 if (C1->uge(APInt::getOneBitSet(C1->getBitWidth(), InputBitWidth)))
7964 TruncC1.setBit(InputBitWidth - 1);
7965 Value *AndInst = Builder.CreateAnd(A, TruncC1);
7966 return new ICmpInst(
7967 Pred, AndInst,
7968 ConstantInt::get(InputTy, C2->trunc(InputBitWidth)));
7969 }
7970 }
7971 }
7972 }
7973
7974 return Changed ? &I : nullptr;
7975}
7976
7977/// Fold fcmp ([us]itofp x, cst) if possible.
// NOTE(review): the opening line of this definition (function name and first
// parameter, original line 7978) is missing from this extraction; the text
// below begins mid-signature. Restore from the original source before use.
// Strategy (from the visible body): map the FP compare of an integer->FP
// conversion to an equivalent integer compare of the conversion's source,
// bailing out whenever rounding during the conversion could change the result.
7979 Instruction *LHSI,
7980 Constant *RHSC) {
7981 const APFloat *RHS;
7982 if (!match(RHSC, m_APFloat(RHS)))
7983 return nullptr;
7984
7985 // Get the width of the mantissa. We don't want to hack on conversions that
7986 // might lose information from the integer, e.g. "i64 -> float"
7987 int MantissaWidth = LHSI->getType()->getFPMantissaWidth();
7988 if (MantissaWidth == -1)
7989 return nullptr; // Unknown.
7990
7991 Type *IntTy = LHSI->getOperand(0)->getType();
7992 unsigned IntWidth = IntTy->getScalarSizeInBits();
7993 bool LHSUnsigned = isa<UIToFPInst>(LHSI);
7994
7995 if (I.isEquality()) {
7996 FCmpInst::Predicate P = I.getPredicate();
7997 bool IsExact = false;
7998 APSInt RHSCvt(IntWidth, LHSUnsigned);
7999 RHS->convertToInteger(RHSCvt, APFloat::rmNearestTiesToEven, &IsExact);
8000
8001 // If the floating point constant isn't an integer value, we know if we will
8002 // ever compare equal / not equal to it.
8003 if (!IsExact) {
8004 // TODO: Can never be -0.0 and other non-representable values
8005 APFloat RHSRoundInt(*RHS);
// NOTE(review): lines are missing here in this extraction (presumably the
// roundToIntegral call on RHSRoundInt and the equality/inequality predicate
// checks guarding the two returns below) — confirm against the original.
8007 if (*RHS != RHSRoundInt) {
8009 return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
8010
8012 return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));
8013 }
8014 }
8015
8016 // TODO: If the constant is exactly representable, is it always OK to do
8017 // equality compares as integer?
8018 }
8019
8020 // Check to see that the input is converted from an integer type that is small
8021 // enough that preserves all bits. TODO: check here for "known" sign bits.
8022 // This would allow us to handle (fptosi (x >>s 62) to float) if x is i64 f.e.
8023
8024 // Following test does NOT adjust IntWidth downwards for signed inputs,
8025 // because the most negative value still requires all the mantissa bits
8026 // to distinguish it from one less than that value.
8027 if ((int)IntWidth > MantissaWidth) {
8028 // Conversion would lose accuracy. Check if loss can impact comparison.
8029 int Exp = ilogb(*RHS);
8030 if (Exp == APFloat::IEK_Inf) {
8031 int MaxExponent = ilogb(APFloat::getLargest(RHS->getSemantics()));
8032 if (MaxExponent < (int)IntWidth - !LHSUnsigned)
8033 // Conversion could create infinity.
8034 return nullptr;
8035 } else {
8036 // Note that if RHS is zero or NaN, then Exp is negative
8037 // and first condition is trivially false.
8038 if (MantissaWidth <= Exp && Exp <= (int)IntWidth - !LHSUnsigned)
8039 // Conversion could affect comparison.
8040 return nullptr;
8041 }
8042 }
8043
8044 // Otherwise, we can potentially simplify the comparison. We know that it
8045 // will always come through as an integer value and we know the constant is
8046 // not a NAN (it would have been previously simplified).
8047 assert(!RHS->isNaN() && "NaN comparison not already folded!");
8048
// NOTE(review): the declaration of Pred (an ICmpInst::Predicate, original
// line 8049) is missing from this extraction; every arm of the switch below
// assigns it and the final return consumes it.
8050 switch (I.getPredicate()) {
8051 default:
8052 llvm_unreachable("Unexpected predicate!");
8053 case FCmpInst::FCMP_UEQ:
8054 case FCmpInst::FCMP_OEQ:
8055 Pred = ICmpInst::ICMP_EQ;
8056 break;
8057 case FCmpInst::FCMP_UGT:
8058 case FCmpInst::FCMP_OGT:
8059 Pred = LHSUnsigned ? ICmpInst::ICMP_UGT : ICmpInst::ICMP_SGT;
8060 break;
8061 case FCmpInst::FCMP_UGE:
8062 case FCmpInst::FCMP_OGE:
8063 Pred = LHSUnsigned ? ICmpInst::ICMP_UGE : ICmpInst::ICMP_SGE;
8064 break;
8065 case FCmpInst::FCMP_ULT:
8066 case FCmpInst::FCMP_OLT:
8067 Pred = LHSUnsigned ? ICmpInst::ICMP_ULT : ICmpInst::ICMP_SLT;
8068 break;
8069 case FCmpInst::FCMP_ULE:
8070 case FCmpInst::FCMP_OLE:
8071 Pred = LHSUnsigned ? ICmpInst::ICMP_ULE : ICmpInst::ICMP_SLE;
8072 break;
8073 case FCmpInst::FCMP_UNE:
8074 case FCmpInst::FCMP_ONE:
8075 Pred = ICmpInst::ICMP_NE;
8076 break;
8077 case FCmpInst::FCMP_ORD:
8078 return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));
8079 case FCmpInst::FCMP_UNO:
8080 return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
8081 }
8082
8083 // Now we know that the APFloat is a normal number, zero or inf.
8084
8085 // See if the FP constant is too large for the integer. For example,
8086 // comparing an i8 to 300.0.
8087 if (!LHSUnsigned) {
8088 // If the RHS value is > SignedMax, fold the comparison. This handles +INF
8089 // and large values.
8090 APFloat SMax(RHS->getSemantics());
// NOTE(review): the continuation lines carrying the rounding-mode argument to
// the four convertFromAPInt calls below (original lines 8092/8104/8117/8128)
// are missing from this extraction.
8091 SMax.convertFromAPInt(APInt::getSignedMaxValue(IntWidth), true,
8093 if (SMax < *RHS) { // smax < 13123.0
8094 if (Pred == ICmpInst::ICMP_NE || Pred == ICmpInst::ICMP_SLT ||
8095 Pred == ICmpInst::ICMP_SLE)
8096 return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));
8097 return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
8098 }
8099 } else {
8100 // If the RHS value is > UnsignedMax, fold the comparison. This handles
8101 // +INF and large values.
8102 APFloat UMax(RHS->getSemantics());
8103 UMax.convertFromAPInt(APInt::getMaxValue(IntWidth), false,
8105 if (UMax < *RHS) { // umax < 13123.0
8106 if (Pred == ICmpInst::ICMP_NE || Pred == ICmpInst::ICMP_ULT ||
8107 Pred == ICmpInst::ICMP_ULE)
8108 return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));
8109 return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
8110 }
8111 }
8112
8113 if (!LHSUnsigned) {
8114 // See if the RHS value is < SignedMin.
8115 APFloat SMin(RHS->getSemantics());
8116 SMin.convertFromAPInt(APInt::getSignedMinValue(IntWidth), true,
8118 if (SMin > *RHS) { // smin > 12312.0
8119 if (Pred == ICmpInst::ICMP_NE || Pred == ICmpInst::ICMP_SGT ||
8120 Pred == ICmpInst::ICMP_SGE)
8121 return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));
8122 return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
8123 }
8124 } else {
8125 // See if the RHS value is < UnsignedMin.
8126 APFloat UMin(RHS->getSemantics());
8127 UMin.convertFromAPInt(APInt::getMinValue(IntWidth), false,
8129 if (UMin > *RHS) { // umin > 12312.0
8130 if (Pred == ICmpInst::ICMP_NE || Pred == ICmpInst::ICMP_UGT ||
8131 Pred == ICmpInst::ICMP_UGE)
8132 return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));
8133 return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
8134 }
8135 }
8136
8137 // Okay, now we know that the FP constant fits in the range [SMIN, SMAX] or
8138 // [0, UMAX], but it may still be fractional. Check whether this is the case
8139 // using the IsExact flag.
8140 // Don't do this for zero, because -0.0 is not fractional.
8141 APSInt RHSInt(IntWidth, LHSUnsigned);
8142 bool IsExact;
8143 RHS->convertToInteger(RHSInt, APFloat::rmTowardZero, &IsExact);
8144 if (!RHS->isZero()) {
8145 if (!IsExact) {
8146 // If we had a comparison against a fractional value, we have to adjust
8147 // the compare predicate and sometimes the value. RHSC is rounded towards
8148 // zero at this point.
8149 switch (Pred) {
8150 default:
8151 llvm_unreachable("Unexpected integer comparison!");
8152 case ICmpInst::ICMP_NE: // (float)int != 4.4 --> true
8153 return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));
8154 case ICmpInst::ICMP_EQ: // (float)int == 4.4 --> false
8155 return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
8156 case ICmpInst::ICMP_ULE:
8157 // (float)int <= 4.4 --> int <= 4
8158 // (float)int <= -4.4 --> false
8159 if (RHS->isNegative())
8160 return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
8161 break;
8162 case ICmpInst::ICMP_SLE:
8163 // (float)int <= 4.4 --> int <= 4
8164 // (float)int <= -4.4 --> int < -4
8165 if (RHS->isNegative())
8166 Pred = ICmpInst::ICMP_SLT;
8167 break;
8168 case ICmpInst::ICMP_ULT:
8169 // (float)int < -4.4 --> false
8170 // (float)int < 4.4 --> int <= 4
8171 if (RHS->isNegative())
8172 return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
8173 Pred = ICmpInst::ICMP_ULE;
8174 break;
8175 case ICmpInst::ICMP_SLT:
8176 // (float)int < -4.4 --> int < -4
8177 // (float)int < 4.4 --> int <= 4
8178 if (!RHS->isNegative())
8179 Pred = ICmpInst::ICMP_SLE;
8180 break;
8181 case ICmpInst::ICMP_UGT:
8182 // (float)int > 4.4 --> int > 4
8183 // (float)int > -4.4 --> true
8184 if (RHS->isNegative())
8185 return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));
8186 break;
8187 case ICmpInst::ICMP_SGT:
8188 // (float)int > 4.4 --> int > 4
8189 // (float)int > -4.4 --> int >= -4
8190 if (RHS->isNegative())
8191 Pred = ICmpInst::ICMP_SGE;
8192 break;
8193 case ICmpInst::ICMP_UGE:
8194 // (float)int >= -4.4 --> true
8195 // (float)int >= 4.4 --> int > 4
8196 if (RHS->isNegative())
8197 return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));
8198 Pred = ICmpInst::ICMP_UGT;
8199 break;
8200 case ICmpInst::ICMP_SGE:
8201 // (float)int >= -4.4 --> int >= -4
8202 // (float)int >= 4.4 --> int > 4
8203 if (!RHS->isNegative())
8204 Pred = ICmpInst::ICMP_SGT;
8205 break;
8206 }
8207 }
8208 }
8209
8210 // Lower this FP comparison into an appropriate integer version of the
8211 // comparison.
8212 return new ICmpInst(Pred, LHSI->getOperand(0),
8213 ConstantInt::get(LHSI->getOperand(0)->getType(), RHSInt));
8214}
8215
8216/// Fold (C / X) < 0.0 --> X < 0.0 if possible. Swap predicate if necessary.
// NOTE(review): the opening line of this definition (function name, the FCmpInst
// &I and Instruction *LHSI parameters, original line 8217) is missing from this
// extraction — both names are used in the body below. Restore before use.
// Returns the replacement FCmpInst, or nullptr when the fold does not apply.
8218 Constant *RHSC) {
8219 // When C is not 0.0 and infinities are not allowed:
8220 // (C / X) < 0.0 is a sign-bit test of X
8221 // (C / X) < 0.0 --> X < 0.0 (if C is positive)
8222 // (C / X) < 0.0 --> X > 0.0 (if C is negative, swap the predicate)
8223 //
8224 // Proof:
8225 // Multiply (C / X) < 0.0 by X * X / C.
8226 // - X is non zero, if it is the flag 'ninf' is violated.
8227 // - C defines the sign of X * X * C. Thus it also defines whether to swap
8228 // the predicate. C is also non zero by definition.
8229 //
8230 // Thus X * X / C is non zero and the transformation is valid. [qed]
8231
8232 FCmpInst::Predicate Pred = I.getPredicate();
8233
8234 // Check that predicates are valid.
// Only the four ordered relational predicates participate in this fold.
8235 if ((Pred != FCmpInst::FCMP_OGT) && (Pred != FCmpInst::FCMP_OLT) &&
8236 (Pred != FCmpInst::FCMP_OGE) && (Pred != FCmpInst::FCMP_OLE))
8237 return nullptr;
8238
8239 // Check that RHS operand is zero.
// m_AnyZeroFP accepts both +0.0 and -0.0 here.
8240 if (!match(RHSC, m_AnyZeroFP()))
8241 return nullptr;
8242
8243 // Check fastmath flags ('ninf').
// Both the fdiv and the compare must carry 'ninf' (see Proof above).
8244 if (!LHSI->hasNoInfs() || !I.hasNoInfs())
8245 return nullptr;
8246
8247 // Check the properties of the dividend. It must not be zero to avoid a
8248 // division by zero (see Proof).
8249 const APFloat *C;
8250 if (!match(LHSI->getOperand(0), m_APFloat(C)))
8251 return nullptr;
8252
8253 if (C->isZero())
8254 return nullptr;
8255
8256 // Get swapped predicate if necessary.
// A negative dividend flips the sign of the quotient, so flip the compare.
8257 if (C->isNegative())
8258 Pred = I.getSwappedPredicate();
8259
// Compare the divisor X (operand 1 of the fdiv) directly against the zero.
8260 return new FCmpInst(Pred, LHSI->getOperand(1), RHSC, "", &I);
8261}
8262
8263// Transform 'fptrunc(x) cmp C' to 'x cmp ext(C)' if possible.
8264// Patterns include:
8265// fptrunc(x) < C --> x < ext(C)
8266// fptrunc(x) <= C --> x <= ext(C)
8267// fptrunc(x) > C --> x > ext(C)
8268// fptrunc(x) >= C --> x >= ext(C)
8269// where 'ext(C)' is the extension of 'C' to the type of 'x' with a small bias
8270// due to precision loss.
// NOTE(review): the opening line of this definition (function name, the
// FCmpInst &I and const Instruction &FPTrunc parameters, original line 8271)
// is missing from this extraction — both names are used below. Restore it.
// Returns the widened-compare replacement, or nullptr when unsafe.
8272 const Constant &C) {
8273 FCmpInst::Predicate Pred = I.getPredicate();
// RoundDown selects on which side of C the threshold must be biased so the
// truncated result still compares the same way.
8274 bool RoundDown = false;
8275
8276 if (Pred == FCmpInst::FCMP_OGE || Pred == FCmpInst::FCMP_UGE ||
8277 Pred == FCmpInst::FCMP_OLT || Pred == FCmpInst::FCMP_ULT)
8278 RoundDown = true;
8279 else if (Pred == FCmpInst::FCMP_OGT || Pred == FCmpInst::FCMP_UGT ||
8280 Pred == FCmpInst::FCMP_OLE || Pred == FCmpInst::FCMP_ULE)
8281 RoundDown = false;
8282 else
8283 return nullptr;
8284
8285 const APFloat *CValue;
8286 if (!match(&C, m_APFloat(CValue)))
8287 return nullptr;
8288
// NaN/Inf thresholds are excluded; the neighbor/bias arithmetic below assumes
// a finite constant.
8289 if (CValue->isNaN() || CValue->isInfinity())
8290 return nullptr;
8291
// Helper: convert Src into the given float semantics (round-to-nearest-even).
8292 auto ConvertFltSema = [](const APFloat &Src, const fltSemantics &Sema) {
8293 bool LosesInfo;
8294 APFloat Dest = Src;
8295 Dest.convert(Sema, APFloat::rmNearestTiesToEven, &LosesInfo);
8296 return Dest;
8297 };
8298
// Helper: the adjacent representable value below (RoundDown) or above Value.
8299 auto NextValue = [](const APFloat &Value, bool RoundDown) {
8300 APFloat NextValue = Value;
8301 NextValue.next(RoundDown);
8302 return NextValue;
8303 };
8304
8305 APFloat NextCValue = NextValue(*CValue, RoundDown);
8306
8307 Type *DestType = FPTrunc.getOperand(0)->getType();
8308 const fltSemantics &DestFltSema =
8309 DestType->getScalarType()->getFltSemantics();
8310
8311 APFloat ExtCValue = ConvertFltSema(*CValue, DestFltSema);
8312 APFloat ExtNextCValue = ConvertFltSema(NextCValue, DestFltSema);
8313
8314 // When 'NextCValue' is infinity, use an imaged 'NextCValue' that equals
8315 // 'CValue + bias' to avoid the infinity after conversion. The bias is
8316 // estimated as 'CValue - PrevCValue', where 'PrevCValue' is the previous
8317 // value of 'CValue'.
8318 if (NextCValue.isInfinity()) {
8319 APFloat PrevCValue = NextValue(*CValue, !RoundDown);
8320 APFloat Bias = ConvertFltSema(*CValue - PrevCValue, DestFltSema);
8321
8322 ExtNextCValue = ExtCValue + Bias;
8323 }
8324
// Midpoint between C and its neighbor, computed in the wide type: scalbn(x,-1)
// halves the sum without overflow.
8325 APFloat ExtMidValue =
8326 scalbn(ExtCValue + ExtNextCValue, -1, APFloat::rmNearestTiesToEven);
8327
8328 const fltSemantics &SrcFltSema =
8329 C.getType()->getScalarType()->getFltSemantics();
8330
8331 // 'MidValue' might be rounded to 'NextCValue'. Correct it here.
8332 APFloat MidValue = ConvertFltSema(ExtMidValue, SrcFltSema);
8333 if (MidValue != *CValue)
8334 ExtMidValue.next(!RoundDown);
8335
8336 // Check whether 'ExtMidValue' is a valid result since the assumption on
8337 // imaged 'NextCValue' might not hold for new float types.
8338 // ppc_fp128 can't pass here when converting from max float because of
8339 // APFloat implementation.
8340 if (NextCValue.isInfinity()) {
8341 // ExtMidValue --- narrowed ---> Finite
8342 if (ConvertFltSema(ExtMidValue, SrcFltSema).isInfinity())
8343 return nullptr;
8344
8345 // NextExtMidValue --- narrowed ---> Infinity
8346 APFloat NextExtMidValue = NextValue(ExtMidValue, RoundDown);
8347 if (ConvertFltSema(NextExtMidValue, SrcFltSema).isFinite())
8348 return nullptr;
8349 }
8350
// Compare the untruncated source against the adjusted wide-type threshold.
8351 return new FCmpInst(Pred, FPTrunc.getOperand(0),
8352 ConstantFP::get(DestType, ExtMidValue), "", &I);
8353}
8354
8355/// Optimize fabs(X) compared with zero.
// NOTE(review): the opening line of this definition (function name, the
// FCmpInst &I and InstCombinerImpl &IC parameters, original line 8356) is
// missing from this extraction — both names are used in the body. Restore it.
// Handles two constant RHS cases: the smallest normalized value (under
// denormal-flushing modes) and +0.0. Returns nullptr when no fold applies.
8357 Value *X;
8358 if (!match(I.getOperand(0), m_FAbs(m_Value(X))))
8359 return nullptr;
8360
8361 const APFloat *C;
8362 if (!match(I.getOperand(1), m_APFloat(C)))
8363 return nullptr;
8364
8365 if (!C->isPosZero()) {
// Non-zero RHS: only the smallest normalized constant is interesting.
8366 if (!C->isSmallestNormalized())
8367 return nullptr;
8368
// Under PreserveSign/PositiveZero input denormal handling, denormal inputs
// are treated as zero, so |x| < smallest-normal collapses to x == 0.
8369 const Function *F = I.getFunction();
8370 DenormalMode Mode = F->getDenormalMode(C->getSemantics());
8371 if (Mode.Input == DenormalMode::PreserveSign ||
8372 Mode.Input == DenormalMode::PositiveZero) {
8373
8374 auto replaceFCmp = [](FCmpInst *I, FCmpInst::Predicate P, Value *X) {
8375 Constant *Zero = ConstantFP::getZero(X->getType());
8376 return new FCmpInst(P, X, Zero, "", I);
8377 };
8378
8379 switch (I.getPredicate()) {
8380 case FCmpInst::FCMP_OLT:
8381 // fcmp olt fabs(x), smallest_normalized_number -> fcmp oeq x, 0.0
8382 return replaceFCmp(&I, FCmpInst::FCMP_OEQ, X);
8383 case FCmpInst::FCMP_UGE:
8384 // fcmp uge fabs(x), smallest_normalized_number -> fcmp une x, 0.0
8385 return replaceFCmp(&I, FCmpInst::FCMP_UNE, X);
8386 case FCmpInst::FCMP_OGE:
8387 // fcmp oge fabs(x), smallest_normalized_number -> fcmp one x, 0.0
8388 return replaceFCmp(&I, FCmpInst::FCMP_ONE, X);
8389 case FCmpInst::FCMP_ULT:
8390 // fcmp ult fabs(x), smallest_normalized_number -> fcmp ueq x, 0.0
8391 return replaceFCmp(&I, FCmpInst::FCMP_UEQ, X);
8392 default:
8393 break;
8394 }
8395 }
8396
8397 return nullptr;
8398 }
8399
// RHS is +0.0 from here on: rewrite the compare in place to look through fabs.
8400 auto replacePredAndOp0 = [&IC](FCmpInst *I, FCmpInst::Predicate P, Value *X) {
8401 I->setPredicate(P);
8402 return IC.replaceOperand(*I, 0, X);
8403 };
8404
8405 switch (I.getPredicate()) {
8406 case FCmpInst::FCMP_UGE:
8407 case FCmpInst::FCMP_OLT:
8408 // fabs(X) >= 0.0 --> true
8409 // fabs(X) < 0.0 --> false
8410 llvm_unreachable("fcmp should have simplified");
8411
8412 case FCmpInst::FCMP_OGT:
8413 // fabs(X) > 0.0 --> X != 0.0
8414 return replacePredAndOp0(&I, FCmpInst::FCMP_ONE, X);
8415
8416 case FCmpInst::FCMP_UGT:
8417 // fabs(X) u> 0.0 --> X u!= 0.0
8418 return replacePredAndOp0(&I, FCmpInst::FCMP_UNE, X);
8419
8420 case FCmpInst::FCMP_OLE:
8421 // fabs(X) <= 0.0 --> X == 0.0
8422 return replacePredAndOp0(&I, FCmpInst::FCMP_OEQ, X);
8423
8424 case FCmpInst::FCMP_ULE:
8425 // fabs(X) u<= 0.0 --> X u== 0.0
8426 return replacePredAndOp0(&I, FCmpInst::FCMP_UEQ, X);
8427
8428 case FCmpInst::FCMP_OGE:
8429 // fabs(X) >= 0.0 --> !isnan(X)
8430 assert(!I.hasNoNaNs() && "fcmp should have simplified");
8431 return replacePredAndOp0(&I, FCmpInst::FCMP_ORD, X);
8432
8433 case FCmpInst::FCMP_ULT:
8434 // fabs(X) u< 0.0 --> isnan(X)
8435 assert(!I.hasNoNaNs() && "fcmp should have simplified");
8436 return replacePredAndOp0(&I, FCmpInst::FCMP_UNO, X);
8437
8438 case FCmpInst::FCMP_OEQ:
8439 case FCmpInst::FCMP_UEQ:
8440 case FCmpInst::FCMP_ONE:
8441 case FCmpInst::FCMP_UNE:
8442 case FCmpInst::FCMP_ORD:
8443 case FCmpInst::FCMP_UNO:
8444 // Look through the fabs() because it doesn't change anything but the sign.
8445 // fabs(X) == 0.0 --> X == 0.0,
8446 // fabs(X) != 0.0 --> X != 0.0
8447 // isnan(fabs(X)) --> isnan(X)
8448 // !isnan(fabs(X) --> !isnan(X)
8449 return replacePredAndOp0(&I, I.getPredicate(), X);
8450
8451 default:
8452 return nullptr;
8453 }
8454}
8455
8456/// Optimize sqrt(X) compared with zero.
// NOTE(review): the opening line of this definition (function name, the
// FCmpInst &I and InstCombinerImpl &IC parameters, original line 8457) is
// missing from this extraction — both names are used below. Restore it.
// Valid because sqrt preserves the ordering/zero-ness/NaN-ness of its input
// relative to zero. Only a +0.0 RHS is handled.
8458 Value *X;
8459 if (!match(I.getOperand(0), m_Sqrt(m_Value(X))))
8460 return nullptr;
8461
8462 if (!match(I.getOperand(1), m_PosZeroFP()))
8463 return nullptr;
8464
// Rewrite the compare in place: new predicate, X instead of sqrt(X).
8465 auto ReplacePredAndOp0 = [&](FCmpInst::Predicate P) {
8466 I.setPredicate(P);
8467 return IC.replaceOperand(I, 0, X);
8468 };
8469
8470 // Clear ninf flag if sqrt doesn't have it.
// After dropping sqrt, the compare may see values the sqrt call never
// produced, so it cannot keep a stronger 'ninf' than the sqrt had.
8471 if (!cast<Instruction>(I.getOperand(0))->hasNoInfs())
8472 I.setHasNoInfs(false);
8473
8474 switch (I.getPredicate()) {
8475 case FCmpInst::FCMP_OLT:
8476 case FCmpInst::FCMP_UGE:
8477 // sqrt(X) < 0.0 --> false
8478 // sqrt(X) u>= 0.0 --> true
8479 llvm_unreachable("fcmp should have simplified");
8480 case FCmpInst::FCMP_ULT:
8481 case FCmpInst::FCMP_ULE:
8482 case FCmpInst::FCMP_OGT:
8483 case FCmpInst::FCMP_OGE:
8484 case FCmpInst::FCMP_OEQ:
8485 case FCmpInst::FCMP_UNE:
8486 // sqrt(X) u< 0.0 --> X u< 0.0
8487 // sqrt(X) u<= 0.0 --> X u<= 0.0
8488 // sqrt(X) > 0.0 --> X > 0.0
8489 // sqrt(X) >= 0.0 --> X >= 0.0
8490 // sqrt(X) == 0.0 --> X == 0.0
8491 // sqrt(X) u!= 0.0 --> X u!= 0.0
8492 return IC.replaceOperand(I, 0, X);
8493
8494 case FCmpInst::FCMP_OLE:
8495 // sqrt(X) <= 0.0 --> X == 0.0
8496 return ReplacePredAndOp0(FCmpInst::FCMP_OEQ);
8497 case FCmpInst::FCMP_UGT:
8498 // sqrt(X) u> 0.0 --> X u!= 0.0
8499 return ReplacePredAndOp0(FCmpInst::FCMP_UNE);
8500 case FCmpInst::FCMP_UEQ:
8501 // sqrt(X) u== 0.0 --> X u<= 0.0
8502 return ReplacePredAndOp0(FCmpInst::FCMP_ULE);
8503 case FCmpInst::FCMP_ONE:
8504 // sqrt(X) != 0.0 --> X > 0.0
8505 return ReplacePredAndOp0(FCmpInst::FCMP_OGT);
8506 case FCmpInst::FCMP_ORD:
8507 // !isnan(sqrt(X)) --> X >= 0.0
8508 return ReplacePredAndOp0(FCmpInst::FCMP_OGE);
8509 case FCmpInst::FCMP_UNO:
8510 // isnan(sqrt(X)) --> X u< 0.0
8511 return ReplacePredAndOp0(FCmpInst::FCMP_ULT);
8512 default:
8513 llvm_unreachable("Unexpected predicate!");
8514 }
8515}
8516
// NOTE(review): the opening line of this definition (original line 8517, the
// function name and FCmpInst &I parameter) is missing from this extraction;
// the body begins directly below. Restore it before use.
// Purpose (from the body): fold 'fcmp Pred Op0, -Op0' by replacing the negated
// operand with +0.0, canonicalizing the fneg to the RHS first.
8518 CmpInst::Predicate Pred = I.getPredicate();
8519 Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
8520
8521 // Canonicalize fneg as Op1.
8522 if (match(Op0, m_FNeg(m_Value())) && !match(Op1, m_FNeg(m_Value()))) {
8523 std::swap(Op0, Op1);
8524 Pred = I.getSwappedPredicate();
8525 }
8526
// Require the RHS to be exactly the negation of the LHS value.
8527 if (!match(Op1, m_FNeg(m_Specific(Op0))))
8528 return nullptr;
8529
8530 // Replace the negated operand with 0.0:
8531 // fcmp Pred Op0, -Op0 --> fcmp Pred Op0, 0.0
8532 Constant *Zero = ConstantFP::getZero(Op0->getType());
8533 return new FCmpInst(Pred, Op0, Zero, "", &I);
8534}
8535
// NOTE(review): the opening line of this definition (original line 8536, the
// function name and the FCmpInst &I / Instruction *LHSI parameters) is missing
// from this extraction; the text begins mid-signature. Restore it before use.
// Purpose (from the body): fold 'fcmp pred (fsub x, y), 0' to 'fcmp pred x, y'
// when the predicate and flags make that safe.
8537 Constant *RHSC, InstCombinerImpl &CI) {
8538 const CmpInst::Predicate Pred = I.getPredicate();
8539 Value *X = LHSI->getOperand(0);
8540 Value *Y = LHSI->getOperand(1);
8541 switch (Pred) {
8542 default:
8543 break;
8544 case FCmpInst::FCMP_UGT:
8545 case FCmpInst::FCMP_ULT:
8546 case FCmpInst::FCMP_UNE:
8547 case FCmpInst::FCMP_OEQ:
8548 case FCmpInst::FCMP_OGE:
8549 case FCmpInst::FCMP_OLE:
8550 // The optimization is not valid if X and Y are infinities of the same
8551 // sign, i.e. the inf - inf = nan case. If the fsub has the ninf or nnan
8552 // flag then we can assume we do not have that case. Otherwise we might be
8553 // able to prove that either X or Y is not infinity.
// NOTE(review): the continuation of this condition (original lines 8555-8557,
// presumably the isKnownNeverInfinity checks on X/Y described in the comment
// above) is missing from this extraction.
8554 if (!LHSI->hasNoNaNs() && !LHSI->hasNoInfs() &&
8558 break;
8559
8560 [[fallthrough]];
8561 case FCmpInst::FCMP_OGT:
8562 case FCmpInst::FCMP_OLT:
8563 case FCmpInst::FCMP_ONE:
8564 case FCmpInst::FCMP_UEQ:
8565 case FCmpInst::FCMP_UGE:
8566 case FCmpInst::FCMP_ULE:
8567 // fcmp pred (x - y), 0 --> fcmp pred x, y
// NOTE(review): the line completing this denormal-mode comparison (original
// line 8571, the right-hand side of the '==') is missing from this extraction.
8568 if (match(RHSC, m_AnyZeroFP()) &&
8569 I.getFunction()->getDenormalMode(
8570 LHSI->getType()->getScalarType()->getFltSemantics()) ==
8572 CI.replaceOperand(I, 0, X);
8573 CI.replaceOperand(I, 1, Y);
8574 return &I;
8575 }
8576 break;
8577 }
8578
8579 return nullptr;
8580}
8581
// NOTE(review): the opening line of this definition (original line 8582, the
// function name and the FCmpInst &I parameter) is missing from this
// extraction; the text begins mid-signature. Also, each "", &I); continuation
// below has lost its opening line (original lines 8603/8614/8630/8641,
// presumably 'return new FCmpInst(FCmpInst::FCMP_ORD-or-UNO, RHS,
// ConstantFP::getZero(OpType),'). Restore them before use.
// Purpose (from the body): fold compares of floor(x)/ceil(x) against x using
// the facts floor(x) <= x and ceil(x) >= x (modulo NaN handling).
8583 InstCombinerImpl &IC) {
8584 Value *LHS = I.getOperand(0), *RHS = I.getOperand(1);
8585 Type *OpType = LHS->getType();
8586 CmpInst::Predicate Pred = I.getPredicate();
8587
8588 bool FloorX = match(LHS, m_Intrinsic<Intrinsic::floor>(m_Specific(RHS)));
8589 bool CeilX = match(LHS, m_Intrinsic<Intrinsic::ceil>(m_Specific(RHS)));
8590
// If the intrinsic is on the RHS instead, swap operands and the predicate so
// the switch below only has to reason about 'floor/ceil(x) pred x'.
8591 if (!FloorX && !CeilX) {
8592 if ((FloorX = match(RHS, m_Intrinsic<Intrinsic::floor>(m_Specific(LHS)))) ||
8593 (CeilX = match(RHS, m_Intrinsic<Intrinsic::ceil>(m_Specific(LHS))))) {
8594 std::swap(LHS, RHS);
8595 Pred = I.getSwappedPredicate();
8596 }
8597 }
8598
8599 switch (Pred) {
8600 case FCmpInst::FCMP_OLE:
8601 // fcmp ole floor(x), x => fcmp ord x, 0
8602 if (FloorX)
8604 "", &I);
8605 break;
8606 case FCmpInst::FCMP_OGT:
8607 // fcmp ogt floor(x), x => false
8608 if (FloorX)
8609 return IC.replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
8610 break;
8611 case FCmpInst::FCMP_OGE:
8612 // fcmp oge ceil(x), x => fcmp ord x, 0
8613 if (CeilX)
8615 "", &I);
8616 break;
8617 case FCmpInst::FCMP_OLT:
8618 // fcmp olt ceil(x), x => false
8619 if (CeilX)
8620 return IC.replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
8621 break;
8622 case FCmpInst::FCMP_ULE:
8623 // fcmp ule floor(x), x => true
8624 if (FloorX)
8625 return IC.replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));
8626 break;
8627 case FCmpInst::FCMP_UGT:
8628 // fcmp ugt floor(x), x => fcmp uno x, 0
8629 if (FloorX)
8631 "", &I);
8632 break;
8633 case FCmpInst::FCMP_UGE:
8634 // fcmp uge ceil(x), x => true
8635 if (CeilX)
8636 return IC.replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));
8637 break;
8638 case FCmpInst::FCMP_ULT:
8639 // fcmp ult ceil(x), x => fcmp uno x, 0
8640 if (CeilX)
8642 "", &I);
8643 break;
8644 default:
8645 break;
8646 }
8647
8648 return nullptr;
8649}
8650
8652 bool Changed = false;
8653
8654 /// Orders the operands of the compare so that they are listed from most
8655 /// complex to least complex. This puts constants before unary operators,
8656 /// before binary operators.
8657 if (getComplexity(I.getOperand(0)) < getComplexity(I.getOperand(1))) {
8658 I.swapOperands();
8659 Changed = true;
8660 }
8661
8662 const CmpInst::Predicate Pred = I.getPredicate();
8663 Value *Op0 = I.getOperand(0), *Op1 = I.getOperand(1);
8664 if (Value *V = simplifyFCmpInst(Pred, Op0, Op1, I.getFastMathFlags(),
8666 return replaceInstUsesWith(I, V);
8667
8668 // Simplify 'fcmp pred X, X'
8669 Type *OpType = Op0->getType();
8670 assert(OpType == Op1->getType() && "fcmp with different-typed operands?");
8671 if (Op0 == Op1) {
8672 switch (Pred) {
8673 default:
8674 break;
8675 case FCmpInst::FCMP_UNO: // True if unordered: isnan(X) | isnan(Y)
8676 case FCmpInst::FCMP_ULT: // True if unordered or less than
8677 case FCmpInst::FCMP_UGT: // True if unordered or greater than
8678 case FCmpInst::FCMP_UNE: // True if unordered or not equal
8679 // Canonicalize these to be 'fcmp uno %X, 0.0'.
8680 I.setPredicate(FCmpInst::FCMP_UNO);
8681 I.setOperand(1, Constant::getNullValue(OpType));
8682 return &I;
8683
8684 case FCmpInst::FCMP_ORD: // True if ordered (no nans)
8685 case FCmpInst::FCMP_OEQ: // True if ordered and equal
8686 case FCmpInst::FCMP_OGE: // True if ordered and greater than or equal
8687 case FCmpInst::FCMP_OLE: // True if ordered and less than or equal
8688 // Canonicalize these to be 'fcmp ord %X, 0.0'.
8689 I.setPredicate(FCmpInst::FCMP_ORD);
8690 I.setOperand(1, Constant::getNullValue(OpType));
8691 return &I;
8692 }
8693 }
8694
8695 if (I.isCommutative()) {
8696 if (auto Pair = matchSymmetricPair(I.getOperand(0), I.getOperand(1))) {
8697 replaceOperand(I, 0, Pair->first);
8698 replaceOperand(I, 1, Pair->second);
8699 return &I;
8700 }
8701 }
8702
8703 // If we're just checking for a NaN (ORD/UNO) and have a non-NaN operand,
8704 // then canonicalize the operand to 0.0.
8705 if (Pred == CmpInst::FCMP_ORD || Pred == CmpInst::FCMP_UNO) {
8706 if (!match(Op0, m_PosZeroFP()) &&
8707 isKnownNeverNaN(Op0, getSimplifyQuery().getWithInstruction(&I)))
8708 return replaceOperand(I, 0, ConstantFP::getZero(OpType));
8709
8710 if (!match(Op1, m_PosZeroFP()) &&
8711 isKnownNeverNaN(Op1, getSimplifyQuery().getWithInstruction(&I)))
8712 return replaceOperand(I, 1, ConstantFP::getZero(OpType));
8713 }
8714
8715 // fcmp pred (fneg X), (fneg Y) -> fcmp swap(pred) X, Y
8716 Value *X, *Y;
8717 if (match(Op0, m_FNeg(m_Value(X))) && match(Op1, m_FNeg(m_Value(Y))))
8718 return new FCmpInst(I.getSwappedPredicate(), X, Y, "", &I);
8719
8721 return R;
8722
8723 // Test if the FCmpInst instruction is used exclusively by a select as
8724 // part of a minimum or maximum operation. If so, refrain from doing
8725 // any other folding. This helps out other analyses which understand
8726 // non-obfuscated minimum and maximum idioms, such as ScalarEvolution
8727 // and CodeGen. And in this case, at least one of the comparison
8728 // operands has at least one user besides the compare (the select),
8729 // which would often largely negate the benefit of folding anyway.
8730 if (I.hasOneUse())
8731 if (SelectInst *SI = dyn_cast<SelectInst>(I.user_back())) {
8732 Value *A, *B;
8734 if (SPR.Flavor != SPF_UNKNOWN)
8735 return nullptr;
8736 }
8737
8738 // The sign of 0.0 is ignored by fcmp, so canonicalize to +0.0:
8739 // fcmp Pred X, -0.0 --> fcmp Pred X, 0.0
8740 if (match(Op1, m_AnyZeroFP()) && !match(Op1, m_PosZeroFP()))
8741 return replaceOperand(I, 1, ConstantFP::getZero(OpType));
8742
8743 // Canonicalize:
8744 // fcmp olt X, +inf -> fcmp one X, +inf
8745 // fcmp ole X, +inf -> fcmp ord X, 0
8746 // fcmp ogt X, +inf -> false
8747 // fcmp oge X, +inf -> fcmp oeq X, +inf
8748 // fcmp ult X, +inf -> fcmp une X, +inf
8749 // fcmp ule X, +inf -> true
8750 // fcmp ugt X, +inf -> fcmp uno X, 0
8751 // fcmp uge X, +inf -> fcmp ueq X, +inf
8752 // fcmp olt X, -inf -> false
8753 // fcmp ole X, -inf -> fcmp oeq X, -inf
8754 // fcmp ogt X, -inf -> fcmp one X, -inf
8755 // fcmp oge X, -inf -> fcmp ord X, 0
8756 // fcmp ult X, -inf -> fcmp uno X, 0
8757 // fcmp ule X, -inf -> fcmp ueq X, -inf
8758 // fcmp ugt X, -inf -> fcmp une X, -inf
8759 // fcmp uge X, -inf -> true
8760 const APFloat *C;
8761 if (match(Op1, m_APFloat(C)) && C->isInfinity()) {
8762 switch (C->isNegative() ? FCmpInst::getSwappedPredicate(Pred) : Pred) {
8763 default:
8764 break;
8765 case FCmpInst::FCMP_ORD:
8766 case FCmpInst::FCMP_UNO:
8769 case FCmpInst::FCMP_OGT:
8770 case FCmpInst::FCMP_ULE:
8771 llvm_unreachable("Should be simplified by InstSimplify");
8772 case FCmpInst::FCMP_OLT:
8773 return new FCmpInst(FCmpInst::FCMP_ONE, Op0, Op1, "", &I);
8774 case FCmpInst::FCMP_OLE:
8775 return new FCmpInst(FCmpInst::FCMP_ORD, Op0, ConstantFP::getZero(OpType),
8776 "", &I);
8777 case FCmpInst::FCMP_OGE:
8778 return new FCmpInst(FCmpInst::FCMP_OEQ, Op0, Op1, "", &I);
8779 case FCmpInst::FCMP_ULT:
8780 return new FCmpInst(FCmpInst::FCMP_UNE, Op0, Op1, "", &I);
8781 case FCmpInst::FCMP_UGT:
8782 return new FCmpInst(FCmpInst::FCMP_UNO, Op0, ConstantFP::getZero(OpType),
8783 "", &I);
8784 case FCmpInst::FCMP_UGE:
8785 return new FCmpInst(FCmpInst::FCMP_UEQ, Op0, Op1, "", &I);
8786 }
8787 }
8788
8789 // Ignore signbit of bitcasted int when comparing equality to FP 0.0:
8790 // fcmp oeq/une (bitcast X), 0.0 --> (and X, SignMaskC) ==/!= 0
8791 if (match(Op1, m_PosZeroFP()) &&
8794 if (Pred == FCmpInst::FCMP_OEQ)
8795 IntPred = ICmpInst::ICMP_EQ;
8796 else if (Pred == FCmpInst::FCMP_UNE)
8797 IntPred = ICmpInst::ICMP_NE;
8798
8799 if (IntPred != ICmpInst::BAD_ICMP_PREDICATE) {
8800 Type *IntTy = X->getType();
8801 const APInt &SignMask = ~APInt::getSignMask(IntTy->getScalarSizeInBits());
8802 Value *MaskX = Builder.CreateAnd(X, ConstantInt::get(IntTy, SignMask));
8803 return new ICmpInst(IntPred, MaskX, ConstantInt::getNullValue(IntTy));
8804 }
8805 }
8806
8807 // Handle fcmp with instruction LHS and constant RHS.
8808 Instruction *LHSI;
8809 Constant *RHSC;
8810 if (match(Op0, m_Instruction(LHSI)) && match(Op1, m_Constant(RHSC))) {
8811 switch (LHSI->getOpcode()) {
8812 case Instruction::Select:
8813 // fcmp eq (cond ? x : -x), 0 --> fcmp eq x, 0
8814 if (FCmpInst::isEquality(Pred) && match(RHSC, m_AnyZeroFP()) &&
8816 return replaceOperand(I, 0, X);
8817 if (Instruction *NV = FoldOpIntoSelect(I, cast<SelectInst>(LHSI)))
8818 return NV;
8819 break;
8820 case Instruction::FSub:
8821 if (LHSI->hasOneUse())
8822 if (Instruction *NV = foldFCmpFSubIntoFCmp(I, LHSI, RHSC, *this))
8823 return NV;
8824 break;
8825 case Instruction::PHI:
8826 if (Instruction *NV = foldOpIntoPhi(I, cast<PHINode>(LHSI)))
8827 return NV;
8828 break;
8829 case Instruction::SIToFP:
8830 case Instruction::UIToFP:
8831 if (Instruction *NV = foldFCmpIntToFPConst(I, LHSI, RHSC))
8832 return NV;
8833 break;
8834 case Instruction::FDiv:
8835 if (Instruction *NV = foldFCmpReciprocalAndZero(I, LHSI, RHSC))
8836 return NV;
8837 break;
8838 case Instruction::Load:
8839 if (auto *GEP = dyn_cast<GetElementPtrInst>(LHSI->getOperand(0)))
8840 if (auto *GV = dyn_cast<GlobalVariable>(GEP->getOperand(0)))
8842 cast<LoadInst>(LHSI), GEP, GV, I))
8843 return Res;
8844 break;
8845 case Instruction::FPTrunc:
8846 if (Instruction *NV = foldFCmpFpTrunc(I, *LHSI, *RHSC))
8847 return NV;
8848 break;
8849 }
8850 }
8851
8852 if (Instruction *R = foldFabsWithFcmpZero(I, *this))
8853 return R;
8854
8855 if (Instruction *R = foldSqrtWithFcmpZero(I, *this))
8856 return R;
8857
8858 if (Instruction *R = foldFCmpWithFloorAndCeil(I, *this))
8859 return R;
8860
8861 if (match(Op0, m_FNeg(m_Value(X)))) {
8862 // fcmp pred (fneg X), C --> fcmp swap(pred) X, -C
8863 Constant *C;
8864 if (match(Op1, m_Constant(C)))
8865 if (Constant *NegC = ConstantFoldUnaryOpOperand(Instruction::FNeg, C, DL))
8866 return new FCmpInst(I.getSwappedPredicate(), X, NegC, "", &I);
8867 }
8868
8869 // fcmp (fadd X, 0.0), Y --> fcmp X, Y
8870 if (match(Op0, m_FAdd(m_Value(X), m_AnyZeroFP())))
8871 return new FCmpInst(Pred, X, Op1, "", &I);
8872
8873 // fcmp X, (fadd Y, 0.0) --> fcmp X, Y
8874 if (match(Op1, m_FAdd(m_Value(Y), m_AnyZeroFP())))
8875 return new FCmpInst(Pred, Op0, Y, "", &I);
8876
8877 if (match(Op0, m_FPExt(m_Value(X)))) {
8878 // fcmp (fpext X), (fpext Y) -> fcmp X, Y
8879 if (match(Op1, m_FPExt(m_Value(Y))) && X->getType() == Y->getType())
8880 return new FCmpInst(Pred, X, Y, "", &I);
8881
8882 const APFloat *C;
8883 if (match(Op1, m_APFloat(C))) {
8884 const fltSemantics &FPSem =
8885 X->getType()->getScalarType()->getFltSemantics();
8886 bool Lossy;
8887 APFloat TruncC = *C;
8888 TruncC.convert(FPSem, APFloat::rmNearestTiesToEven, &Lossy);
8889
8890 if (Lossy) {
8891 // X can't possibly equal the higher-precision constant, so reduce any
8892 // equality comparison.
8893 // TODO: Other predicates can be handled via getFCmpCode().
8894 switch (Pred) {
8895 case FCmpInst::FCMP_OEQ:
8896 // X is ordered and equal to an impossible constant --> false
8897 return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
8898 case FCmpInst::FCMP_ONE:
8899 // X is ordered and not equal to an impossible constant --> ordered
8900 return new FCmpInst(FCmpInst::FCMP_ORD, X,
8901 ConstantFP::getZero(X->getType()));
8902 case FCmpInst::FCMP_UEQ:
8903 // X is unordered or equal to an impossible constant --> unordered
8904 return new FCmpInst(FCmpInst::FCMP_UNO, X,
8905 ConstantFP::getZero(X->getType()));
8906 case FCmpInst::FCMP_UNE:
8907 // X is unordered or not equal to an impossible constant --> true
8908 return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));
8909 default:
8910 break;
8911 }
8912 }
8913
8914 // fcmp (fpext X), C -> fcmp X, (fptrunc C) if fptrunc is lossless
8915 // Avoid lossy conversions and denormals.
8916 // Zero is a special case that's OK to convert.
8917 APFloat Fabs = TruncC;
8918 Fabs.clearSign();
8919 if (!Lossy &&
8920 (Fabs.isZero() || !(Fabs < APFloat::getSmallestNormalized(FPSem)))) {
8921 Constant *NewC = ConstantFP::get(X->getType(), TruncC);
8922 return new FCmpInst(Pred, X, NewC, "", &I);
8923 }
8924 }
8925 }
8926
8927 // Convert a sign-bit test of an FP value into a cast and integer compare.
8928 // TODO: Simplify if the copysign constant is 0.0 or NaN.
8929 // TODO: Handle non-zero compare constants.
8930 // TODO: Handle other predicates.
8931 if (match(Op0, m_OneUse(m_Intrinsic<Intrinsic::copysign>(m_APFloat(C),
8932 m_Value(X)))) &&
8933 match(Op1, m_AnyZeroFP()) && !C->isZero() && !C->isNaN()) {
8934 Type *IntType = Builder.getIntNTy(X->getType()->getScalarSizeInBits());
8935 if (auto *VecTy = dyn_cast<VectorType>(OpType))
8936 IntType = VectorType::get(IntType, VecTy->getElementCount());
8937
8938 // copysign(non-zero constant, X) < 0.0 --> (bitcast X) < 0
8939 if (Pred == FCmpInst::FCMP_OLT) {
8940 Value *IntX = Builder.CreateBitCast(X, IntType);
8941 return new ICmpInst(ICmpInst::ICMP_SLT, IntX,
8942 ConstantInt::getNullValue(IntType));
8943 }
8944 }
8945
8946 {
8947 Value *CanonLHS = nullptr, *CanonRHS = nullptr;
8948 match(Op0, m_Intrinsic<Intrinsic::canonicalize>(m_Value(CanonLHS)));
8949 match(Op1, m_Intrinsic<Intrinsic::canonicalize>(m_Value(CanonRHS)));
8950
8951 // (canonicalize(x) == x) => (x == x)
8952 if (CanonLHS == Op1)
8953 return new FCmpInst(Pred, Op1, Op1, "", &I);
8954
8955 // (x == canonicalize(x)) => (x == x)
8956 if (CanonRHS == Op0)
8957 return new FCmpInst(Pred, Op0, Op0, "", &I);
8958
8959 // (canonicalize(x) == canonicalize(y)) => (x == y)
8960 if (CanonLHS && CanonRHS)
8961 return new FCmpInst(Pred, CanonLHS, CanonRHS, "", &I);
8962 }
8963
8964 if (I.getType()->isVectorTy())
8965 if (Instruction *Res = foldVectorCmp(I, Builder))
8966 return Res;
8967
8968 return Changed ? &I : nullptr;
8969}
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
AMDGPU Register Bank Select
Rewrite undef for PHI
This file declares a class to represent arbitrary precision floating point values and provide a variety of arithmetic operations on them.
This file implements the APSInt class, which is a simple class that represents an arbitrary sized integer that knows its signedness.
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")
This file contains the declarations for the subclasses of Constant, which represent the different flavors of constant values that live in LLVM.
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
bool End
Definition: ELF_riscv.cpp:480
static GCMetadataPrinterRegistry::Add< ErlangGCPrinter > X("erlang", "erlang-compatible garbage collector")
#define Check(C,...)
Hexagon Common GEP
static Instruction * foldFCmpReciprocalAndZero(FCmpInst &I, Instruction *LHSI, Constant *RHSC)
Fold (C / X) < 0.0 --> X < 0.0 if possible. Swap predicate if necessary.
static Instruction * foldFabsWithFcmpZero(FCmpInst &I, InstCombinerImpl &IC)
Optimize fabs(X) compared with zero.
static void collectOffsetOp(Value *V, SmallVectorImpl< OffsetOp > &Offsets, bool AllowRecursion)
static Value * rewriteGEPAsOffset(Value *Start, Value *Base, GEPNoWrapFlags NW, const DataLayout &DL, SetVector< Value * > &Explored, InstCombiner &IC)
Returns a re-written value of Start as an indexed GEP using Base as a pointer.
static Instruction * foldICmpEqualityWithOffset(ICmpInst &I, InstCombiner::BuilderTy &Builder, const SimplifyQuery &SQ)
Offset both sides of an equality icmp to see if we can save some instructions: icmp eq/ne X,...
static bool addWithOverflow(APInt &Result, const APInt &In1, const APInt &In2, bool IsSigned=false)
Compute Result = In1+In2, returning true if the result overflowed for this type.
static Instruction * foldICmpAndXX(ICmpInst &I, const SimplifyQuery &Q, InstCombinerImpl &IC)
static Instruction * foldVectorCmp(CmpInst &Cmp, InstCombiner::BuilderTy &Builder)
static bool isMaskOrZero(const Value *V, bool Not, const SimplifyQuery &Q, unsigned Depth=0)
static Value * createLogicFromTable(const std::bitset< 4 > &Table, Value *Op0, Value *Op1, IRBuilderBase &Builder, bool HasOneUse)
static Instruction * foldICmpOfUAddOv(ICmpInst &I)
static bool isChainSelectCmpBranch(const SelectInst *SI)
Return true when the instruction sequence within a block is select-cmp-br.
static Instruction * foldICmpInvariantGroup(ICmpInst &I)
std::pair< Instruction::BinaryOps, Value * > OffsetOp
Find all possible pairs (BinOp, RHS) that BinOp V, RHS can be simplified.
static Instruction * foldReductionIdiom(ICmpInst &I, InstCombiner::BuilderTy &Builder, const DataLayout &DL)
This function folds patterns produced by lowering of reduce idioms, such as llvm.vector....
static Instruction * canonicalizeICmpBool(ICmpInst &I, InstCombiner::BuilderTy &Builder)
Integer compare with boolean values can always be turned into bitwise ops.
static Instruction * foldFCmpFSubIntoFCmp(FCmpInst &I, Instruction *LHSI, Constant *RHSC, InstCombinerImpl &CI)
static Value * foldICmpOrXorSubChain(ICmpInst &Cmp, BinaryOperator *Or, InstCombiner::BuilderTy &Builder)
Fold icmp eq/ne (or (xor/sub (X1, X2), xor/sub (X3, X4))), 0.
static bool hasBranchUse(ICmpInst &I)
Given an icmp instruction, return true if any use of this comparison is a branch on sign bit comparison.
static Value * foldICmpWithLowBitMaskedVal(CmpPredicate Pred, Value *Op0, Value *Op1, const SimplifyQuery &Q, InstCombiner &IC)
Some comparisons can be simplified.
static APInt getDemandedBitsLHSMask(ICmpInst &I, unsigned BitWidth)
When performing a comparison against a constant, it is possible that not all the bits in the LHS are demanded.
static Instruction * foldICmpShlLHSC(ICmpInst &Cmp, Instruction *Shl, const APInt &C)
Fold icmp (shl nuw C2, Y), C.
static Instruction * foldFCmpWithFloorAndCeil(FCmpInst &I, InstCombinerImpl &IC)
static Instruction * foldICmpXorXX(ICmpInst &I, const SimplifyQuery &Q, InstCombinerImpl &IC)
static Instruction * foldICmpOfCmpIntrinsicWithConstant(CmpPredicate Pred, IntrinsicInst *I, const APInt &C, InstCombiner::BuilderTy &Builder)
static Instruction * processUMulZExtIdiom(ICmpInst &I, Value *MulVal, const APInt *OtherVal, InstCombinerImpl &IC)
Recognize and process idiom involving test for multiplication overflow.
static Instruction * foldSqrtWithFcmpZero(FCmpInst &I, InstCombinerImpl &IC)
Optimize sqrt(X) compared with zero.
static Instruction * foldFCmpFNegCommonOp(FCmpInst &I)
static Instruction * foldICmpWithHighBitMask(ICmpInst &Cmp, InstCombiner::BuilderTy &Builder)
static ICmpInst * canonicalizeCmpWithConstant(ICmpInst &I)
If we have an icmp le or icmp ge instruction with a constant operand, turn it into the appropriate icmp lt or icmp gt instruction.
static Instruction * foldICmpIntrinsicWithIntrinsic(ICmpInst &Cmp, InstCombiner::BuilderTy &Builder)
Fold an icmp with LLVM intrinsics.
static Instruction * foldICmpUSubSatOrUAddSatWithConstant(CmpPredicate Pred, SaturatingInst *II, const APInt &C, InstCombiner::BuilderTy &Builder)
static Instruction * foldICmpPow2Test(ICmpInst &I, InstCombiner::BuilderTy &Builder)
static bool subWithOverflow(APInt &Result, const APInt &In1, const APInt &In2, bool IsSigned=false)
Compute Result = In1-In2, returning true if the result overflowed for this type.
static bool canRewriteGEPAsOffset(Value *Start, Value *Base, GEPNoWrapFlags &NW, const DataLayout &DL, SetVector< Value * > &Explored)
Returns true if we can rewrite Start as a GEP with pointer Base and some integer offset.
static Instruction * foldFCmpFpTrunc(FCmpInst &I, const Instruction &FPTrunc, const Constant &C)
static Instruction * foldICmpXNegX(ICmpInst &I, InstCombiner::BuilderTy &Builder)
static Instruction * processUGT_ADDCST_ADD(ICmpInst &I, Value *A, Value *B, ConstantInt *CI2, ConstantInt *CI1, InstCombinerImpl &IC)
The caller has matched a pattern of the form: I = icmp ugt (add (add A, B), CI2), CI1 If this is of t...
static Value * foldShiftIntoShiftInAnotherHandOfAndInICmp(ICmpInst &I, const SimplifyQuery SQ, InstCombiner::BuilderTy &Builder)
static bool isSignTest(ICmpInst::Predicate &Pred, const APInt &C)
Returns true if the exploded icmp can be expressed as a signed comparison to zero and updates the pre...
static Instruction * transformToIndexedCompare(GEPOperator *GEPLHS, Value *RHS, CmpPredicate Cond, const DataLayout &DL, InstCombiner &IC)
Converts (CMP GEPLHS, RHS) if this change would make RHS a constant.
static Instruction * foldCtpopPow2Test(ICmpInst &I, IntrinsicInst *CtpopLhs, const APInt &CRhs, InstCombiner::BuilderTy &Builder, const SimplifyQuery &Q)
static void setInsertionPoint(IRBuilder<> &Builder, Value *V, bool Before=true)
static bool isNeutralValue(Instruction::BinaryOps BinaryOp, Value *RHS, bool IsSigned)
static bool isMultipleOf(Value *X, const APInt &C, const SimplifyQuery &Q)
Return true if X is a multiple of C.
static Value * foldICmpWithTruncSignExtendedVal(ICmpInst &I, InstCombiner::BuilderTy &Builder)
Some comparisons can be simplified.
static Instruction * foldICmpOrXX(ICmpInst &I, const SimplifyQuery &Q, InstCombinerImpl &IC)
This file provides internal interfaces used to implement the InstCombine.
This file provides the interface for the instcombine pass implementation.
static bool isZero(Value *V, const DataLayout &DL, DominatorTree *DT, AssumptionCache *AC)
Definition: Lint.cpp:546
#define F(x, y, z)
Definition: MD5.cpp:55
#define I(x, y, z)
Definition: MD5.cpp:58
mir Rename Register Operands
#define T1
uint64_t IntrinsicInst * II
static GCMetadataPrinterRegistry::Add< OcamlGCMetadataPrinter > Y("ocaml", "ocaml 3.10-compatible collector")
#define P(N)
const SmallVectorImpl< MachineOperand > & Cond
This file implements a set that has insertion order iteration characteristics.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
Definition: Statistic.h:167
static SymbolRef::Type getType(const Symbol *Sym)
Definition: TapiFile.cpp:39
Value * RHS
Value * LHS
LLVM_ABI opStatus convert(const fltSemantics &ToSemantics, roundingMode RM, bool *losesInfo)
Definition: APFloat.cpp:6057
void clearSign()
Definition: APFloat.h:1298
bool isNaN() const
Definition: APFloat.h:1447
bool isZero() const
Definition: APFloat.h:1445
static APFloat getSmallestNormalized(const fltSemantics &Sem, bool Negative=false)
Returns the smallest (by magnitude) normalized finite number in the given semantics.
Definition: APFloat.h:1158
APInt bitcastToAPInt() const
Definition: APFloat.h:1353
static APFloat getLargest(const fltSemantics &Sem, bool Negative=false)
Returns the largest finite number in the given semantics.
Definition: APFloat.h:1138
opStatus next(bool nextDown)
Definition: APFloat.h:1254
static APFloat getInf(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative Infinity.
Definition: APFloat.h:1098
LLVM_ABI FPClassTest classify() const
Return the FPClassTest which will return true for the value.
Definition: APFloat.cpp:5986
opStatus roundToIntegral(roundingMode RM)
Definition: APFloat.h:1248
bool isInfinity() const
Definition: APFloat.h:1446
Class for arbitrary precision integers.
Definition: APInt.h:78
LLVM_ABI APInt udiv(const APInt &RHS) const
Unsigned division operation.
Definition: APInt.cpp:1573
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
Definition: APInt.h:234
static LLVM_ABI void udivrem(const APInt &LHS, const APInt &RHS, APInt &Quotient, APInt &Remainder)
Dual division/remainder interface.
Definition: APInt.cpp:1758
bool isNegatedPowerOf2() const
Check if this APInt's negated value is a power of two greater than zero.
Definition: APInt.h:449
LLVM_ABI APInt zext(unsigned width) const
Zero extend to a new width.
Definition: APInt.cpp:1012
static APInt getSignMask(unsigned BitWidth)
Get the SignMask for a specific bit width.
Definition: APInt.h:229
bool isMinSignedValue() const
Determine if this is the smallest signed value.
Definition: APInt.h:423
uint64_t getZExtValue() const
Get zero extended value.
Definition: APInt.h:1540
unsigned getActiveBits() const
Compute the number of active bits in the value.
Definition: APInt.h:1512
LLVM_ABI APInt trunc(unsigned width) const
Truncate to new width.
Definition: APInt.cpp:936
static APInt getMaxValue(unsigned numBits)
Gets maximum unsigned value of APInt for specific bit width.
Definition: APInt.h:206
void setBit(unsigned BitPosition)
Set the given bit to 1 whose position is given as "bitPosition".
Definition: APInt.h:1330
APInt abs() const
Get the absolute value.
Definition: APInt.h:1795
unsigned ceilLogBase2() const
Definition: APInt.h:1764
bool sgt(const APInt &RHS) const
Signed greater than comparison.
Definition: APInt.h:1201
bool isAllOnes() const
Determine if all bits are set. This is true for zero-width values.
Definition: APInt.h:371
LLVM_ABI APInt usub_ov(const APInt &RHS, bool &Overflow) const
Definition: APInt.cpp:1948
bool ugt(const APInt &RHS) const
Unsigned greater than comparison.
Definition: APInt.h:1182
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
Definition: APInt.h:380
bool isSignMask() const
Check if the APInt's value is returned by getSignMask.
Definition: APInt.h:466
unsigned getBitWidth() const
Return the number of bits in the APInt.
Definition: APInt.h:1488
bool ult(const APInt &RHS) const
Unsigned less than comparison.
Definition: APInt.h:1111
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
Definition: APInt.h:209
static APInt getMinValue(unsigned numBits)
Gets minimum unsigned value of APInt for a specific bit width.
Definition: APInt.h:216
bool isNegative() const
Determine sign of this APInt.
Definition: APInt.h:329
LLVM_ABI APInt sadd_ov(const APInt &RHS, bool &Overflow) const
Definition: APInt.cpp:1928
bool eq(const APInt &RHS) const
Equality comparison.
Definition: APInt.h:1079
LLVM_ABI APInt sdiv(const APInt &RHS) const
Signed division function for APInt.
Definition: APInt.cpp:1644
LLVM_ABI APInt uadd_ov(const APInt &RHS, bool &Overflow) const
Definition: APInt.cpp:1935
void negate()
Negate this APInt in place.
Definition: APInt.h:1468
unsigned countr_zero() const
Count the number of trailing zero bits.
Definition: APInt.h:1639
unsigned countl_zero() const
The APInt version of std::countl_zero.
Definition: APInt.h:1598
static APInt getSignedMinValue(unsigned numBits)
Gets minimum signed value of APInt for a specific bit width.
Definition: APInt.h:219
bool isStrictlyPositive() const
Determine if this APInt Value is positive.
Definition: APInt.h:356
void flipAllBits()
Toggle every bit to its opposite value.
Definition: APInt.h:1452
unsigned countl_one() const
Count the number of leading one bits.
Definition: APInt.h:1615
unsigned logBase2() const
Definition: APInt.h:1761
uint64_t getLimitedValue(uint64_t Limit=UINT64_MAX) const
If this value is smaller than the specified limit, return it, otherwise return the limit value.
Definition: APInt.h:475
APInt ashr(unsigned ShiftAmt) const
Arithmetic right-shift function.
Definition: APInt.h:827
bool isMaxSignedValue() const
Determine if this is the largest signed value.
Definition: APInt.h:405
bool ule(const APInt &RHS) const
Unsigned less or equal comparison.
Definition: APInt.h:1150
APInt shl(unsigned shiftAmt) const
Left-shift function.
Definition: APInt.h:873
bool isPowerOf2() const
Check if this APInt's value is a power of two greater than zero.
Definition: APInt.h:440
static APInt getLowBitsSet(unsigned numBits, unsigned loBitsSet)
Constructs an APInt value that has the bottom loBitsSet bits set.
Definition: APInt.h:306
static APInt getHighBitsSet(unsigned numBits, unsigned hiBitsSet)
Constructs an APInt value that has the top hiBitsSet bits set.
Definition: APInt.h:296
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
Definition: APInt.h:200
bool sge(const APInt &RHS) const
Signed greater or equal comparison.
Definition: APInt.h:1237
LLVM_ABI APInt ssub_ov(const APInt &RHS, bool &Overflow) const
Definition: APInt.cpp:1941
bool isOne() const
Determine if this is a value of 1.
Definition: APInt.h:389
static APInt getBitsSetFrom(unsigned numBits, unsigned loBit)
Constructs an APInt value that has a contiguous range of bits set.
Definition: APInt.h:286
static APInt getOneBitSet(unsigned numBits, unsigned BitNo)
Return an APInt with exactly one bit set in the result.
Definition: APInt.h:239
APInt lshr(unsigned shiftAmt) const
Logical right-shift function.
Definition: APInt.h:851
unsigned countr_one() const
Count the number of trailing one bits.
Definition: APInt.h:1656
bool uge(const APInt &RHS) const
Unsigned greater or equal comparison.
Definition: APInt.h:1221
An arbitrary precision integer that knows its signedness.
Definition: APSInt.h:24
an instruction to allocate memory on the stack
Definition: Instructions.h:64
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41
Class to represent array types.
Definition: DerivedTypes.h:398
LLVM Basic Block Representation.
Definition: BasicBlock.h:62
LLVM_ABI const_iterator getFirstInsertionPt() const
Returns an iterator to the first instruction in this block that is suitable for inserting a non-PHI i...
Definition: BasicBlock.cpp:393
LLVM_ABI const BasicBlock * getSinglePredecessor() const
Return the predecessor of this block if it has a single predecessor block.
Definition: BasicBlock.cpp:437
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction if the block is well formed or null if the block is not well forme...
Definition: BasicBlock.h:233
BinaryOps getOpcode() const
Definition: InstrTypes.h:374
static LLVM_ABI BinaryOperator * CreateNot(Value *Op, const Twine &Name="", InsertPosition InsertBefore=nullptr)
static LLVM_ABI BinaryOperator * Create(BinaryOps Op, Value *S1, Value *S2, const Twine &Name=Twine(), InsertPosition InsertBefore=nullptr)
Construct a binary instruction, given the opcode and the two operands.
Conditional or Unconditional Branch instruction.
Value * getArgOperand(unsigned i) const
Definition: InstrTypes.h:1292
This class represents a function call, abstracting a target machine's calling convention.
static CallInst * Create(FunctionType *Ty, Value *F, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
This class is the base class for the comparison instructions.
Definition: InstrTypes.h:666
static Type * makeCmpResultType(Type *opnd_type)
Create a result type for fcmp/icmp.
Definition: InstrTypes.h:984
Predicate getStrictPredicate() const
For example, SGE -> SGT, SLE -> SLT, ULE -> ULT, UGE -> UGT.
Definition: InstrTypes.h:860
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition: InstrTypes.h:678
@ FCMP_OEQ
0 0 0 1 True if ordered and equal
Definition: InstrTypes.h:681
@ FCMP_TRUE
1 1 1 1 Always true (always folded)
Definition: InstrTypes.h:695
@ ICMP_SLT
signed less than
Definition: InstrTypes.h:707
@ ICMP_SLE
signed less or equal
Definition: InstrTypes.h:708
@ FCMP_OLT
0 1 0 0 True if ordered and less than
Definition: InstrTypes.h:684
@ FCMP_ULE
1 1 0 1 True if unordered, less than, or equal
Definition: InstrTypes.h:693
@ FCMP_OGT
0 0 1 0 True if ordered and greater than
Definition: InstrTypes.h:682
@ FCMP_OGE
0 0 1 1 True if ordered and greater than or equal
Definition: InstrTypes.h:683
@ ICMP_UGE
unsigned greater or equal
Definition: InstrTypes.h:702
@ ICMP_UGT
unsigned greater than
Definition: InstrTypes.h:701
@ ICMP_SGT
signed greater than
Definition: InstrTypes.h:705
@ FCMP_ULT
1 1 0 0 True if unordered or less than
Definition: InstrTypes.h:692
@ FCMP_ONE
0 1 1 0 True if ordered and operands are unequal
Definition: InstrTypes.h:686
@ FCMP_UEQ
1 0 0 1 True if unordered or equal
Definition: InstrTypes.h:689
@ ICMP_ULT
unsigned less than
Definition: InstrTypes.h:703
@ FCMP_UGT
1 0 1 0 True if unordered or greater than
Definition: InstrTypes.h:690
@ FCMP_OLE
0 1 0 1 True if ordered and less than or equal
Definition: InstrTypes.h:685
@ FCMP_ORD
0 1 1 1 True if ordered (no nans)
Definition: InstrTypes.h:687
@ ICMP_EQ
equal
Definition: InstrTypes.h:699
@ ICMP_NE
not equal
Definition: InstrTypes.h:700
@ ICMP_SGE
signed greater or equal
Definition: InstrTypes.h:706
@ FCMP_UNE
1 1 1 0 True if unordered or not equal
Definition: InstrTypes.h:694
@ ICMP_ULE
unsigned less or equal
Definition: InstrTypes.h:704
@ FCMP_UGE
1 0 1 1 True if unordered, greater than, or equal
Definition: InstrTypes.h:691
@ FCMP_FALSE
0 0 0 0 Always false (always folded)
Definition: InstrTypes.h:680
@ FCMP_UNO
1 0 0 0 True if unordered: isnan(X) | isnan(Y)
Definition: InstrTypes.h:688
bool isSigned() const
Definition: InstrTypes.h:932
Predicate getSwappedPredicate() const
For example, EQ->EQ, SLE->SGE, ULT->UGT, OEQ->OEQ, ULE->UGE, OLT->OGT, etc.
Definition: InstrTypes.h:829
bool isTrueWhenEqual() const
This is just a convenience.
Definition: InstrTypes.h:944
static LLVM_ABI CmpInst * Create(OtherOps Op, Predicate Pred, Value *S1, Value *S2, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Construct a compare instruction, given the opcode, the predicate and the two operands.
Predicate getNonStrictPredicate() const
For example, SGT -> SGE, SLT -> SLE, ULT -> ULE, UGT -> UGE.
Definition: InstrTypes.h:873
Predicate getInversePredicate() const
For example, EQ -> NE, UGT -> ULE, SLT -> SGE, OEQ -> UNE, UGT -> OLE, OLT -> UGE,...
Definition: InstrTypes.h:791
Predicate getPredicate() const
Return the predicate for this instruction.
Definition: InstrTypes.h:767
bool isStrictPredicate() const
Definition: InstrTypes.h:845
Predicate getFlippedStrictnessPredicate() const
For predicate of kind "is X or equal to 0" returns the predicate "is X".
Definition: InstrTypes.h:895
bool isIntPredicate() const
Definition: InstrTypes.h:785
bool isUnsigned() const
Definition: InstrTypes.h:938
An abstraction over a floating-point predicate, and a pack of an integer predicate with samesign info...
Definition: CmpPredicate.h:23
CmpInst::Predicate dropSameSign() const
Drops samesign information.
Definition: CmpPredicate.h:47
static LLVM_ABI CmpPredicate getSwapped(CmpPredicate P)
Get the swapped predicate of a CmpPredicate.
static LLVM_ABI Constant * getIntToPtr(Constant *C, Type *Ty, bool OnlyIfReduced=false)
Definition: Constants.cpp:2314
static LLVM_ABI Constant * getPointerBitCastOrAddrSpaceCast(Constant *C, Type *Ty)
Create a BitCast or AddrSpaceCast for a pointer type depending on the address space.
Definition: Constants.cpp:2261
static LLVM_ABI Constant * getSub(Constant *C1, Constant *C2, bool HasNUW=false, bool HasNSW=false)
Definition: Constants.cpp:2654
static LLVM_ABI Constant * getNot(Constant *C)
Definition: Constants.cpp:2641
static LLVM_ABI Constant * getPtrToInt(Constant *C, Type *Ty, bool OnlyIfReduced=false)
Definition: Constants.cpp:2300
static LLVM_ABI Constant * getXor(Constant *C1, Constant *C2)
Definition: Constants.cpp:2661
static LLVM_ABI Constant * getNeg(Constant *C, bool HasNSW=false)
Definition: Constants.cpp:2635
static LLVM_ABI Constant * getZero(Type *Ty, bool Negative=false)
Definition: Constants.cpp:1059
This is the shared class of boolean and integer constants.
Definition: Constants.h:87
uint64_t getLimitedValue(uint64_t Limit=~0ULL) const
getLimitedValue - If the value is smaller than the specified limit, return it, otherwise return the l...
Definition: Constants.h:264
static LLVM_ABI ConstantInt * getTrue(LLVMContext &Context)
Definition: Constants.cpp:868
bool isZero() const
This is just a convenience method to make client code smaller for a common code.
Definition: Constants.h:214
static ConstantInt * getSigned(IntegerType *Ty, int64_t V)
Return a ConstantInt with the specified value for the specified type.
Definition: Constants.h:131
static LLVM_ABI ConstantInt * getFalse(LLVMContext &Context)
Definition: Constants.cpp:875
unsigned getBitWidth() const
getBitWidth - Return the scalar bitwidth of this constant.
Definition: Constants.h:157
const APInt & getValue() const
Return the constant as an APInt value reference.
Definition: Constants.h:154
static LLVM_ABI ConstantInt * getBool(LLVMContext &Context, bool V)
Definition: Constants.cpp:882
This class represents a range of values.
Definition: ConstantRange.h:47
LLVM_ABI ConstantRange add(const ConstantRange &Other) const
Return a new range representing the possible values resulting from an addition of a value in this ran...
LLVM_ABI std::optional< ConstantRange > exactUnionWith(const ConstantRange &CR) const
Union the two ranges and return the result if it can be represented exactly, otherwise return std::nu...
LLVM_ABI bool getEquivalentICmp(CmpInst::Predicate &Pred, APInt &RHS) const
Set up Pred and RHS such that ConstantRange::makeExactICmpRegion(Pred, RHS) == *this.
LLVM_ABI ConstantRange subtract(const APInt &CI) const
Subtract the specified constant from the endpoints of this constant range.
const APInt * getSingleElement() const
If this set contains a single element, return it, otherwise return null.
LLVM_ABI ConstantRange difference(const ConstantRange &CR) const
Subtract the specified range from this range (aka relative complement of the sets).
LLVM_ABI bool isEmptySet() const
Return true if this set contains no members.
LLVM_ABI ConstantRange truncate(uint32_t BitWidth, unsigned NoWrapKind=0) const
Return a new range in the specified integer type, which must be strictly smaller than the current typ...
static LLVM_ABI ConstantRange makeExactICmpRegion(CmpInst::Predicate Pred, const APInt &Other)
Produce the exact range such that all values in the returned range satisfy the given predicate with a...
LLVM_ABI ConstantRange inverse() const
Return a new range that is the logical not of the current set.
LLVM_ABI std::optional< ConstantRange > exactIntersectWith(const ConstantRange &CR) const
Intersect the two ranges and return the result if it can be represented exactly, otherwise return std...
LLVM_ABI ConstantRange intersectWith(const ConstantRange &CR, PreferredRangeType Type=Smallest) const
Return the range that results from the intersection of this range with another range.
LLVM_ABI ConstantRange sub(const ConstantRange &Other) const
Return a new range representing the possible values resulting from a subtraction of a value in this r...
static LLVM_ABI ConstantRange makeExactNoWrapRegion(Instruction::BinaryOps BinOp, const APInt &Other, unsigned NoWrapKind)
Produce the range that contains X if and only if "X BinOp Other" does not wrap.
static LLVM_ABI Constant * getSplat(ElementCount EC, Constant *Elt)
Return a ConstantVector with the specified constant in each element.
Definition: Constants.cpp:1474
This is an important base class in LLVM.
Definition: Constant.h:43
static LLVM_ABI Constant * getIntegerValue(Type *Ty, const APInt &V)
Return the value for an integer or pointer constant, or a vector thereof, with the given scalar value...
Definition: Constants.cpp:403
static LLVM_ABI Constant * getAllOnesValue(Type *Ty)
Definition: Constants.cpp:420
LLVM_ABI const APInt & getUniqueInteger() const
If C is a constant integer then return its value, otherwise C must be a vector of constant integers,...
Definition: Constants.cpp:1778
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
Definition: Constants.cpp:373
LLVM_ABI bool isNullValue() const
Return true if this is the value that would be returned by getNullValue.
Definition: Constants.cpp:90
This class represents an Operation in the Expression.
A parsed version of the target data layout string in and methods for querying it.
Definition: DataLayout.h:63
LLVM_ABI IntegerType * getIntPtrType(LLVMContext &C, unsigned AddressSpace=0) const
Returns an integer type with size at least as big as that of a pointer in the given address space.
Definition: DataLayout.cpp:850
LLVM_ABI unsigned getPointerTypeSizeInBits(Type *) const
The pointer representation size in bits for this type.
Definition: DataLayout.cpp:742
LLVM_ABI IntegerType * getIndexType(LLVMContext &C, unsigned AddressSpace) const
Returns the type of a GEP index in AddressSpace.
Definition: DataLayout.cpp:877
TypeSize getTypeAllocSize(Type *Ty) const
Returns the offset in bytes between successive objects of the specified type, including alignment pad...
Definition: DataLayout.h:504
LLVM_ABI Type * getSmallestLegalIntType(LLVMContext &C, unsigned Width=0) const
Returns the smallest integer type with size at least as big as Width bits.
Definition: DataLayout.cpp:865
iterator find(const_arg_type_t< KeyT > Val)
Definition: DenseMap.h:177
iterator end()
Definition: DenseMap.h:87
bool contains(const_arg_type_t< KeyT > Val) const
Return true if the specified key is in the map, false otherwise.
Definition: DenseMap.h:168
ArrayRef< BranchInst * > conditionsFor(const Value *V) const
Access the list of branches which affect this value.
LLVM_ABI bool dominates(const BasicBlock *BB, const Use &U) const
Return true if the (end of the) basic block BB dominates the use U.
Definition: Dominators.cpp:135
static ExtractValueInst * Create(Value *Agg, ArrayRef< unsigned > Idxs, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
This instruction compares its operands according to the predicate given to the constructor.
bool isEquality() const
Represents flags for the getelementptr instruction/expression.
bool hasNoUnsignedSignedWrap() const
bool hasNoUnsignedWrap() const
GEPNoWrapFlags intersectForOffsetAdd(GEPNoWrapFlags Other) const
Given (gep (gep p, x), y), determine the nowrap flags for (gep p, x+y).
static GEPNoWrapFlags none()
bool isInBounds() const
Test whether this is an inbounds GEP, as defined by LangRef.html.
Definition: Operator.h:430
LLVM_ABI Type * getSourceElementType() const
Definition: Operator.cpp:70
Value * getPointerOperand()
Definition: Operator.h:457
GEPNoWrapFlags getNoWrapFlags() const
Definition: Operator.h:425
bool hasAllConstantIndices() const
Return true if all of the indices of this GEP are constant integers.
Definition: Operator.h:504
an instruction for type-safe pointer arithmetic to access elements of arrays and structs
Definition: Instructions.h:949
Type * getValueType() const
Definition: GlobalValue.h:298
const Constant * getInitializer() const
getInitializer - Return the initializer for this global variable.
bool isConstant() const
If the value is a global constant, its value is immutable throughout the runtime execution of the pro...
bool hasDefinitiveInitializer() const
hasDefinitiveInitializer - Whether the global variable has an initializer, and any other instances of...
This instruction compares its operands according to the predicate given to the constructor.
static bool isGE(Predicate P)
Return true if the predicate is SGE or UGE.
static LLVM_ABI bool compare(const APInt &LHS, const APInt &RHS, ICmpInst::Predicate Pred)
Return result of LHS Pred RHS comparison.
static bool isLT(Predicate P)
Return true if the predicate is SLT or ULT.
static bool isGT(Predicate P)
Return true if the predicate is SGT or UGT.
Predicate getFlippedSignednessPredicate() const
For example, SLT->ULT, ULT->SLT, SLE->ULE, ULE->SLE, EQ->EQ.
Predicate getSignedPredicate() const
For example, EQ->EQ, SLE->SLE, UGT->SGT, etc.
bool isEquality() const
Return true if this predicate is either EQ or NE.
static bool isEquality(Predicate P)
Return true if this predicate is either EQ or NE.
bool isRelational() const
Return true if the predicate is relational (not EQ or NE).
Predicate getUnsignedPredicate() const
For example, EQ->EQ, SLE->ULE, UGT->UGT, etc.
static bool isLE(Predicate P)
Return true if the predicate is SLE or ULE.
Common base class shared among various IRBuilders.
Definition: IRBuilder.h:114
Value * CreateICmpULT(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2345
Value * CreateExtractElement(Value *Vec, Value *Idx, const Twine &Name="")
Definition: IRBuilder.h:2559
IntegerType * getIntNTy(unsigned N)
Fetch the type representing an N-bit integer.
Definition: IRBuilder.h:575
Value * CreateICmpSGT(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2353
LLVM_ABI Value * CreateVectorSplat(unsigned NumElts, Value *V, const Twine &Name="")
Return a vector value that contains NumElts copies of the scalar value V (a splat).
Definition: IRBuilder.cpp:1115
Value * CreateExtractValue(Value *Agg, ArrayRef< unsigned > Idxs, const Twine &Name="")
Definition: IRBuilder.h:2618
ConstantInt * getTrue()
Get the constant value for i1 true.
Definition: IRBuilder.h:502
LLVM_ABI Value * CreateSelect(Value *C, Value *True, Value *False, const Twine &Name="", Instruction *MDFrom=nullptr)
Definition: IRBuilder.cpp:1005
Value * CreateLShr(Value *LHS, Value *RHS, const Twine &Name="", bool isExact=false)
Definition: IRBuilder.h:1513
Value * CreateCast(Instruction::CastOps Op, Value *V, Type *DestTy, const Twine &Name="", MDNode *FPMathTag=nullptr, FMFSource FMFSource={})
Definition: IRBuilder.h:2238
Value * CreateICmpNE(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2333
Value * CreateGEP(Type *Ty, Value *Ptr, ArrayRef< Value * > IdxList, const Twine &Name="", GEPNoWrapFlags NW=GEPNoWrapFlags::none())
Definition: IRBuilder.h:1923
Value * CreateNeg(Value *V, const Twine &Name="", bool HasNSW=false)
Definition: IRBuilder.h:1781
LLVM_ABI Value * createIsFPClass(Value *FPNum, unsigned Test)
Definition: IRBuilder.cpp:1223
LLVM_ABI CallInst * CreateIntrinsic(Intrinsic::ID ID, ArrayRef< Type * > Types, ArrayRef< Value * > Args, FMFSource FMFSource={}, const Twine &Name="")
Create a call to intrinsic ID with Args, mangled using Types.
Definition: IRBuilder.cpp:834
ConstantInt * getInt32(uint32_t C)
Get a constant 32-bit value.
Definition: IRBuilder.h:522
Value * CreateCmp(CmpInst::Predicate Pred, Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2463
PHINode * CreatePHI(Type *Ty, unsigned NumReservedValues, const Twine &Name="")
Definition: IRBuilder.h:2494
Value * CreateNot(Value *V, const Twine &Name="")
Definition: IRBuilder.h:1805
Value * CreateICmpEQ(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2329
Value * CreateSub(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1420
Value * CreateBitCast(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2204
Value * CreateICmpUGT(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2337
LLVM_ABI CallInst * CreateUnaryIntrinsic(Intrinsic::ID ID, Value *V, FMFSource FMFSource={}, const Twine &Name="")
Create a call to intrinsic ID with 1 operand which is mangled on its type.
Definition: IRBuilder.cpp:815
Value * CreateShl(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1492
Value * CreateZExt(Value *V, Type *DestTy, const Twine &Name="", bool IsNonNeg=false)
Definition: IRBuilder.h:2082
Value * CreateAnd(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1551
Value * CreateAdd(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1403
ConstantInt * getFalse()
Get the constant value for i1 false.
Definition: IRBuilder.h:507
CallInst * CreateCall(FunctionType *FTy, Value *Callee, ArrayRef< Value * > Args={}, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2508
Value * CreateTrunc(Value *V, Type *DestTy, const Twine &Name="", bool IsNUW=false, bool IsNSW=false)
Definition: IRBuilder.h:2068
Value * CreateBinOp(Instruction::BinaryOps Opc, Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:1708
Value * CreateICmpSLT(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2361
Value * CreateIntCast(Value *V, Type *DestTy, bool isSigned, const Twine &Name="")
Definition: IRBuilder.h:2277
Value * CreateIsNull(Value *Arg, const Twine &Name="")
Return a boolean value testing if Arg == 0.
Definition: IRBuilder.h:2646
void SetInsertPoint(BasicBlock *TheBB)
This specifies that created instructions should be appended to the end of the specified block.
Definition: IRBuilder.h:207
Value * CreateXor(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1599
Value * CreateICmp(CmpInst::Predicate P, Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2439
Value * CreateOr(Value *LHS, Value *RHS, const Twine &Name="", bool IsDisjoint=false)
Definition: IRBuilder.h:1573
IntegerType * getInt8Ty()
Fetch the type representing an 8-bit integer.
Definition: IRBuilder.h:552
ConstantInt * getInt(const APInt &AI)
Get a constant integer value.
Definition: IRBuilder.h:538
Value * CreateURem(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1480
Value * CreateMul(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1437
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition: IRBuilder.h:2780
Instruction * foldICmpShrConstant(ICmpInst &Cmp, BinaryOperator *Shr, const APInt &C)
Fold icmp ({al}shr X, Y), C.
Instruction * FoldOpIntoSelect(Instruction &Op, SelectInst *SI, bool FoldWithMultiUse=false)
Given an instruction with a select as one operand and a constant as the other operand,...
Instruction * foldICmpWithZextOrSext(ICmpInst &ICmp)
Instruction * foldICmpSelectConstant(ICmpInst &Cmp, SelectInst *Select, ConstantInt *C)
Instruction * foldICmpSRemConstant(ICmpInst &Cmp, BinaryOperator *UDiv, const APInt &C)
Instruction * foldICmpBinOpWithConstant(ICmpInst &Cmp, BinaryOperator *BO, const APInt &C)
Fold an icmp with BinaryOp and constant operand: icmp Pred BO, C.
Instruction * foldICmpOrConstant(ICmpInst &Cmp, BinaryOperator *Or, const APInt &C)
Fold icmp (or X, Y), C.
Instruction * foldICmpTruncWithTruncOrExt(ICmpInst &Cmp, const SimplifyQuery &Q)
Fold icmp (trunc nuw/nsw X), (trunc nuw/nsw Y).
Instruction * foldSignBitTest(ICmpInst &I)
Fold equality-comparison between zero and any (maybe truncated) right-shift by one-less-than-bitwidth...
Instruction * foldOpIntoPhi(Instruction &I, PHINode *PN, bool AllowMultipleUses=false)
Given a binary operator, cast instruction, or select which has a PHI node as operand #0,...
Value * insertRangeTest(Value *V, const APInt &Lo, const APInt &Hi, bool isSigned, bool Inside)
Emit a computation of: (V >= Lo && V < Hi) if Inside is true, otherwise (V < Lo || V >= Hi).
Instruction * foldICmpBinOp(ICmpInst &Cmp, const SimplifyQuery &SQ)
Try to fold icmp (binop), X or icmp X, (binop).
Instruction * foldICmpSubConstant(ICmpInst &Cmp, BinaryOperator *Sub, const APInt &C)
Fold icmp (sub X, Y), C.
Instruction * foldICmpInstWithConstantNotInt(ICmpInst &Cmp)
Handle icmp with constant (but not simple integer constant) RHS.
bool SimplifyDemandedBits(Instruction *I, unsigned Op, const APInt &DemandedMask, KnownBits &Known, const SimplifyQuery &Q, unsigned Depth=0) override
This form of SimplifyDemandedBits simplifies the specified instruction operand if possible,...
Instruction * foldICmpShlConstConst(ICmpInst &I, Value *ShAmt, const APInt &C1, const APInt &C2)
Handle "(icmp eq/ne (shl AP2, A), AP1)" -> (icmp eq/ne A, TrailingZeros(AP1) - TrailingZeros(AP2)).
Value * reassociateShiftAmtsOfTwoSameDirectionShifts(BinaryOperator *Sh0, const SimplifyQuery &SQ, bool AnalyzeForSignBitExtraction=false)
Instruction * foldICmpEqIntrinsicWithConstant(ICmpInst &ICI, IntrinsicInst *II, const APInt &C)
Fold an equality icmp with LLVM intrinsic and constant operand.
Value * foldMultiplicationOverflowCheck(ICmpInst &Cmp)
Fold (-1 u/ x) u&lt; y and ((x * y) ?/ x) != y to @llvm.?mul.with.overflow(x, y) plus extraction of its result.
Instruction * foldICmpWithConstant(ICmpInst &Cmp)
Fold icmp Pred X, C.
CmpInst * canonicalizeICmpPredicate(CmpInst &I)
If we have a comparison with a non-canonical predicate, if we can update all the users,...
Instruction * eraseInstFromFunction(Instruction &I) override
Combiner aware instruction erasure.
Instruction * foldICmpWithZero(ICmpInst &Cmp)
Instruction * foldICmpCommutative(CmpPredicate Pred, Value *Op0, Value *Op1, ICmpInst &CxtI)
Instruction * foldICmpBinOpEqualityWithConstant(ICmpInst &Cmp, BinaryOperator *BO, const APInt &C)
Fold an icmp equality instruction with binary operator LHS and constant RHS: icmp eq/ne BO,...
Instruction * foldICmpUsingBoolRange(ICmpInst &I)
If one operand of an icmp is effectively a bool (value range of {0,1}), then try to reduce patterns b...
Instruction * foldICmpWithTrunc(ICmpInst &Cmp)
Instruction * foldICmpIntrinsicWithConstant(ICmpInst &ICI, IntrinsicInst *II, const APInt &C)
Fold an icmp with LLVM intrinsic and constant operand: icmp Pred II, C.
bool matchThreeWayIntCompare(SelectInst *SI, Value *&LHS, Value *&RHS, ConstantInt *&Less, ConstantInt *&Equal, ConstantInt *&Greater)
Match a select chain which produces one of three values based on whether the LHS is less than,...
Instruction * foldCmpLoadFromIndexedGlobal(LoadInst *LI, GetElementPtrInst *GEP, GlobalVariable *GV, CmpInst &ICI, ConstantInt *AndCst=nullptr)
This is called when we see this pattern: cmp pred (load (gep GV, ...)), cmpcst where GV is a global v...
Instruction * visitFCmpInst(FCmpInst &I)
Instruction * foldICmpUsingKnownBits(ICmpInst &Cmp)
Try to fold the comparison based on range information we can get by checking whether bits are known t...
Instruction * foldICmpDivConstant(ICmpInst &Cmp, BinaryOperator *Div, const APInt &C)
Fold icmp ({su}div X, Y), C.
Instruction * foldIRemByPowerOfTwoToBitTest(ICmpInst &I)
If we have: icmp eq/ne (urem/srem x, y), 0 iff y is a power-of-two, we can replace this with a bit te...
Instruction * foldFCmpIntToFPConst(FCmpInst &I, Instruction *LHSI, Constant *RHSC)
Fold fcmp ([us]itofp x, cst) if possible.
Instruction * foldICmpUDivConstant(ICmpInst &Cmp, BinaryOperator *UDiv, const APInt &C)
Fold icmp (udiv X, Y), C.
Instruction * foldICmpAddOpConst(Value *X, const APInt &C, CmpPredicate Pred)
Fold "icmp pred (X+C), X".
Constant * getLosslessTrunc(Constant *C, Type *TruncTy, unsigned ExtOp)
Instruction * foldICmpWithCastOp(ICmpInst &ICmp)
Handle icmp (cast x), (cast or constant).
Instruction * foldICmpTruncConstant(ICmpInst &Cmp, TruncInst *Trunc, const APInt &C)
Fold icmp (trunc X), C.
Instruction * foldICmpAddConstant(ICmpInst &Cmp, BinaryOperator *Add, const APInt &C)
Fold icmp (add X, Y), C.
Instruction * foldICmpMulConstant(ICmpInst &Cmp, BinaryOperator *Mul, const APInt &C)
Fold icmp (mul X, Y), C.
Instruction * tryFoldInstWithCtpopWithNot(Instruction *I)
Instruction * foldICmpXorConstant(ICmpInst &Cmp, BinaryOperator *Xor, const APInt &C)
Fold icmp (xor X, Y), C.
Instruction * foldSelectICmp(CmpPredicate Pred, SelectInst *SI, Value *RHS, const ICmpInst &I)
Instruction * foldICmpInstWithConstantAllowPoison(ICmpInst &Cmp, const APInt &C)
Try to fold integer comparisons with a constant operand: icmp Pred X, C where X is some kind of instr...
Instruction * foldIsMultipleOfAPowerOfTwo(ICmpInst &Cmp)
Fold icmp eq (num + mask) &amp; ~mask, num to icmp eq (and num, mask), 0, where mask is a low-bit mask.
Instruction * foldICmpAndShift(ICmpInst &Cmp, BinaryOperator *And, const APInt &C1, const APInt &C2)
Fold icmp (and (sh X, Y), C2), C1.
Instruction * foldICmpBinOpWithConstantViaTruthTable(ICmpInst &Cmp, BinaryOperator *BO, const APInt &C)
Instruction * foldICmpInstWithConstant(ICmpInst &Cmp)
Try to fold integer comparisons with a constant operand: icmp Pred X, C where X is some kind of instr...
Instruction * foldICmpXorShiftConst(ICmpInst &Cmp, BinaryOperator *Xor, const APInt &C)
For power-of-2 C: ((X s>> ShiftC) ^ X) u< C --> (X + C) u< (C << 1) ((X s>> ShiftC) ^ X) u> (C - 1) -...
Instruction * foldICmpShlConstant(ICmpInst &Cmp, BinaryOperator *Shl, const APInt &C)
Fold icmp (shl X, Y), C.
Instruction * foldICmpAndConstant(ICmpInst &Cmp, BinaryOperator *And, const APInt &C)
Fold icmp (and X, Y), C.
Instruction * foldICmpEquality(ICmpInst &Cmp)
Instruction * foldICmpWithMinMax(Instruction &I, MinMaxIntrinsic *MinMax, Value *Z, CmpPredicate Pred)
Fold icmp Pred min|max(X, Y), Z.
bool dominatesAllUses(const Instruction *DI, const Instruction *UI, const BasicBlock *DB) const
True when DB dominates all uses of DI except UI.
bool foldAllocaCmp(AllocaInst *Alloca)
Instruction * visitICmpInst(ICmpInst &I)
OverflowResult computeOverflow(Instruction::BinaryOps BinaryOp, bool IsSigned, Value *LHS, Value *RHS, Instruction *CxtI) const
Instruction * foldICmpWithDominatingICmp(ICmpInst &Cmp)
Canonicalize icmp instructions based on dominating conditions.
bool replacedSelectWithOperand(SelectInst *SI, const ICmpInst *Icmp, const unsigned SIOpd)
Try to replace select with select operand SIOpd in SI-ICmp sequence.
Instruction * foldICmpShrConstConst(ICmpInst &I, Value *ShAmt, const APInt &C1, const APInt &C2)
Handle "(icmp eq/ne (ashr/lshr AP2, A), AP1)" -> (icmp eq/ne A, Log2(AP2/AP1)) -> (icmp eq/ne A,...
void freelyInvertAllUsersOf(Value *V, Value *IgnoredUser=nullptr)
Freely adapt every user of V as-if V was changed to !V.
Instruction * foldICmpAndConstConst(ICmpInst &Cmp, BinaryOperator *And, const APInt &C1)
Fold icmp (and X, C2), C1.
Instruction * foldICmpBitCast(ICmpInst &Cmp)
Instruction * foldGEPICmp(GEPOperator *GEPLHS, Value *RHS, CmpPredicate Cond, Instruction &I)
Fold comparisons between a GEP instruction and something else.
The core instruction combiner logic.
Definition: InstCombiner.h:48
OverflowResult computeOverflowForSignedSub(const Value *LHS, const Value *RHS, const Instruction *CxtI) const
Definition: InstCombiner.h:505
SimplifyQuery SQ
Definition: InstCombiner.h:77
unsigned ComputeMaxSignificantBits(const Value *Op, const Instruction *CxtI=nullptr, unsigned Depth=0) const
Definition: InstCombiner.h:462
bool isFreeToInvert(Value *V, bool WillInvertAllUses, bool &DoesConsume)
Return true if the specified value is free to invert (apply ~ to).
Definition: InstCombiner.h:228
OverflowResult computeOverflowForUnsignedMul(const Value *LHS, const Value *RHS, const Instruction *CxtI, bool IsNSW=false) const
Definition: InstCombiner.h:468
static unsigned getComplexity(Value *V)
Assign a complexity or rank value to LLVM Values.
Definition: InstCombiner.h:143
TargetLibraryInfo & TLI
Definition: InstCombiner.h:74
Instruction * replaceInstUsesWith(Instruction &I, Value *V)
A combiner-aware RAUW-like routine.
Definition: InstCombiner.h:388
uint64_t MaxArraySizeForCombine
Maximum size of array considered when transforming.
Definition: InstCombiner.h:56
OverflowResult computeOverflowForSignedAdd(const WithCache< const Value * > &LHS, const WithCache< const Value * > &RHS, const Instruction *CxtI) const
Definition: InstCombiner.h:491
static Constant * SubOne(Constant *C)
Subtract one from a Constant.
Definition: InstCombiner.h:183
OverflowResult computeOverflowForUnsignedSub(const Value *LHS, const Value *RHS, const Instruction *CxtI) const
Definition: InstCombiner.h:498
static bool isCanonicalPredicate(CmpPredicate Pred)
Predicate canonicalization reduces the number of patterns that need to be matched by other transforms...
Definition: InstCombiner.h:160
const DataLayout & DL
Definition: InstCombiner.h:76
DomConditionCache DC
Definition: InstCombiner.h:82
void computeKnownBits(const Value *V, KnownBits &Known, const Instruction *CxtI, unsigned Depth=0) const
Definition: InstCombiner.h:433
bool canFreelyInvertAllUsersOf(Instruction *V, Value *IgnoredUser)
Given i1 V, can every user of V be freely adapted if V is changed to !V ? InstCombine's freelyInvertA...
Definition: InstCombiner.h:244
void addToWorklist(Instruction *I)
Definition: InstCombiner.h:332
Instruction * replaceOperand(Instruction &I, unsigned OpNum, Value *V)
Replace operand of instruction and add old operand to the worklist.
Definition: InstCombiner.h:412
DominatorTree & DT
Definition: InstCombiner.h:75
OverflowResult computeOverflowForSignedMul(const Value *LHS, const Value *RHS, const Instruction *CxtI) const
Definition: InstCombiner.h:476
BuilderTy & Builder
Definition: InstCombiner.h:61
OverflowResult computeOverflowForUnsignedAdd(const WithCache< const Value * > &LHS, const WithCache< const Value * > &RHS, const Instruction *CxtI) const
Definition: InstCombiner.h:483
Value * getFreelyInverted(Value *V, bool WillInvertAllUses, BuilderTy *Builder, bool &DoesConsume)
Definition: InstCombiner.h:209
const SimplifyQuery & getSimplifyQuery() const
Definition: InstCombiner.h:338
bool isKnownToBeAPowerOfTwo(const Value *V, bool OrZero=false, const Instruction *CxtI=nullptr, unsigned Depth=0)
Definition: InstCombiner.h:443
LLVM_ABI bool hasNoNaNs() const LLVM_READONLY
Determine whether the no-NaNs flag is set.
LLVM_ABI bool hasNoUnsignedWrap() const LLVM_READONLY
Determine whether the no unsigned wrap flag is set.
LLVM_ABI bool hasNoInfs() const LLVM_READONLY
Determine whether the no-infs flag is set.
bool isArithmeticShift() const
Return true if this is an arithmetic shift right.
Definition: Instruction.h:361
LLVM_ABI bool hasNoSignedWrap() const LLVM_READONLY
Determine whether the no signed wrap flag is set.
LLVM_ABI bool isCommutative() const LLVM_READONLY
Return true if the instruction is commutative:
LLVM_ABI bool isExact() const LLVM_READONLY
Determine whether the exact flag is set.
unsigned getOpcode() const
Returns a member of one of the enums like Instruction::Add.
Definition: Instruction.h:312
bool isShift() const
Definition: Instruction.h:320
static LLVM_ABI IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition: Type.cpp:319
A wrapper class for inspecting calls to intrinsic functions.
Definition: IntrinsicInst.h:49
Intrinsic::ID getIntrinsicID() const
Return the intrinsic ID of this intrinsic.
Definition: IntrinsicInst.h:56
An instruction for reading from memory.
Definition: Instructions.h:180
bool isVolatile() const
Return true if this is a load from a volatile memory location.
Definition: Instructions.h:209
This class represents min/max intrinsics.
A Module instance is used to store all the information related to an LLVM module.
Definition: Module.h:67
void addIncoming(Value *V, BasicBlock *BB)
Add an incoming value to the end of the PHI list.
static PHINode * Create(Type *Ty, unsigned NumReservedValues, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Constructors - NumReservedValues is a hint for the number of incoming edges that this phi node will h...
Represents a saturating add/sub intrinsic.
This class represents the LLVM 'select' instruction.
static SelectInst * Create(Value *C, Value *S1, Value *S2, const Twine &NameStr="", InsertPosition InsertBefore=nullptr, Instruction *MDFrom=nullptr)
A vector that has set insertion semantics.
Definition: SetVector.h:59
size_type size() const
Determine the number of elements in the SetVector.
Definition: SetVector.h:104
bool insert(const value_type &X)
Insert a new element into the SetVector.
Definition: SetVector.h:168
bool contains(const key_type &key) const
Check if the SetVector contains the given key.
Definition: SetVector.h:269
This instruction constructs a fixed permutation of two input vectors.
bool empty() const
Definition: SmallVector.h:82
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:574
reference emplace_back(ArgTypes &&... Args)
Definition: SmallVector.h:938
void push_back(const T &Elt)
Definition: SmallVector.h:414
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1197
Class to represent struct types.
Definition: DerivedTypes.h:218
This class represents a truncation of integer types.
bool hasNoSignedWrap() const
Test whether this operation is known to never undergo signed overflow, aka the nsw property.
bool hasNoUnsignedWrap() const
Test whether this operation is known to never undergo unsigned overflow, aka the nuw property.
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45
LLVM_ABI TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.
bool isVectorTy() const
True if this is an instance of VectorType.
Definition: Type.h:273
LLVM_ABI int getFPMantissaWidth() const
Return the width of the mantissa of this type.
bool isArrayTy() const
True if this is an instance of ArrayType.
Definition: Type.h:264
bool isIntOrIntVectorTy() const
Return true if this is an integer type or a vector of integer types.
Definition: Type.h:246
bool isPointerTy() const
True if this is an instance of PointerType.
Definition: Type.h:267
Type * getArrayElementType() const
Definition: Type.h:408
static LLVM_ABI IntegerType * getInt1Ty(LLVMContext &C)
bool isPPC_FP128Ty() const
Return true if this is powerpc long double.
Definition: Type.h:165
LLVM_ABI Type * getWithNewBitWidth(unsigned NewBitWidth) const
Given an integer or vector type, change the lane bitwidth to NewBitwidth, whilst keeping the old numb...
LLVM_ABI unsigned getPointerAddressSpace() const
Get the address space of this pointer or pointer vector type.
LLVMContext & getContext() const
Return the LLVMContext in which this type was uniqued.
Definition: Type.h:128
LLVM_ABI const fltSemantics & getFltSemantics() const
LLVM_ABI unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition: Type.h:240
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
Definition: Type.h:352
A Use represents the edge between a Value definition and its users.
Definition: Use.h:35
void setOperand(unsigned i, Value *Val)
Definition: User.h:237
Value * getOperand(unsigned i) const
Definition: User.h:232
unsigned getNumOperands() const
Definition: User.h:254
LLVM Value Representation.
Definition: Value.h:75
Type * getType() const
All values are typed, get the type of this value.
Definition: Value.h:256
bool hasOneUse() const
Return true if there is exactly one use of this value.
Definition: Value.h:439
iterator_range< user_iterator > users()
Definition: Value.h:426
LLVM_ABI bool hasNUsesOrMore(unsigned N) const
Return true if this value has N uses or more.
Definition: Value.cpp:158
LLVM_ABI const Value * stripAndAccumulateConstantOffsets(const DataLayout &DL, APInt &Offset, bool AllowNonInbounds, bool AllowInvariantGroup=false, function_ref< bool(Value &Value, APInt &Offset)> ExternalAnalysis=nullptr, bool LookThroughIntToPtr=false) const
Accumulate the constant offset this value has compared to a base pointer.
LLVM_ABI const Value * stripPointerCasts() const
Strip off pointer casts, all-zero GEPs and address space casts.
Definition: Value.cpp:701
LLVM_ABI LLVMContext & getContext() const
All values hold a context through their type.
Definition: Value.cpp:1098
iterator_range< use_iterator > uses()
Definition: Value.h:380
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
Definition: Value.cpp:322
LLVM_ABI void takeName(Value *V)
Transfer the name from V to this value.
Definition: Value.cpp:396
static LLVM_ABI VectorType * get(Type *ElementType, ElementCount EC)
This static method is the primary way to construct an VectorType.
constexpr ScalarTy getFixedValue() const
Definition: TypeSize.h:203
const ParentTy * getParent() const
Definition: ilist_node.h:34
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
LLVM_ABI APInt RoundingUDiv(const APInt &A, const APInt &B, APInt::Rounding RM)
Return A unsign-divided by B, rounded by the given rounding mode.
Definition: APInt.cpp:2763
LLVM_ABI APInt RoundingSDiv(const APInt &A, const APInt &B, APInt::Rounding RM)
Return A sign-divided by B, rounded by the given rounding mode.
Definition: APInt.cpp:2781
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34
LLVM_ABI Function * getOrInsertDeclaration(Module *M, ID id, ArrayRef< Type * > Tys={})
Look up the Function declaration of the intrinsic id in the Module M.
Definition: Intrinsics.cpp:751
SpecificConstantMatch m_ZeroInt()
Convenience matchers for specific integer values.
BinaryOp_match< SpecificConstantMatch, SrcTy, TargetOpcode::G_SUB > m_Neg(const SrcTy &&Src)
Matches a register negated by a G_SUB.
BinaryOp_match< SrcTy, SpecificConstantMatch, TargetOpcode::G_XOR, true > m_Not(const SrcTy &&Src)
Matches a register not-ed by a G_XOR.
OneUse_match< SubPat > m_OneUse(const SubPat &SP)
cst_pred_ty< is_all_ones > m_AllOnes()
Match an integer or vector with all bits set.
Definition: PatternMatch.h:524
cst_pred_ty< is_lowbit_mask > m_LowBitMask()
Match an integer or vector with only the low bit(s) set.
Definition: PatternMatch.h:673
BinaryOp_match< LHS, RHS, Instruction::And > m_And(const LHS &L, const RHS &R)
cst_pred_ty< is_negative > m_Negative()
Match an integer or vector of negative values.
Definition: PatternMatch.h:550
BinaryOp_match< LHS, RHS, Instruction::Add > m_Add(const LHS &L, const RHS &R)
class_match< BinaryOperator > m_BinOp()
Match an arbitrary binary operation and ignore it.
Definition: PatternMatch.h:100
cst_pred_ty< is_sign_mask > m_SignMask()
Match an integer or vector with only the sign bit(s) set.
Definition: PatternMatch.h:664
OverflowingBinaryOp_match< LHS, RHS, Instruction::Add, OverflowingBinaryOperator::NoUnsignedWrap > m_NUWAdd(const LHS &L, const RHS &R)
BinaryOp_match< LHS, RHS, Instruction::AShr > m_AShr(const LHS &L, const RHS &R)
cst_pred_ty< is_power2 > m_Power2()
Match an integer or vector power-of-2.
Definition: PatternMatch.h:619
BinaryOp_match< LHS, RHS, Instruction::URem > m_URem(const LHS &L, const RHS &R)
match_combine_or< CastInst_match< OpTy, TruncInst >, OpTy > m_TruncOrSelf(const OpTy &Op)
class_match< Constant > m_Constant()
Match an arbitrary Constant and ignore it.
Definition: PatternMatch.h:165
BinaryOp_match< LHS, RHS, Instruction::And, true > m_c_And(const LHS &L, const RHS &R)
Matches an And with LHS and RHS in either order.
CastInst_match< OpTy, TruncInst > m_Trunc(const OpTy &Op)
Matches Trunc.
BinaryOp_match< LHS, RHS, Instruction::Xor > m_Xor(const LHS &L, const RHS &R)
specific_intval< false > m_SpecificInt(const APInt &V)
Match a specific integer value or vector with all elements equal to the value.
match_combine_or< CastInst_match< OpTy, ZExtInst >, OpTy > m_ZExtOrSelf(const OpTy &Op)
bool match(Val *V, const Pattern &P)
Definition: PatternMatch.h:49
BinOpPred_match< LHS, RHS, is_idiv_op > m_IDiv(const LHS &L, const RHS &R)
Matches integer division operations.
bind_ty< Instruction > m_Instruction(Instruction *&I)
Match an instruction, capturing it if we match.
Definition: PatternMatch.h:862
cstfp_pred_ty< is_any_zero_fp > m_AnyZeroFP()
Match a floating-point negative zero or positive zero.
Definition: PatternMatch.h:766
specificval_ty m_Specific(const Value *V)
Match if we have a specific specified value.
Definition: PatternMatch.h:962
BinOpPred_match< LHS, RHS, is_right_shift_op > m_Shr(const LHS &L, const RHS &R)
Matches logical shift operations.
specific_intval< true > m_SpecificIntAllowPoison(const APInt &V)
CmpClass_match< LHS, RHS, ICmpInst, true > m_c_ICmp(CmpPredicate &Pred, const LHS &L, const RHS &R)
Matches an ICmp with a predicate over LHS and RHS in either order.
OverflowingBinaryOp_match< cst_pred_ty< is_zero_int >, ValTy, Instruction::Sub, OverflowingBinaryOperator::NoSignedWrap > m_NSWNeg(const ValTy &V)
Matches a 'Neg' as 'sub nsw 0, V'.
cst_pred_ty< is_nonnegative > m_NonNegative()
Match an integer or vector of non-negative values.
Definition: PatternMatch.h:560
class_match< ConstantInt > m_ConstantInt()
Match an arbitrary ConstantInt and ignore it.
Definition: PatternMatch.h:168
cst_pred_ty< is_one > m_One()
Match an integer 1 or a vector with all elements equal to 1.
Definition: PatternMatch.h:592
ThreeOps_match< Cond, LHS, RHS, Instruction::Select > m_Select(const Cond &C, const LHS &L, const RHS &R)
Matches SelectInst.
BinOpPred_match< LHS, RHS, is_logical_shift_op > m_LogicalShift(const LHS &L, const RHS &R)
Matches logical shift operations.
match_combine_and< LTy, RTy > m_CombineAnd(const LTy &L, const RTy &R)
Combine two pattern matchers matching L && R.
Definition: PatternMatch.h:245
MaxMin_match< ICmpInst, LHS, RHS, smin_pred_ty > m_SMin(const LHS &L, const RHS &R)
m_Intrinsic_Ty< Opnd0 >::Ty m_Sqrt(const Opnd0 &Op0)
BinaryOp_match< LHS, RHS, Instruction::Xor, true > m_c_Xor(const LHS &L, const RHS &R)
Matches an Xor with LHS and RHS in either order.
BinaryOp_match< LHS, RHS, Instruction::FAdd > m_FAdd(const LHS &L, const RHS &R)
BinaryOp_match< LHS, RHS, Instruction::Mul > m_Mul(const LHS &L, const RHS &R)
deferredval_ty< Value > m_Deferred(Value *const &V)
Like m_Specific(), but works if the specific value to match is determined as part of the same match()...
Definition: PatternMatch.h:980
apint_match m_APIntAllowPoison(const APInt *&Res)
Match APInt while allowing poison in splat vector constants.
Definition: PatternMatch.h:305
NoWrapTrunc_match< OpTy, TruncInst::NoSignedWrap > m_NSWTrunc(const OpTy &Op)
Matches trunc nsw.
TwoOps_match< V1_t, V2_t, Instruction::ShuffleVector > m_Shuffle(const V1_t &v1, const V2_t &v2)
Matches ShuffleVectorInst independently of mask value.
ThreeOps_match< decltype(m_Value()), LHS, RHS, Instruction::Select, true > m_c_Select(const LHS &L, const RHS &R)
Match Select(C, LHS, RHS) or Select(C, RHS, LHS)
CastInst_match< OpTy, FPExtInst > m_FPExt(const OpTy &Op)
CastInst_match< OpTy, ZExtInst > m_ZExt(const OpTy &Op)
Matches ZExt.
OverflowingBinaryOp_match< LHS, RHS, Instruction::Shl, OverflowingBinaryOperator::NoUnsignedWrap > m_NUWShl(const LHS &L, const RHS &R)
OverflowingBinaryOp_match< LHS, RHS, Instruction::Mul, OverflowingBinaryOperator::NoUnsignedWrap > m_NUWMul(const LHS &L, const RHS &R)
BinaryOp_match< LHS, RHS, Instruction::UDiv > m_UDiv(const LHS &L, const RHS &R)
match_immconstant_ty m_ImmConstant()
Match an arbitrary immediate Constant and ignore it.
Definition: PatternMatch.h:931
cst_pred_ty< is_negated_power2_or_zero > m_NegatedPower2OrZero()
Match a integer or vector negated power-of-2.
Definition: PatternMatch.h:639
NoWrapTrunc_match< OpTy, TruncInst::NoUnsignedWrap > m_NUWTrunc(const OpTy &Op)
Matches trunc nuw.
cst_pred_ty< custom_checkfn< APInt > > m_CheckedInt(function_ref< bool(const APInt &)> CheckFn)
Match an integer or vector where CheckFn(ele) for each element is true.
Definition: PatternMatch.h:481
cst_pred_ty< is_lowbit_mask_or_zero > m_LowBitMaskOrZero()
Match an integer or vector with only the low bit(s) set.
Definition: PatternMatch.h:683
BinaryOp_match< LHS, RHS, Instruction::Add, true > m_c_Add(const LHS &L, const RHS &R)
Matches a Add with LHS and RHS in either order.
match_combine_or< BinaryOp_match< LHS, RHS, Instruction::Add >, DisjointOr_match< LHS, RHS > > m_AddLike(const LHS &L, const RHS &R)
Match either "add" or "or disjoint".
CastInst_match< OpTy, UIToFPInst > m_UIToFP(const OpTy &Op)
CastOperator_match< OpTy, Instruction::BitCast > m_BitCast(const OpTy &Op)
Matches BitCast.
BinaryOp_match< LHS, RHS, Instruction::SDiv > m_SDiv(const LHS &L, const RHS &R)
apint_match m_APInt(const APInt *&Res)
Match a ConstantInt or splatted ConstantVector, binding the specified pointer to the contained APInt.
Definition: PatternMatch.h:299
class_match< Value > m_Value()
Match an arbitrary value and ignore it.
Definition: PatternMatch.h:92
Signum_match< Val_t > m_Signum(const Val_t &V)
Matches a signum pattern.
CastInst_match< OpTy, SIToFPInst > m_SIToFP(const OpTy &Op)
BinaryOp_match< LHS, RHS, Instruction::LShr > m_LShr(const LHS &L, const RHS &R)
CmpClass_match< LHS, RHS, ICmpInst > m_ICmp(CmpPredicate &Pred, const LHS &L, const RHS &R)
match_combine_or< CastInst_match< OpTy, ZExtInst >, CastInst_match< OpTy, SExtInst > > m_ZExtOrSExt(const OpTy &Op)
FNeg_match< OpTy > m_FNeg(const OpTy &X)
Match 'fneg X' as 'fsub -0.0, X'.
cstfp_pred_ty< is_pos_zero_fp > m_PosZeroFP()
Match a floating-point positive zero.
Definition: PatternMatch.h:775
BinaryOp_match< LHS, RHS, Instruction::Shl > m_Shl(const LHS &L, const RHS &R)
UAddWithOverflow_match< LHS_t, RHS_t, Sum_t > m_UAddWithOverflow(const LHS_t &L, const RHS_t &R, const Sum_t &S)
Match an icmp instruction checking for unsigned overflow on addition.
m_Intrinsic_Ty< Opnd0 >::Ty m_VecReverse(const Opnd0 &Op0)
BinOpPred_match< LHS, RHS, is_irem_op > m_IRem(const LHS &L, const RHS &R)
Matches integer remainder operations.
apfloat_match m_APFloat(const APFloat *&Res)
Match a ConstantFP or splatted ConstantVector, binding the specified pointer to the contained APFloat...
Definition: PatternMatch.h:316
match_combine_or< match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, smax_pred_ty >, MaxMin_match< ICmpInst, LHS, RHS, smin_pred_ty > >, match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, umax_pred_ty >, MaxMin_match< ICmpInst, LHS, RHS, umin_pred_ty > > > m_MaxOrMin(const LHS &L, const RHS &R)
CastInst_match< OpTy, FPTruncInst > m_FPTrunc(const OpTy &Op)
auto m_Undef()
Match an arbitrary undef constant.
Definition: PatternMatch.h:152
BinaryOp_match< LHS, RHS, Instruction::Or > m_Or(const LHS &L, const RHS &R)
CastInst_match< OpTy, SExtInst > m_SExt(const OpTy &Op)
Matches SExt.
is_zero m_Zero()
Match any null constant or a vector with all elements equal to 0.
Definition: PatternMatch.h:612
BinaryOp_match< LHS, RHS, Instruction::Or, true > m_c_Or(const LHS &L, const RHS &R)
Matches an Or with LHS and RHS in either order.
ElementWiseBitCast_match< OpTy > m_ElementWiseBitCast(const OpTy &Op)
m_Intrinsic_Ty< Opnd0 >::Ty m_FAbs(const Opnd0 &Op0)
BinaryOp_match< LHS, RHS, Instruction::Mul, true > m_c_Mul(const LHS &L, const RHS &R)
Matches a Mul with LHS and RHS in either order.
CastOperator_match< OpTy, Instruction::PtrToInt > m_PtrToInt(const OpTy &Op)
Matches PtrToInt.
BinaryOp_match< LHS, RHS, Instruction::Sub > m_Sub(const LHS &L, const RHS &R)
match_unless< Ty > m_Unless(const Ty &M)
Match if the inner matcher does NOT match.
Definition: PatternMatch.h:203
match_combine_or< LTy, RTy > m_CombineOr(const LTy &L, const RTy &R)
Combine two pattern matchers matching L || R.
Definition: PatternMatch.h:239
cst_pred_ty< icmp_pred_with_threshold > m_SpecificInt_ICMP(ICmpInst::Predicate Predicate, const APInt &Threshold)
Match an integer or vector with every element comparing 'pred' (eg/ne/...) to Threshold.
Definition: PatternMatch.h:700
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
@ Offset
Definition: DWP.cpp:477
detail::zippy< detail::zip_shortest, T, U, Args... > zip(T &&t, U &&u, Args &&...args)
zip iterator for two or more iteratable types.
Definition: STLExtras.h:860
OverflowResult
@ NeverOverflows
Never overflows.
@ AlwaysOverflowsHigh
Always overflows in the direction of signed/unsigned max value.
@ AlwaysOverflowsLow
Always overflows in the direction of signed/unsigned min value.
@ MayOverflow
May or may not overflow.
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1744
LLVM_ABI bool isKnownNeverInfinity(const Value *V, const SimplifyQuery &SQ, unsigned Depth=0)
Return true if the floating-point scalar value is not an infinity or if the floating-point vector val...
LLVM_ABI bool isSignBitCheck(ICmpInst::Predicate Pred, const APInt &RHS, bool &TrueIfSigned)
Given an exploded icmp instruction, return true if the comparison only checks the sign bit.
LLVM_ABI Value * stripNullTest(Value *V)
Returns the inner value X if the expression has the form f(X) where f(X) == 0 if and only if X == 0,...
LLVM_ABI Constant * ConstantFoldCompareInstOperands(unsigned Predicate, Constant *LHS, Constant *RHS, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, const Instruction *I=nullptr)
Attempt to constant fold a compare instruction (icmp/fcmp) with the specified operands.
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
Definition: STLExtras.h:663
LLVM_ABI Value * simplifyFCmpInst(CmpPredicate Predicate, Value *LHS, Value *RHS, FastMathFlags FMF, const SimplifyQuery &Q)
Given operands for an FCmpInst, fold the result or return null.
int ilogb(const APFloat &Arg)
Returns the exponent of the internal representation of the APFloat.
Definition: APFloat.h:1534
LLVM_ABI ConstantRange computeConstantRange(const Value *V, bool ForSigned, bool UseInstrInfo=true, AssumptionCache *AC=nullptr, const Instruction *CtxI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Determine the possible constant range of an integer or vector of integer value.
LLVM_ABI Constant * ConstantFoldExtractValueInstruction(Constant *Agg, ArrayRef< unsigned > Idxs)
Attempt to constant fold an extractvalue instruction with the specified operands and indices.
LLVM_ABI bool MaskedValueIsZero(const Value *V, const APInt &Mask, const SimplifyQuery &SQ, unsigned Depth=0)
Return true if 'V & Mask' is known to be zero.
int countr_zero(T Val)
Count number of 0's from the least significant bit to the most stopping at the first 1.
Definition: bit.h:157
LLVM_ABI Value * simplifyAddInst(Value *LHS, Value *RHS, bool IsNSW, bool IsNUW, const SimplifyQuery &Q)
Given operands for an Add, fold the result or return null.
LLVM_ABI Constant * ConstantFoldConstant(const Constant *C, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr)
ConstantFoldConstant - Fold the constant using the specified DataLayout.
LLVM_ABI bool isSplatValue(const Value *V, int Index=-1, unsigned Depth=0)
Return true if each element of the vector value V is poisoned or equal to every other non-poisoned el...
unsigned Log2_32(uint32_t Value)
Return the floor log base 2 of the specified value, -1 if the value is zero.
Definition: MathExtras.h:336
int countl_zero(T Val)
Count number of 0's from the most significant bit to the least stopping at the first 1.
Definition: bit.h:203
LLVM_ABI Value * emitGEPOffset(IRBuilderBase *Builder, const DataLayout &DL, User *GEP, bool NoAssumptions=false)
Given a getelementptr instruction/constantexpr, emit the code necessary to compute the offset from th...
Definition: Local.cpp:22
constexpr unsigned MaxAnalysisRecursionDepth
Definition: ValueTracking.h:47
LLVM_ABI Constant * ConstantFoldUnaryOpOperand(unsigned Opcode, Constant *Op, const DataLayout &DL)
Attempt to constant fold a unary operation with the specified operand.
LLVM_ABI bool isKnownNegative(const Value *V, const SimplifyQuery &SQ, unsigned Depth=0)
Returns true if the given value is known be negative (i.e.
SelectPatternFlavor
Specific patterns of select instructions we can match.
@ SPF_UNKNOWN
LLVM_ABI bool impliesPoison(const Value *ValAssumedPoison, const Value *V)
Return true if V is poison given that ValAssumedPoison is already poison.
LLVM_ABI bool isFinite(const Loop *L)
Return true if this loop can be assumed to run for a finite number of iterations.
Definition: LoopInfo.cpp:1164
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
APFloat scalbn(APFloat X, int Exp, APFloat::roundingMode RM)
Returns: X * 2^Exp for integral exponents.
Definition: APFloat.h:1543
LLVM_ABI void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOn...
LLVM_ABI SelectPatternResult matchSelectPattern(Value *V, Value *&LHS, Value *&RHS, Instruction::CastOps *CastOp=nullptr, unsigned Depth=0)
Pattern match integer [SU]MIN, [SU]MAX and ABS idioms, returning the kind and providing the out param...
LLVM_ABI bool NullPointerIsDefined(const Function *F, unsigned AS=0)
Check whether null pointer dereferencing is considered undefined behavior for a given function or an ...
Definition: Function.cpp:1172
bool none_of(R &&Range, UnaryPredicate P)
Provide wrappers to std::none_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1758
LLVM_ABI Value * simplifyICmpInst(CmpPredicate Pred, Value *LHS, Value *RHS, const SimplifyQuery &Q)
Given operands for an ICmpInst, fold the result or return null.
LLVM_ABI Constant * ConstantFoldCastOperand(unsigned Opcode, Constant *C, Type *DestTy, const DataLayout &DL)
Attempt to constant fold a cast with the specified operand.
LLVM_ABI Constant * ConstantFoldBinaryOpOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL)
Attempt to constant fold a binary operation with the specified operands.
LLVM_ABI bool isKnownNonZero(const Value *V, const SimplifyQuery &Q, unsigned Depth=0)
Return true if the given value is known to be non-zero when defined.
@ Other
Any other memory.
@ First
Helpers to iterate all locations in the MemoryEffectsBase class.
LLVM_ABI Value * simplifyBinOp(unsigned Opcode, Value *LHS, Value *RHS, const SimplifyQuery &Q)
Given operands for a BinaryOperator, fold the result or return null.
@ UMin
Unsigned integer min implemented in terms of select(cmp()).
@ Mul
Product of integers.
@ Xor
Bitwise or logical XOR of integers.
@ SMax
Signed integer max implemented in terms of select(cmp()).
@ SMin
Signed integer min implemented in terms of select(cmp()).
@ Sub
Subtraction of integers.
@ Add
Sum of integers.
@ UMax
Unsigned integer max implemented in terms of select(cmp()).
LLVM_ABI bool isKnownNonEqual(const Value *V1, const Value *V2, const SimplifyQuery &SQ, unsigned Depth=0)
Return true if the given values are known to be non-equal when defined.
DWARFExpression::Operation Op
LLVM_ABI bool PointerMayBeCaptured(const Value *V, bool ReturnCaptures, unsigned MaxUsesToExplore=0)
PointerMayBeCaptured - Return true if this pointer value may be captured by the enclosing function (w...
constexpr unsigned BitWidth
Definition: BitmaskEnum.h:223
auto count_if(R &&Range, UnaryPredicate P)
Wrapper function around std::count_if to count the number of times an element satisfying a given pred...
Definition: STLExtras.h:1980
LLVM_ABI bool isKnownNeverNaN(const Value *V, const SimplifyQuery &SQ, unsigned Depth=0)
Return true if the floating-point scalar value is not a NaN or if the floating-point vector value has...
LLVM_ABI std::optional< std::pair< CmpPredicate, Constant * > > getFlippedStrictnessPredicateAndConstant(CmpPredicate Pred, Constant *C)
Convert an integer comparison with a constant RHS into an equivalent form with the strictness flipped...
bool all_equal(std::initializer_list< T > Values)
Returns true if all Values in the initializer lists are equal or the list.
Definition: STLExtras.h:2127
LLVM_ABI bool isKnownToBeAPowerOfTwo(const Value *V, const DataLayout &DL, bool OrZero=false, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Return true if the given value is known to have exactly one bit set when defined.
@ Continue
Definition: DWP.h:22
LLVM_ABI const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=MaxLookupSearchDepth)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
LLVM_ABI bool isKnownPositive(const Value *V, const SimplifyQuery &SQ, unsigned Depth=0)
Returns true if the given value is known be positive (i.e.
LLVM_ABI bool isKnownNonNegative(const Value *V, const SimplifyQuery &SQ, unsigned Depth=0)
Returns true if the give value is known to be non-negative.
LLVM_ABI std::optional< bool > isImpliedCondition(const Value *LHS, const Value *RHS, const DataLayout &DL, bool LHSIsTrue=true, unsigned Depth=0)
Return true if RHS is known to be implied true by LHS.
std::optional< DecomposedBitTest > decomposeBitTestICmp(Value *LHS, Value *RHS, CmpInst::Predicate Pred, bool LookThroughTrunc=true, bool AllowNonZeroC=false, bool DecomposeAnd=false)
Decompose an icmp into the form ((X & Mask) pred C) if possible.
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition: BitVector.h:858
#define NC
Definition: regutils.h:42
Value * materialize(InstCombiner::BuilderTy &Builder) const
static OffsetResult value(Value *V)
static OffsetResult select(Value *Cond, Value *TrueV, Value *FalseV)
static OffsetResult invalid()
static constexpr roundingMode rmNearestTiesToEven
Definition: APFloat.h:304
static constexpr roundingMode rmTowardZero
Definition: APFloat.h:308
This callback is used in conjunction with PointerMayBeCaptured.
static CommonPointerBase compute(Value *LHS, Value *RHS)
Represent subnormal handling kind for floating point instruction inputs and outputs.
@ PreserveSign
The sign of a flushed-to-zero number is preserved in the sign of 0.
@ PositiveZero
Denormals are flushed to positive zero.
static constexpr DenormalMode getIEEE()
bool isNonNegative() const
Returns true if this value is known to be non-negative.
Definition: KnownBits.h:101
bool isZero() const
Returns true if value is all zero.
Definition: KnownBits.h:80
unsigned countMinTrailingZeros() const
Returns the minimum number of trailing zero bits.
Definition: KnownBits.h:235
unsigned countMaxTrailingZeros() const
Returns the maximum number of trailing zero bits possible.
Definition: KnownBits.h:267
APInt getSignedMaxValue() const
Return the maximal signed value possible given these KnownBits.
Definition: KnownBits.h:144
unsigned countMaxPopulation() const
Returns the maximum number of bits that could be one.
Definition: KnownBits.h:282
unsigned getBitWidth() const
Get the bit width of this value.
Definition: KnownBits.h:44
bool isConstant() const
Returns true if we know the value of all bits.
Definition: KnownBits.h:54
unsigned countMinLeadingZeros() const
Returns the minimum number of leading zero bits.
Definition: KnownBits.h:241
APInt getMaxValue() const
Return the maximal unsigned value possible given these KnownBits.
Definition: KnownBits.h:138
APInt getMinValue() const
Return the minimal unsigned value possible given these KnownBits.
Definition: KnownBits.h:122
bool isStrictlyPositive() const
Returns true if this value is known to be positive.
Definition: KnownBits.h:107
bool isNegative() const
Returns true if this value is known to be negative.
Definition: KnownBits.h:98
unsigned countMinPopulation() const
Returns the number of bits known to be one.
Definition: KnownBits.h:279
APInt getSignedMinValue() const
Return the minimal signed value possible given these KnownBits.
Definition: KnownBits.h:128
const APInt & getConstant() const
Returns the value when all bits have a known value.
Definition: KnownBits.h:60
Matching combinators.
SelectPatternFlavor Flavor
static bool isMinOrMax(SelectPatternFlavor SPF)
When implementing this min/max pattern as fcmp; select, does the fcmp have to be ordered?
const DataLayout & DL
Definition: SimplifyQuery.h:72
const Instruction * CxtI
Definition: SimplifyQuery.h:76
const DominatorTree * DT
Definition: SimplifyQuery.h:74
SimplifyQuery getWithInstruction(const Instruction *I) const
AssumptionCache * AC
Definition: SimplifyQuery.h:75
SimplifyQuery getWithoutDomCondCache() const
A MapVector that performs no allocations if smaller than a certain size.
Definition: MapVector.h:249
Capture information for a specific Use.