docs/doxygen/InstCombineCalls_8cpp_source.html

//===- InstCombineCalls.cpp -----------------------------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file implements the visitCall, visitInvoke, and visitCallBr functions.

//

//===----------------------------------------------------------------------===//


#include "InstCombineInternal.h"

#include "llvm/ADT/APFloat.h"

#include "llvm/ADT/APInt.h"

#include "llvm/ADT/APSInt.h"

#include "llvm/ADT/ArrayRef.h"

#include "llvm/ADT/STLFunctionalExtras.h"

#include "llvm/ADT/SmallBitVector.h"

#include "llvm/ADT/SmallVector.h"

#include "llvm/ADT/Statistic.h"

#include "llvm/Analysis/AliasAnalysis.h"

#include "llvm/Analysis/AssumeBundleQueries.h"

#include "llvm/Analysis/AssumptionCache.h"

#include "llvm/Analysis/InstructionSimplify.h"

#include "llvm/Analysis/Loads.h"

#include "llvm/Analysis/MemoryBuiltins.h"

#include "llvm/Analysis/ValueTracking.h"

#include "llvm/Analysis/VectorUtils.h"

#include "llvm/IR/AttributeMask.h"

#include "llvm/IR/Attributes.h"

#include "llvm/IR/BasicBlock.h"

#include "llvm/IR/Constant.h"

#include "llvm/IR/Constants.h"

#include "llvm/IR/DataLayout.h"

#include "llvm/IR/DebugInfo.h"

#include "llvm/IR/DerivedTypes.h"

#include "llvm/IR/Function.h"

#include "llvm/IR/GlobalVariable.h"

#include "llvm/IR/InlineAsm.h"

#include "llvm/IR/InstrTypes.h"

#include "llvm/IR/Instruction.h"

#include "llvm/IR/Instructions.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/Intrinsics.h"

#include "llvm/IR/IntrinsicsAArch64.h"

#include "llvm/IR/IntrinsicsAMDGPU.h"

#include "llvm/IR/IntrinsicsARM.h"

#include "llvm/IR/IntrinsicsHexagon.h"

#include "llvm/IR/LLVMContext.h"

#include "llvm/IR/Metadata.h"

#include "llvm/IR/PatternMatch.h"

#include "llvm/IR/Statepoint.h"

#include "llvm/IR/Type.h"

#include "llvm/IR/User.h"

#include "llvm/IR/Value.h"

#include "llvm/IR/ValueHandle.h"

#include "llvm/Support/AtomicOrdering.h"

#include "llvm/Support/Casting.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Support/Compiler.h"

#include "llvm/Support/Debug.h"

#include "llvm/Support/ErrorHandling.h"

#include "llvm/Support/KnownBits.h"

#include "llvm/Support/KnownFPClass.h"

#include "llvm/Support/MathExtras.h"

#include "llvm/Support/TypeSize.h"

#include "llvm/Support/raw_ostream.h"

#include "llvm/Transforms/InstCombine/InstCombiner.h"

#include "llvm/Transforms/Utils/AssumeBundleBuilder.h"

#include "llvm/Transforms/Utils/Local.h"

#include "llvm/Transforms/Utils/SimplifyLibCalls.h"

#include <algorithm>

#include <cassert>

#include <cstdint>

#include <optional>

#include <utility>

#include <vector>


#define DEBUG_TYPE "instcombine"

#include "llvm/Transforms/Utils/InstructionWorklist.h"


using namespace llvm;

using namespace PatternMatch;


STATISTIC(NumSimplified, "Number of library calls simplified");


// Command-line option "instcombine-guard-widening-window"; defaults to 3.
// Per its description it limits how many instructions may be bypassed while
// looking for another guard. NOTE(review): the code that reads this option is
// not in this part of the file - confirm the exact semantics at the use site.
static cl::opt<unsigned> GuardWideningWindow(

    "instcombine-guard-widening-window",

    cl::init(3),

    cl::desc("How wide an instruction window to bypass looking for "

             "another guard"));


/// Return the type that \p Ty is promoted to when it is passed through a
/// va_arg area: integer types narrower than 32 bits become i32, every other
/// type is returned unchanged.
static Type *getPromotedType(Type *Ty) {
  auto *IntTy = dyn_cast<IntegerType>(Ty);
  // Non-integers and integers that are already at least 32 bits wide are not
  // promoted.
  if (!IntTy || IntTy->getBitWidth() >= 32)
    return Ty;
  return Type::getInt32Ty(Ty->getContext());
}


/// Recognize a memcpy/memmove whose source is an alloca that is trivially
/// unused otherwise: the raw source must be an alloca with a single use,
/// optionally reached through a chain of GEPs that each have a single use.
/// TODO: This should probably be integrated with visitAllocSites, but that
/// requires a deeper change to allow either unread or unwritten objects.
static bool hasUndefSource(AnyMemTransferInst *MI) {
  Value *Ptr = MI->getRawSource();
  // Walk up through GEPs towards the underlying object; any GEP with another
  // user means the memory may be observed elsewhere.
  while (auto *GEP = dyn_cast<GetElementPtrInst>(Ptr)) {
    if (!GEP->hasOneUse())
      return false;
    Ptr = GEP->getOperand(0);
  }
  return isa<AllocaInst>(Ptr) && Ptr->hasOneUse();
}


/// Simplify a memcpy/memmove-like transfer intrinsic (plain or atomic).
///
/// The steps are attempted in order; the first one that applies ends the
/// visit:
///   1. Raise the recorded destination, then source, alignment to the known
///      alignment of the corresponding pointer.
///   2. If the destination cannot be modified, or the source is an otherwise
///      unused alloca and the transfer is not volatile, shrink the transfer to
///      zero bytes so that it is deleted on the next iteration.
///   3. Replace a constant-length transfer of 1, 2, 4 or 8 bytes with a single
///      integer load/store pair and shrink the original transfer to zero
///      bytes.
///
/// \returns \p MI if it was modified, nullptr if nothing was done.
Instruction *InstCombinerImpl::SimplifyAnyMemTransfer(AnyMemTransferInst *MI) {
  // Set the size of the copy to 0, it will be deleted on the next iteration.
  auto ShrinkToNothing = [MI]() -> Instruction * {
    MI->setLength((uint64_t)0);
    return MI;
  };

  const Align KnownDstAlign =
      getKnownAlignment(MI->getRawDest(), DL, MI, &AC, &DT);
  const MaybeAlign CopyDstAlign = MI->getDestAlign();
  if (!CopyDstAlign || *CopyDstAlign < KnownDstAlign) {
    MI->setDestAlignment(KnownDstAlign);
    return MI;
  }

  const Align KnownSrcAlign =
      getKnownAlignment(MI->getRawSource(), DL, MI, &AC, &DT);
  const MaybeAlign CopySrcAlign = MI->getSourceAlign();
  if (!CopySrcAlign || *CopySrcAlign < KnownSrcAlign) {
    MI->setSourceAlignment(KnownSrcAlign);
    return MI;
  }
  // From here on both CopyDstAlign and CopySrcAlign hold a value.

  // A store to a location which is known constant must be storing the value
  // that is already there (else the memory wouldn't be constant), so the
  // transfer is a noop.
  if (!isModSet(AA->getModRefInfoMask(MI->getDest())))
    return ShrinkToNothing();

  // If the source is provably undef, the memcpy/memmove doesn't do anything
  // (unless the transfer is volatile).
  if (hasUndefSource(MI) && !MI->isVolatile())
    return ShrinkToNothing();

  // The remaining transform needs a constant length.
  auto *LengthC = dyn_cast<ConstantInt>(MI->getLength());
  if (!LengthC)
    return nullptr;

  // See if the size is something we can handle with a single primitive
  // load/store. A single load+store correctly handles overlapping memory in
  // the memmove case.
  const uint64_t Size = LengthC->getLimitedValue();
  assert(Size && "0-sized memory transferring should be removed already.");

  // Only 1/2/4/8 byte transfers are expanded.
  if (Size > 8 || (Size & (Size - 1)) != 0)
    return nullptr;

  // For an atomic transfer with alignment below the size we would introduce
  // an unaligned atomic access, which CodeGen later turns into a libcall.
  // That is no evident performance gain, so it is disabled.
  if (MI->isAtomic() && (*CopyDstAlign < Size || *CopySrcAlign < Size))
    return nullptr;

  // Use an integer load+store unless we can find something better.
  IntegerType *AccessTy = IntegerType::get(MI->getContext(), Size * 8);

  // If the memcpy has metadata describing the members, see if we can get the
  // TBAA, scope and noalias tags describing our copy.
  const AAMDNodes AccessAAMD = MI->getAAMetadata().adjustForAccess(Size);
  MDNode *const ParallelLoopMD =
      MI->getMetadata(LLVMContext::MD_mem_parallel_loop_access);
  MDNode *const AccessGroupMD = MI->getMetadata(LLVMContext::MD_access_group);

  // Attach the metadata shared by the new load and the new store.
  auto TagAccess = [&](Instruction *Access) {
    Access->setAAMetadata(AccessAAMD);
    if (ParallelLoopMD)
      Access->setMetadata(LLVMContext::MD_mem_parallel_loop_access,
                          ParallelLoopMD);
    if (AccessGroupMD)
      Access->setMetadata(LLVMContext::MD_access_group, AccessGroupMD);
  };

  Value *SrcPtr = MI->getArgOperand(1);
  Value *DstPtr = MI->getArgOperand(0);

  LoadInst *NewLoad = Builder.CreateLoad(AccessTy, SrcPtr);
  // Alignment from the mem intrinsic will be better, so use it.
  NewLoad->setAlignment(*CopySrcAlign);
  TagAccess(NewLoad);

  StoreInst *NewStore = Builder.CreateStore(NewLoad, DstPtr);
  // Alignment from the mem intrinsic will be better, so use it.
  NewStore->setAlignment(*CopyDstAlign);
  TagAccess(NewStore);
  NewStore->copyMetadata(*MI, LLVMContext::MD_DIAssignID);

  // non-atomics can be volatile
  if (auto *MT = dyn_cast<MemTransferInst>(MI)) {
    const bool IsVolatile = MT->isVolatile();
    NewLoad->setVolatile(IsVolatile);
    NewStore->setVolatile(IsVolatile);
  }

  // atomics have to be unordered
  if (MI->isAtomic()) {
    NewLoad->setOrdering(AtomicOrdering::Unordered);
    NewStore->setOrdering(AtomicOrdering::Unordered);
  }

  return ShrinkToNothing();
}


/// Simplify a memset-like intrinsic (plain or atomic).
///
/// In order: raise the recorded destination alignment to the known alignment;
/// shrink the memset to zero bytes when the destination cannot be modified or
/// the fill value is undef; and replace a memset with constant i8 fill and
/// constant length 1, 2, 4 or 8 with a single integer store.
///
/// \returns \p MI if it was modified, nullptr if nothing was done.
Instruction *InstCombinerImpl::SimplifyAnyMemSet(AnyMemSetInst *MI) {
  // Set the size of the copy to 0, it will be deleted on the next iteration.
  auto ShrinkToNothing = [MI]() -> Instruction * {
    MI->setLength((uint64_t)0);
    return MI;
  };

  const Align KnownDstAlign =
      getKnownAlignment(MI->getDest(), DL, MI, &AC, &DT);
  const MaybeAlign RecordedAlign = MI->getDestAlign();
  if (!RecordedAlign || *RecordedAlign < KnownDstAlign) {
    MI->setDestAlignment(KnownDstAlign);
    return MI;
  }

  // A store to a location which is known constant must be storing the value
  // that is already there (else the memory wouldn't be constant), so the
  // memset is a noop.
  if (!isModSet(AA->getModRefInfoMask(MI->getDest())))
    return ShrinkToNothing();

  // Remove memset with an undef value.
  // FIXME: This is technically incorrect because it might overwrite a poison
  // value. Change to PoisonValue once #52930 is resolved.
  if (isa<UndefValue>(MI->getValue()))
    return ShrinkToNothing();

  // The store expansion needs a constant length and a constant i8 fill value.
  auto *LengthC = dyn_cast<ConstantInt>(MI->getLength());
  auto *FillByteC = dyn_cast<ConstantInt>(MI->getValue());
  if (!LengthC || !FillByteC || !FillByteC->getType()->isIntegerTy(8))
    return nullptr;

  const uint64_t NumBytes = LengthC->getLimitedValue();
  assert(NumBytes && "0-sized memory setting should be removed already.");
  const Align StoreAlign = MI->getDestAlign().valueOrOne();

  // For an atomic memset with alignment below the size we would introduce an
  // unaligned atomic access, which CodeGen later turns into a libcall. That
  // is no evident performance gain, so it is disabled.
  if (MI->isAtomic() && StoreAlign < NumBytes)
    return nullptr;

  // memset(s,c,n) -> store s, c (for n=1,2,4,8)
  if (NumBytes > 8 || !isPowerOf2_32((uint32_t)NumBytes))
    return nullptr;

  Value *DstPtr = MI->getDest();

  // Splat the fill byte across an integer of the full store width.
  Constant *WideFill = ConstantInt::get(
      MI->getContext(), APInt::getSplat(NumBytes * 8, FillByteC->getValue()));
  StoreInst *NewStore = Builder.CreateStore(WideFill, DstPtr, MI->isVolatile());
  NewStore->copyMetadata(*MI, LLVMContext::MD_DIAssignID);

  // Assignment markers that refer to the byte-sized fill constant are
  // redirected to the widened constant that is actually stored.
  for (DbgVariableRecord *Marker : at::getDVRAssignmentMarkers(NewStore)) {
    if (llvm::is_contained(Marker->location_ops(), FillByteC))
      Marker->replaceVariableLocationOp(FillByteC, WideFill);
  }

  NewStore->setAlignment(StoreAlign);
  if (MI->isAtomic())
    NewStore->setOrdering(AtomicOrdering::Unordered);

  return ShrinkToNothing();
}


// Simplify a masked load (operand 0: pointer, operand 1: mask, operand 2:
// pass-through value). Returns the replacement value, or nullptr if no
// simplification applies.
//
// TODO, Obvious Missing Transforms:
// * Narrow width by halves excluding zero/undef lanes
Value *InstCombinerImpl::simplifyMaskedLoad(IntrinsicInst &II) {
  Value *Ptr = II.getArgOperand(0);
  Value *Mask = II.getArgOperand(1);
  const Align LoadAlign = II.getParamAlign(0).valueOrOne();

  // Emit an ordinary vector load of the whole value, carrying over the
  // intrinsic's metadata.
  auto EmitUnmaskedLoad = [&]() {
    LoadInst *Load = Builder.CreateAlignedLoad(II.getType(), Ptr, LoadAlign,
                                               "unmaskedload");
    Load->copyMetadata(II);
    return Load;
  };

  // If the mask is all ones or undefs, this is a plain vector load of the 1st
  // argument.
  if (maskIsAllOneOrUndef(Mask))
    return EmitUnmaskedLoad();

  // If we can unconditionally load from this address, replace with a
  // load/select idiom. TODO: use DT for context sensitive query
  if (!isDereferenceablePointer(Ptr, II.getType(), II.getDataLayout(), &II,
                                &AC))
    return nullptr;

  LoadInst *Loaded = EmitUnmaskedLoad();
  return Builder.CreateSelect(Mask, Loaded, II.getArgOperand(2));
}


// Simplify a masked store (operand 0: value, operand 1: pointer, operand 2:
// mask). Only constant masks are handled. Returns the replacement or modified
// instruction, or nullptr if no simplification applies.
//
// TODO, Obvious Missing Transforms:
// * Single constant active lane -> store
// * Narrow width by halves excluding zero/undef lanes
Instruction *InstCombinerImpl::simplifyMaskedStore(IntrinsicInst &II) {
  auto *MaskC = dyn_cast<Constant>(II.getArgOperand(2));
  if (!MaskC)
    return nullptr;

  // If the mask is all zeros, this instruction does nothing.
  if (maskIsAllZeroOrUndef(MaskC))
    return eraseInstFromFunction(II);

  // If the mask is all ones, this is a plain vector store of the 1st argument.
  if (maskIsAllOneOrUndef(MaskC)) {
    Value *Ptr = II.getArgOperand(1);
    const Align StoreAlign = II.getParamAlign(1).valueOrOne();
    auto *PlainStore =
        new StoreInst(II.getArgOperand(0), Ptr, /*isVolatile=*/false,
                      StoreAlign);
    PlainStore->copyMetadata(II);
    return PlainStore;
  }

  // The per-lane analysis below is not done for scalable vector masks.
  if (isa<ScalableVectorType>(MaskC->getType()))
    return nullptr;

  // Use masked off lanes to simplify operands via SimplifyDemandedVectorElts
  const APInt ActiveLanes = possiblyDemandedEltsInMask(MaskC);
  APInt PoisonLanes(ActiveLanes.getBitWidth(), 0);
  Value *Simplified =
      SimplifyDemandedVectorElts(II.getOperand(0), ActiveLanes, PoisonLanes);
  if (!Simplified)
    return nullptr;
  return replaceOperand(II, 0, Simplified);
}


// Simplify a masked gather (operand 0: vector of pointers, operand 1: mask).
// The only fold implemented is: all-ones constant mask plus a splat pointer
// vector -> one scalar load that is broadcast to every lane.
//
// TODO, Obvious Missing Transforms:
// * Single constant active lane load -> load
// * Dereferenceable address & few lanes -> scalarize speculative load/selects
// * Adjacent vector addresses -> masked.load
// * Narrow width by halves excluding zero/undef lanes
// * Vector incrementing address -> vector masked load
Instruction *InstCombinerImpl::simplifyMaskedGather(IntrinsicInst &II) {
  auto *MaskC = dyn_cast<Constant>(II.getArgOperand(1));
  if (!MaskC || !MaskC->isAllOnesValue())
    return nullptr;

  // Vector splat address w/known mask -> scalar load
  // Every lane reloads the same value, so load it once through the splatted
  // pointer and broadcast the result.
  Value *ScalarPtr = getSplatValue(II.getArgOperand(0));
  if (!ScalarPtr)
    return nullptr;

  auto *ResultTy = cast<VectorType>(II.getType());
  const Align LoadAlign = II.getParamAlign(0).valueOrOne();
  LoadInst *Scalar = Builder.CreateAlignedLoad(ResultTy->getElementType(),
                                               ScalarPtr, LoadAlign,
                                               "load.scalar");
  Value *Broadcast =
      Builder.CreateVectorSplat(ResultTy->getElementCount(), Scalar,
                                "broadcast");
  return replaceInstUsesWith(II, cast<Instruction>(Broadcast));
}


// Simplify a masked scatter (operand 0: value vector, operand 1: vector of
// pointers, operand 2: mask). Only constant masks are handled. Returns the
// replacement or modified instruction, or nullptr if nothing applies.
//
// TODO, Obvious Missing Transforms:
// * Single constant active lane -> store
// * Adjacent vector addresses -> masked.store
// * Narrow store width by halves excluding zero/undef lanes
// * Vector incrementing address -> vector masked store
Instruction *InstCombinerImpl::simplifyMaskedScatter(IntrinsicInst &II) {
  auto *MaskC = dyn_cast<Constant>(II.getArgOperand(2));
  if (!MaskC)
    return nullptr;

  // If the mask is all zeros, a scatter does nothing.
  if (maskIsAllZeroOrUndef(MaskC))
    return eraseInstFromFunction(II);

  Value *const Data = II.getArgOperand(0);
  Value *const Ptrs = II.getArgOperand(1);

  // Vector splat address -> scalar store
  if (Value *ScalarPtr = getSplatValue(Ptrs)) {
    const Align StoreAlign = II.getParamAlign(1).valueOrOne();

    // Build the (not yet inserted) scalar store through the splatted pointer,
    // carrying over the intrinsic's metadata.
    auto MakeScalarStore = [&](Value *Scalar) -> Instruction * {
      auto *Store = new StoreInst(Scalar, ScalarPtr, /*IsVolatile=*/false,
                                  StoreAlign);
      Store->copyMetadata(II);
      return Store;
    };

    // scatter(splat(value), splat(ptr), non-zero-mask) -> store value, ptr
    if (Value *ScalarData = getSplatValue(Data))
      if (maskContainsAllOneOrUndef(MaskC))
        return MakeScalarStore(ScalarData);

    // scatter(vector, splat(ptr), splat(true)) -> store extract(vector,
    // lastlane), ptr
    if (MaskC->isAllOnesValue()) {
      auto *PtrVecTy = cast<VectorType>(Ptrs->getType());
      ElementCount VF = PtrVecTy->getElementCount();
      Value *RunTimeVF = Builder.CreateElementCount(Builder.getInt32Ty(), VF);
      Value *LastLane = Builder.CreateSub(RunTimeVF, Builder.getInt32(1));
      Value *LastElt = Builder.CreateExtractElement(Data, LastLane);
      return MakeScalarStore(LastElt);
    }
  }

  // The per-lane analysis below is not done for scalable vector masks.
  if (isa<ScalableVectorType>(MaskC->getType()))
    return nullptr;

  // Use masked off lanes to simplify operands via SimplifyDemandedVectorElts
  const APInt ActiveLanes = possiblyDemandedEltsInMask(MaskC);
  APInt PoisonLanes(ActiveLanes.getBitWidth(), 0);
  for (unsigned OpIdx : {0u, 1u}) {
    if (Value *Simplified = SimplifyDemandedVectorElts(
            II.getOperand(OpIdx), ActiveLanes, PoisonLanes))
      return replaceOperand(II, OpIdx, Simplified);
  }

  return nullptr;
}


/// Collapse chains of launder.invariant.group / strip.invariant.group:
///   launder(launder(%x)) -> launder(%x)     (the result is not the argument)
///   launder(strip(%x))   -> launder(%x)
///   strip(strip(%x))     -> strip(%x)       (the result is not the argument)
///   strip(launder(%x))   -> strip(%x)
/// This is legal because it preserves the most recent information about
/// the presence or absence of invariant.group.
///
/// \returns the newly built instruction, or nullptr if the argument of \p II
/// is not itself (modulo pointer casts) a launder/strip call.
static Instruction *simplifyInvariantGroupIntrinsic(IntrinsicInst &II,
                                                    InstCombinerImpl &IC) {
  Value *const DirectArg = II.getArgOperand(0)->stripPointerCasts();

  // Look through every nested launder/strip (and the pointer casts between
  // them) to find the innermost pointer.
  Value *Innermost = DirectArg;
  while (auto *Nested = dyn_cast<IntrinsicInst>(Innermost)) {
    const Intrinsic::ID NestedID = Nested->getIntrinsicID();
    const bool IsInvariantGroupOp =
        NestedID == Intrinsic::launder_invariant_group ||
        NestedID == Intrinsic::strip_invariant_group;
    if (!IsInvariantGroupOp)
      break;
    Innermost = Nested->getArgOperand(0)->stripPointerCasts();
  }

  // No launders/strips to remove.
  if (Innermost == DirectArg)
    return nullptr;

  // Re-apply only the outermost operation directly to the innermost pointer.
  Value *Replacement = nullptr;
  switch (II.getIntrinsicID()) {
  case Intrinsic::launder_invariant_group:
    Replacement = IC.Builder.CreateLaunderInvariantGroup(Innermost);
    break;
  case Intrinsic::strip_invariant_group:
    Replacement = IC.Builder.CreateStripInvariantGroup(Innermost);
    break;
  default:
    llvm_unreachable(
        "simplifyInvariantGroupIntrinsic only handles launder and strip");
  }

  // The stripped casts may have changed the address space; cast back to the
  // type of the original call if so.
  const unsigned WantedAS = II.getType()->getPointerAddressSpace();
  if (Replacement->getType()->getPointerAddressSpace() != WantedAS)
    Replacement = IC.Builder.CreateAddrSpaceCast(Replacement, II.getType());

  return cast<Instruction>(Replacement);
}


/// Fold a call to llvm.cttz or llvm.ctlz (asserted on entry).
///
/// Op0 is the value whose zeros are counted and Op1 is the flag that the
/// comments below call 'ZeroIsPoison' / is_zero_poison. The folds are tried in
/// the order written and the first one that matches returns:
///   * ctlz/cttz of bitreverse becomes the opposite count of the operand;
///   * the i1 case;
///   * setting the flag when the only user is a shift that uses the result as
///     its shift amount;
///   * cttz-only and ctlz-only rewrites of the operand;
///   * log2 of a power of two via tryGetLog2;
///   * known-bits based folding to a constant, setting the flag for a non-zero
///     operand, and attaching a return range attribute.
///
/// \returns a newly created instruction, the result of
/// replaceInstUsesWith/replaceOperand on \p IC, \p II itself after a range
/// attribute was added, or nullptr if nothing changed.
static Instruction *foldCttzCtlz(IntrinsicInst &II, InstCombinerImpl &IC) {

  assert((II.getIntrinsicID() == Intrinsic::cttz ||

          II.getIntrinsicID() == Intrinsic::ctlz) &&

         "Expected cttz or ctlz intrinsic");

  bool IsTZ = II.getIntrinsicID() == Intrinsic::cttz;

  Value *Op0 = II.getArgOperand(0);

  Value *Op1 = II.getArgOperand(1);

  Value *X;

  // ctlz(bitreverse(x)) -> cttz(x)

  // cttz(bitreverse(x)) -> ctlz(x)

  if (match(Op0, m_BitReverse(m_Value(X)))) {

    // Pick the opposite intrinsic; the flag operand is passed through as is.
    Intrinsic::ID ID = IsTZ ? Intrinsic::ctlz : Intrinsic::cttz;

    Function *F =

        Intrinsic::getOrInsertDeclaration(II.getModule(), ID, II.getType());

    return CallInst::Create(F, {X, II.getArgOperand(1)});

  }


  if (II.getType()->isIntOrIntVectorTy(1)) {

    // ctlz/cttz i1 Op0 --> not Op0

    if (match(Op1, m_Zero()))

      return BinaryOperator::CreateNot(Op0);

    // If zero is poison, then the input can be assumed to be "true", so the

    // instruction simplifies to "false".

    assert(match(Op1, m_One()) && "Expected ctlz/cttz operand to be 0 or 1");

    return IC.replaceInstUsesWith(II, ConstantInt::getNullValue(II.getType()));

  }


  // If ctlz/cttz is only used as a shift amount, set is_zero_poison to true.

  if (II.hasOneUse() && match(Op1, m_Zero()) &&

      match(II.user_back(), m_Shift(m_Value(), m_Specific(&II)))) {

    // The flag is about to change from false to true; UB-implying attributes
    // and metadata on the call are dropped before doing so.
    II.dropUBImplyingAttrsAndMetadata();

    return IC.replaceOperand(II, 1, IC.Builder.getTrue());

  }


  // Bound by the m_ImmConstant patterns in both branches below.
  Constant *C;


  if (IsTZ) {

    // cttz(-x) -> cttz(x)

    if (match(Op0, m_Neg(m_Value(X))))

      return IC.replaceOperand(II, 0, X);


    // cttz(-x & x) -> cttz(x)

    if (match(Op0, m_c_And(m_Neg(m_Value(X)), m_Deferred(X))))

      return IC.replaceOperand(II, 0, X);


    // cttz(sext(x)) -> cttz(zext(x))

    if (match(Op0, m_OneUse(m_SExt(m_Value(X))))) {

      auto *Zext = IC.Builder.CreateZExt(X, II.getType());

      auto *CttzZext =

          IC.Builder.CreateBinaryIntrinsic(Intrinsic::cttz, Zext, Op1);

      return IC.replaceInstUsesWith(II, CttzZext);

    }


    // Zext doesn't change the number of trailing zeros, so narrow:

    // cttz(zext(x)) -> zext(cttz(x)) if the 'ZeroIsPoison' parameter is 'true'.

    if (match(Op0, m_OneUse(m_ZExt(m_Value(X)))) && match(Op1, m_One())) {

      auto *Cttz = IC.Builder.CreateBinaryIntrinsic(Intrinsic::cttz, X,

                                                    IC.Builder.getTrue());

      auto *ZextCttz = IC.Builder.CreateZExt(Cttz, II.getType());

      return IC.replaceInstUsesWith(II, ZextCttz);

    }


    // cttz(abs(x)) -> cttz(x)

    // cttz(nabs(x)) -> cttz(x)

    // First the select-based abs/nabs idiom, then the llvm.abs intrinsic.
    Value *Y;

    SelectPatternFlavor SPF = matchSelectPattern(Op0, X, Y).Flavor;

    if (SPF == SPF_ABS || SPF == SPF_NABS)

      return IC.replaceOperand(II, 0, X);


    if (match(Op0, m_Intrinsic<Intrinsic::abs>(m_Value(X))))

      return IC.replaceOperand(II, 0, X);


    // cttz(shl(%const, %val), 1) --> add(cttz(%const, 1), %val)

    if (match(Op0, m_Shl(m_ImmConstant(C), m_Value(X))) &&

        match(Op1, m_One())) {

      Value *ConstCttz =

          IC.Builder.CreateBinaryIntrinsic(Intrinsic::cttz, C, Op1);

      return BinaryOperator::CreateAdd(ConstCttz, X);

    }


    // cttz(lshr exact (%const, %val), 1) --> sub(cttz(%const, 1), %val)

    if (match(Op0, m_Exact(m_LShr(m_ImmConstant(C), m_Value(X)))) &&

        match(Op1, m_One())) {

      Value *ConstCttz =

          IC.Builder.CreateBinaryIntrinsic(Intrinsic::cttz, C, Op1);

      return BinaryOperator::CreateSub(ConstCttz, X);

    }


    // cttz(add(lshr(UINT_MAX, %val), 1)) --> sub(width, %val)

    if (match(Op0, m_Add(m_LShr(m_AllOnes(), m_Value(X)), m_One()))) {

      Value *Width =

          ConstantInt::get(II.getType(), II.getType()->getScalarSizeInBits());

      return BinaryOperator::CreateSub(Width, X);

    }

  } else {

    // ctlz(lshr(%const, %val), 1) --> add(ctlz(%const, 1), %val)

    if (match(Op0, m_LShr(m_ImmConstant(C), m_Value(X))) &&

        match(Op1, m_One())) {

      Value *ConstCtlz =

          IC.Builder.CreateBinaryIntrinsic(Intrinsic::ctlz, C, Op1);

      return BinaryOperator::CreateAdd(ConstCtlz, X);

    }


    // ctlz(shl nuw (%const, %val), 1) --> sub(ctlz(%const, 1), %val)

    if (match(Op0, m_NUWShl(m_ImmConstant(C), m_Value(X))) &&

        match(Op1, m_One())) {

      Value *ConstCtlz =

          IC.Builder.CreateBinaryIntrinsic(Intrinsic::ctlz, C, Op1);

      return BinaryOperator::CreateSub(ConstCtlz, X);

    }


    // ctlz(~x & (x - 1)) -> bitwidth - cttz(x, false)

    // (x - 1 is matched in its add-of-all-ones form.)
    if (Op0->hasOneUse() &&

        match(Op0,

              m_c_And(m_Not(m_Value(X)), m_Add(m_Deferred(X), m_AllOnes())))) {

      Type *Ty = II.getType();

      unsigned BitWidth = Ty->getScalarSizeInBits();

      auto *Cttz = IC.Builder.CreateIntrinsic(Intrinsic::cttz, Ty,

                                              {X, IC.Builder.getFalse()});

      auto *Bw = ConstantInt::get(Ty, APInt(BitWidth, BitWidth));

      return IC.replaceInstUsesWith(II, IC.Builder.CreateSub(Bw, Cttz));

    }

  }


  // cttz(Pow2) -> Log2(Pow2)

  // ctlz(Pow2) -> BitWidth - 1 - Log2(Pow2)

  // NOTE(review): the second argument tells tryGetLog2 whether the flag
  // operand is 1; tryGetLog2 is defined outside this view - confirm how it
  // uses that.
  if (auto *R = IC.tryGetLog2(Op0, match(Op1, m_One()))) {

    if (IsTZ)

      return IC.replaceInstUsesWith(II, R);

    BinaryOperator *BO = BinaryOperator::CreateSub(

        ConstantInt::get(R->getType(), R->getType()->getScalarSizeInBits() - 1),

        R);

    // The subtraction is flagged as wrapping in neither the signed nor the
    // unsigned sense.
    BO->setHasNoSignedWrap();

    BO->setHasNoUnsignedWrap();

    return BO;

  }


  KnownBits Known = IC.computeKnownBits(Op0, &II);


  // Create a mask for bits above (ctlz) or below (cttz) the first known one.

  // PossibleZeros is the largest and DefiniteZeros the smallest count that
  // the known bits allow.
  unsigned PossibleZeros = IsTZ ? Known.countMaxTrailingZeros()

                                : Known.countMaxLeadingZeros();

  unsigned DefiniteZeros = IsTZ ? Known.countMinTrailingZeros()

                                : Known.countMinLeadingZeros();


  // If all bits above (ctlz) or below (cttz) the first known one are known

  // zero, this value is constant.

  // FIXME: This should be in InstSimplify because we're replacing an

  // instruction with a constant.

  if (PossibleZeros == DefiniteZeros) {

    auto *C = ConstantInt::get(Op0->getType(), DefiniteZeros);

    return IC.replaceInstUsesWith(II, C);

  }


  // If the input to cttz/ctlz is known to be non-zero,

  // then change the 'ZeroIsPoison' parameter to 'true'

  // because we know the zero behavior can't affect the result.

  // Any known-one bit already proves non-zero; otherwise ask isKnownNonZero.
  if (!Known.One.isZero() ||

      isKnownNonZero(Op0, IC.getSimplifyQuery().getWithInstruction(&II))) {

    if (!match(II.getArgOperand(1), m_One()))

      return IC.replaceOperand(II, 1, IC.Builder.getTrue());

  }


  // Add range attribute since known bits can't completely reflect what we know.

  // Skipped for i1 and when the call already has a range return attribute or
  // !range metadata. The upper bound of the range is exclusive, hence the + 1.
  unsigned BitWidth = Op0->getType()->getScalarSizeInBits();

  if (BitWidth != 1 && !II.hasRetAttr(Attribute::Range) &&

      !II.getMetadata(LLVMContext::MD_range)) {

    ConstantRange Range(APInt(BitWidth, DefiniteZeros),

                        APInt(BitWidth, PossibleZeros + 1));

    II.addRangeRetAttr(Range);

    return &II;

  }


  return nullptr;

}


/// Fold a call to llvm.ctpop (asserted on entry).
///
/// The folds are tried in the order written and the first one that matches
/// returns:
///   * strip bitreverse, bswap and rotates from the operand;
///   * rewrite ctpop(x | -x) and ctpop(~x & (x - 1)) in terms of cttz;
///   * narrow through a single-use zext;
///   * turn an operand with exactly one possibly-set bit into a right shift;
///   * turn a power-of-two-or-zero operand into zext(icmp ne Op0, 0);
///   * tighten the return range attribute from the known bits.
///
/// \returns a newly created instruction, the result of
/// replaceInstUsesWith/replaceOperand on \p IC, \p II itself after its range
/// attribute was updated, or nullptr if nothing changed.
static Instruction *foldCtpop(IntrinsicInst &II, InstCombinerImpl &IC) {

  assert(II.getIntrinsicID() == Intrinsic::ctpop &&

         "Expected ctpop intrinsic");

  Type *Ty = II.getType();

  unsigned BitWidth = Ty->getScalarSizeInBits();

  Value *Op0 = II.getArgOperand(0);

  Value *X, *Y;


  // ctpop(bitreverse(x)) -> ctpop(x)

  // ctpop(bswap(x)) -> ctpop(x)

  if (match(Op0, m_BitReverse(m_Value(X))) || match(Op0, m_BSwap(m_Value(X))))

    return IC.replaceOperand(II, 0, X);


  // ctpop(rot(x)) -> ctpop(x)

  // A rotate is a funnel shift whose first two operands are the same value,
  // hence the X == Y check.
  if ((match(Op0, m_FShl(m_Value(X), m_Value(Y), m_Value())) ||

       match(Op0, m_FShr(m_Value(X), m_Value(Y), m_Value()))) &&

      X == Y)

    return IC.replaceOperand(II, 0, X);


  // ctpop(x | -x) -> bitwidth - cttz(x, false)

  if (Op0->hasOneUse() &&

      match(Op0, m_c_Or(m_Value(X), m_Neg(m_Deferred(X))))) {

    auto *Cttz = IC.Builder.CreateIntrinsic(Intrinsic::cttz, Ty,

                                            {X, IC.Builder.getFalse()});

    auto *Bw = ConstantInt::get(Ty, APInt(BitWidth, BitWidth));

    return IC.replaceInstUsesWith(II, IC.Builder.CreateSub(Bw, Cttz));

  }


  // ctpop(~x & (x - 1)) -> cttz(x, false)

  // (x - 1 is matched in its add-of-all-ones form.)
  if (match(Op0,

            m_c_And(m_Not(m_Value(X)), m_Add(m_Deferred(X), m_AllOnes())))) {

    Function *F =

        Intrinsic::getOrInsertDeclaration(II.getModule(), Intrinsic::cttz, Ty);

    return CallInst::Create(F, {X, IC.Builder.getFalse()});

  }


  // Zext doesn't change the number of set bits, so narrow:

  // ctpop (zext X) --> zext (ctpop X)

  if (match(Op0, m_OneUse(m_ZExt(m_Value(X))))) {

    Value *NarrowPop = IC.Builder.CreateUnaryIntrinsic(Intrinsic::ctpop, X);

    return CastInst::Create(Instruction::ZExt, NarrowPop, Ty);

  }


  KnownBits Known(BitWidth);

  IC.computeKnownBits(Op0, Known, &II);


  // If all bits are zero except for exactly one fixed bit, then the result

  // must be 0 or 1, and we can get that answer by shifting to LSB:

  // ctpop (X & 32) --> (X & 32) >> 5

  // TODO: Investigate removing this as its likely unnecessary given the below

  // `isKnownToBeAPowerOfTwo` check.

  // ~Known.Zero has a bit set for every position not known to be zero.
  if ((~Known.Zero).isPowerOf2())

    return BinaryOperator::CreateLShr(

        Op0, ConstantInt::get(Ty, (~Known.Zero).exactLogBase2()));


  // More generally we can also handle non-constant power of 2 patterns such as

  // shl/shr(Pow2, X), (X & -X), etc... by transforming:

  // ctpop(Pow2OrZero) --> icmp ne X, 0

  if (IC.isKnownToBeAPowerOfTwo(Op0, /* OrZero */ true))

    return CastInst::Create(Instruction::ZExt,

                            IC.Builder.CreateICmp(ICmpInst::ICMP_NE, Op0,

                                                  Constant::getNullValue(Ty)),

                            Ty);


  // Add range attribute since known bits can't completely reflect what we know.

  if (BitWidth != 1) {

    // Start from the range already on the call, or the full range if none.
    ConstantRange OldRange =

        II.getRange().value_or(ConstantRange::getFull(BitWidth));


    // Half-open [Lower, Upper) bounds on the population count from known bits.
    unsigned Lower = Known.countMinPopulation();

    unsigned Upper = Known.countMaxPopulation() + 1;


    // A non-zero operand has at least one set bit. isKnownNonZero is only
    // queried when neither the known bits nor the existing range already
    // exclude a result of 0.
    if (Lower == 0 && OldRange.contains(APInt::getZero(BitWidth)) &&

        isKnownNonZero(Op0, IC.getSimplifyQuery().getWithInstruction(&II)))

      Lower = 1;


    ConstantRange Range(APInt(BitWidth, Lower), APInt(BitWidth, Upper));

    Range = Range.intersectWith(OldRange, ConstantRange::Unsigned);


    // Only report a change when the range actually got tighter.
    if (Range != OldRange) {

      II.addRangeRetAttr(Range);

      return &II;

    }

  }


  return nullptr;

}


/// Convert a table lookup to shufflevector if the mask is constant.
/// This could benefit tbl1 if the mask is { 7,6,5,4,3,2,1,0 }, in
/// which case we could lower the shufflevector with rev64 instructions
/// as it's actually a byte reverse.
///
/// Only <8 x i8> results with a mask made entirely of in-range constant
/// integers are handled; anything else returns nullptr.
static Value *simplifyNeonTbl1(const IntrinsicInst &II,
                               InstCombiner::BuilderTy &Builder) {
  // Bail out if the mask is not a constant.
  auto *MaskC = dyn_cast<Constant>(II.getArgOperand(1));
  if (!MaskC)
    return nullptr;

  // Only perform this transformation for <8 x i8> vector types.
  auto *ResultTy = cast<FixedVectorType>(II.getType());
  const unsigned NumElts = ResultTy->getNumElements();
  if (NumElts != 8 || !ResultTy->getElementType()->isIntegerTy(8))
    return nullptr;

  int ShuffleMask[8];
  for (unsigned Lane = 0; Lane != NumElts; ++Lane) {
    // Every mask element has to be a plain constant integer.
    auto *IndexC =
        dyn_cast_or_null<ConstantInt>(MaskC->getAggregateElement(Lane));
    if (!IndexC)
      return nullptr;

    ShuffleMask[Lane] = IndexC->getLimitedValue();

    // Make sure the mask indices are in range.
    if ((unsigned)ShuffleMask[Lane] >= NumElts)
      return nullptr;
  }

  // Shuffle the table against a zero vector of the same type.
  Value *Table = II.getArgOperand(0);
  Constant *Zeros = Constant::getNullValue(Table->getType());
  return Builder.CreateShuffleVector(Table, Zeros, ArrayRef(ShuffleMask));
}


// Returns true iff the 2 intrinsics have the same operands, limiting the

// comparison to the first NumOperands.


static bool haveSameOperands(const IntrinsicInst &I, const IntrinsicInst &E,

                             unsigned NumOperands) {

  assert(I.arg_size() >= NumOperands && "Not enough operands");

  assert(E.arg_size() >= NumOperands && "Not enough operands");

  for (unsigned i = 0; i < NumOperands; i++)

    if (I.getArgOperand(i) != E.getArgOperand(i))

      return false;

  return true;

}


// Remove trivially empty start/end intrinsic ranges, i.e. a start
// immediately followed by an end (ignoring debuginfo or other
// start/end intrinsics in between). As this handles only the most trivial
// cases, tracking the nesting level is not needed:
//
//   call @llvm.foo.start(i1 0)
//   call @llvm.foo.start(i1 0) ; This one won't be skipped: it will be removed
//   call @llvm.foo.end(i1 0)
//   call @llvm.foo.end(i1 0) ; &I
//
// IsStart decides whether an intrinsic is a start marker for EndI. Returns
// true iff a matching start was found, in which case both it and EndI have
// been erased through IC.
static bool
removeTriviallyEmptyRange(IntrinsicInst &EndI, InstCombinerImpl &IC,
                          std::function<bool(const IntrinsicInst &)> IsStart) {
  // We start from the end intrinsic and scan backwards, so that InstCombine
  // has already processed (and potentially removed) all the instructions
  // before the end intrinsic.
  for (BasicBlock::reverse_iterator It(EndI), Stop(EndI.getParent()->rend());
       It != Stop; ++It) {
    // Any non-intrinsic instruction ends the scan.
    auto *Candidate = dyn_cast<IntrinsicInst>(&*It);
    if (!Candidate)
      break;

    // Debug/pseudo instructions and further end markers of the same kind are
    // stepped over.
    if (Candidate->isDebugOrPseudoInst() ||
        Candidate->getIntrinsicID() == EndI.getIntrinsicID())
      continue;

    // Any other intrinsic that is not a start marker ends the scan.
    if (!IsStart(*Candidate))
      break;

    // Skip start intrinsics that don't pair with this end intrinsic.
    if (!haveSameOperands(EndI, *Candidate, EndI.arg_size()))
      continue;

    IC.eraseInstFromFunction(*Candidate);
    IC.eraseInstFromFunction(EndI);
    return true;
  }

  return false;
}


/// Try to erase a va_end together with an immediately preceding va_start or
/// va_copy that operates on the same arguments. Always returns nullptr; any
/// erasure is performed by removeTriviallyEmptyRange.
Instruction *InstCombinerImpl::visitVAEndInst(VAEndInst &I) {
  auto OpensRange = [&I](const IntrinsicInst &II) {
    switch (II.getIntrinsicID()) {
    case Intrinsic::vastart:
      return true;
    case Intrinsic::vacopy:
      // Bail out on the case where the source va_list of a va_copy is
      // destroyed immediately by a follow-up va_end.
      return I.getArgOperand(0) != II.getArgOperand(1);
    default:
      return false;
    }
  };
  removeTriviallyEmptyRange(I, *this, OpensRange);
  return nullptr;
}


/// If the first argument of \p Call is a constant and the second is not, swap
/// the two arguments in place so the constant ends up second.
/// \returns \p Call when a swap happened, nullptr otherwise.
static CallInst *canonicalizeConstantArg0ToArg1(CallInst &Call) {
  assert(Call.arg_size() > 1 && "Need at least 2 args to swap");
  Value *First = Call.getArgOperand(0);
  Value *Second = Call.getArgOperand(1);

  // Nothing to do unless exactly the first argument is the constant one.
  if (!isa<Constant>(First) || isa<Constant>(Second))
    return nullptr;

  Call.setArgOperand(0, Second);
  Call.setArgOperand(1, First);
  return &Call;
}


/// Builds the {result, overflow} aggregate for the overflow intrinsic \p II
/// from an arbitrary \p Result value and a constant \p Overflow flag. The
/// returned insertvalue instruction is not inserted into a block here.
static Instruction *createOverflowTuple(IntrinsicInst *II, Value *Result,
                                        Constant *Overflow) {
  auto *TupleTy = cast<StructType>(II->getType());

  // Start from the constant {poison, Overflow} and then insert the result
  // into field 0.
  Constant *Fields[] = {PoisonValue::get(Result->getType()), Overflow};
  Constant *Skeleton = ConstantStruct::get(TupleTy, Fields);
  return InsertValueInst::Create(Skeleton, Result, 0);
}


/// Common folds for the with-overflow intrinsics. Either the generic
/// overflow-check optimization produces a result/overflow pair, or a recorded
/// assumption that is valid in the context of \p II states that the extracted
/// overflow bit is false, in which case a plain no-wrap binary operation is
/// emitted instead.
/// \returns the replacement tuple instruction, or nullptr if nothing applied.
Instruction *
InstCombinerImpl::foldIntrinsicWithOverflowCommon(IntrinsicInst *II) {
  auto *WO = cast<WithOverflowInst>(II);

  // First attempt: the generic overflow-check optimization.
  Value *FoldedResult = nullptr;
  Constant *FoldedOverflow = nullptr;
  if (OptimizeOverflowCheck(WO->getBinaryOp(), WO->isSigned(), WO->getLHS(),
                            WO->getRHS(), *WO, FoldedResult, FoldedOverflow))
    return createOverflowTuple(WO, FoldedResult, FoldedOverflow);

  // Second attempt: use assumption information about the overflow bit.
  for (User *OverflowBit : WO->users()) {
    // Only extractvalue users reading field 1 (the overflow flag) matter.
    if (!match(OverflowBit, m_ExtractValue<1>(m_Value())))
      continue;

    for (auto &AssumeVH : AC.assumptionsFor(OverflowBit)) {
      if (!AssumeVH)
        continue;

      // The assumption must be exactly "not overflow" and usable at II.
      CallInst *Assume = cast<CallInst>(AssumeVH);
      if (!match(Assume->getArgOperand(0), m_Not(m_Specific(OverflowBit))) ||
          !isValidAssumeForContext(Assume, II, /*DT=*/nullptr,
                                   /*AllowEphemerals=*/true))
        continue;

      // Replace the checked operation by the plain binary operator and mark
      // it with the no-wrap flag matching the signedness of the intrinsic.
      Value *PlainOp =
          Builder.CreateBinOp(WO->getBinaryOp(), WO->getLHS(), WO->getRHS());
      PlainOp->takeName(WO);
      if (auto *PlainInst = dyn_cast<Instruction>(PlainOp)) {
        if (WO->isSigned())
          PlainInst->setHasNoSignedWrap();
        else
          PlainInst->setHasNoUnsignedWrap();
      }
      return createOverflowTuple(WO, PlainOp,
                                 ConstantInt::getFalse(OverflowBit->getType()));
    }
  }

  return nullptr;
}


static bool inputDenormalIsIEEE(const Function &F, const Type *Ty) {

  Ty = Ty->getScalarType();

  return F.getDenormalMode(Ty->getFltSemantics()).Input == DenormalMode::IEEE;

}


static bool inputDenormalIsDAZ(const Function &F, const Type *Ty) {

  Ty = Ty->getScalarType();

  return F.getDenormalMode(Ty->getFltSemantics()).inputsAreZero();

}


/// \returns the ordered compare predicate P such that
/// llvm.is.fpclass(x, \p Mask) is equivalent to "fcmp P x, 0.0" under the
/// input denormal mode of \p F for type \p Ty, or
/// FCmpInst::BAD_FCMP_PREDICATE if there is no such predicate.
static FCmpInst::Predicate fpclassTestIsFCmp0(FPClassTest Mask,
                                              const Function &F, Type *Ty) {
  // Each recognised mask maps to a predicate that is valid in exactly one
  // input denormal mode: IEEE by default, or denormals-are-zero when the mask
  // groups the subnormals with zero.
  FCmpInst::Predicate Pred = FCmpInst::BAD_FCMP_PREDICATE;
  bool RequiresDAZ = false;

  switch (static_cast<unsigned>(Mask)) {
  case fcZero:
    Pred = FCmpInst::FCMP_OEQ;
    break;
  case fcZero | fcSubnormal:
    Pred = FCmpInst::FCMP_OEQ;
    RequiresDAZ = true;
    break;
  case fcPositive | fcNegZero:
    Pred = FCmpInst::FCMP_OGE;
    break;
  case fcPositive | fcNegZero | fcNegSubnormal:
    Pred = FCmpInst::FCMP_OGE;
    RequiresDAZ = true;
    break;
  case fcPosSubnormal | fcPosNormal | fcPosInf:
    Pred = FCmpInst::FCMP_OGT;
    break;
  case fcNegative | fcPosZero:
    Pred = FCmpInst::FCMP_OLE;
    break;
  case fcNegative | fcPosZero | fcPosSubnormal:
    Pred = FCmpInst::FCMP_OLE;
    RequiresDAZ = true;
    break;
  case fcNegSubnormal | fcNegNormal | fcNegInf:
    Pred = FCmpInst::FCMP_OLT;
    break;
  case fcPosNormal | fcPosInf:
    Pred = FCmpInst::FCMP_OGT;
    RequiresDAZ = true;
    break;
  case fcNegNormal | fcNegInf:
    Pred = FCmpInst::FCMP_OLT;
    RequiresDAZ = true;
    break;
  case ~fcZero & ~fcNan:
    Pred = FCmpInst::FCMP_ONE;
    break;
  case ~(fcZero | fcSubnormal) & ~fcNan:
    Pred = FCmpInst::FCMP_ONE;
    RequiresDAZ = true;
    break;
  default:
    // Not a mask that corresponds to a compare against zero.
    return FCmpInst::BAD_FCMP_PREDICATE;
  }

  // The mapping only holds if the function's input denormal mode agrees.
  const bool ModeMatches =
      RequiresDAZ ? inputDenormalIsDAZ(F, Ty) : inputDenormalIsIEEE(F, Ty);
  return ModeMatches ? Pred : FCmpInst::BAD_FCMP_PREDICATE;
}


/// Simplify a call to llvm.is.fpclass. The folds, in order:
///  - look through fneg/fabs of the tested value by adjusting the mask;
///  - outside of strictfp functions, lower suitable masks to a single fcmp;
///  - drop mask bits the operand is known not to have, or fold to true when
///    the mask covers every class the operand may have.
/// \returns the instruction to continue with, or nullptr if nothing changed.
Instruction *InstCombinerImpl::foldIntrinsicIsFPClass(IntrinsicInst &II) {
  Value *Val = II.getArgOperand(0);
  Value *MaskArg = II.getArgOperand(1);
  const FPClassTest Mask =
      static_cast<FPClassTest>(cast<ConstantInt>(MaskArg)->getZExtValue());

  // "Unordered" means the mask accepts both NaN kinds, "ordered" that it
  // accepts neither. A mask with exactly one NaN kind is neither of the two.
  const FPClassTest NanPart = Mask & fcNan;
  const bool IsUnordered = NanPart == fcNan;
  const bool IsOrdered = NanPart == fcNone;
  const FPClassTest OrderedMask = Mask & ~fcNan;
  const FPClassTest OrderedInvertedMask = ~OrderedMask & ~fcNan;

  const bool IsStrict =
      II.getFunction()->getAttributes().hasFnAttr(Attribute::StrictFP);

  Value *Inner;

  // is.fpclass (fneg x), mask -> is.fpclass x, (fneg mask)
  if (match(Val, m_FNeg(m_Value(Inner)))) {
    II.setArgOperand(1, ConstantInt::get(MaskArg->getType(), fneg(Mask)));
    return replaceOperand(II, 0, Inner);
  }

  // is.fpclass (fabs x), mask -> is.fpclass x, (inverse_fabs mask)
  if (match(Val, m_FAbs(m_Value(Inner)))) {
    II.setArgOperand(1,
                     ConstantInt::get(MaskArg->getType(), inverse_fabs(Mask)));
    return replaceOperand(II, 0, Inner);
  }

  // All lowerings to fcmp are skipped in strictfp functions.
  if (!IsStrict) {
    Type *ValTy = Val->getType();
    const bool UniformNan = IsOrdered || IsUnordered;

    if (UniformNan && (OrderedMask == fcInf || OrderedInvertedMask == fcInf)) {
      // is.fpclass(x, fcInf)           -> fcmp oeq fabs(x), +inf
      // is.fpclass(x, fcInf|fcNan)     -> fcmp ueq fabs(x), +inf
      // is.fpclass(x, ~(fcInf|fcNan))  -> fcmp one fabs(x), +inf
      // is.fpclass(x, ~fcInf)          -> fcmp une fabs(x), +inf
      Constant *Inf = ConstantFP::getInfinity(ValTy);
      FCmpInst::Predicate Pred;
      if (OrderedInvertedMask == fcInf)
        Pred = IsUnordered ? FCmpInst::FCMP_UNE : FCmpInst::FCMP_ONE;
      else
        Pred = IsUnordered ? FCmpInst::FCMP_UEQ : FCmpInst::FCMP_OEQ;

      Value *Fabs = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, Val);
      Value *CmpInf = Builder.CreateFCmp(Pred, Fabs, Inf);
      CmpInf->takeName(&II);
      return replaceInstUsesWith(II, CmpInf);
    }

    if (UniformNan && (OrderedMask == fcPosInf || OrderedMask == fcNegInf)) {
      // is.fpclass(x, fcPosInf)       -> fcmp oeq x, +inf
      // is.fpclass(x, fcNegInf)       -> fcmp oeq x, -inf
      // is.fpclass(x, fcPosInf|fcNan) -> fcmp ueq x, +inf
      // is.fpclass(x, fcNegInf|fcNan) -> fcmp ueq x, -inf
      Constant *Inf = ConstantFP::getInfinity(ValTy, OrderedMask == fcNegInf);
      Value *EqInf = Builder.CreateFCmp(
          IsUnordered ? FCmpInst::FCMP_UEQ : FCmpInst::FCMP_OEQ, Val, Inf);
      EqInf->takeName(&II);
      return replaceInstUsesWith(II, EqInf);
    }

    if (UniformNan &&
        (OrderedInvertedMask == fcPosInf || OrderedInvertedMask == fcNegInf)) {
      // NaN excluded from the mask: everything but the given infinity
      //   -> fcmp one x, +inf / -inf
      // NaN included in the mask:
      //   -> fcmp une x, +inf / -inf
      Constant *Inf =
          ConstantFP::getInfinity(ValTy, OrderedInvertedMask == fcNegInf);
      Value *NeInf = Builder.CreateFCmp(
          IsUnordered ? FCmpInst::FCMP_UNE : FCmpInst::FCMP_ONE, Val, Inf);
      NeInf->takeName(&II);
      return replaceInstUsesWith(II, NeInf);
    }

    if (Mask == fcNan) {
      // Equivalent of isnan. Replace with standard fcmp if we don't care
      // about FP exceptions.
      Value *IsNan = Builder.CreateFCmpUNO(Val, ConstantFP::getZero(ValTy));
      IsNan->takeName(&II);
      return replaceInstUsesWith(II, IsNan);
    }

    if (Mask == (~fcNan & fcAllFlags)) {
      // Equivalent of !isnan. Replace with standard fcmp.
      Value *IsNotNan = Builder.CreateFCmpORD(Val, ConstantFP::getZero(ValTy));
      IsNotNan->takeName(&II);
      return replaceInstUsesWith(II, IsNotNan);
    }

    // Try to replace with an fcmp against 0.0, for example:
    //
    // is.fpclass(x, fcZero)          -> fcmp oeq x, 0.0
    // is.fpclass(x, fcZero | fcNan)  -> fcmp ueq x, 0.0
    // is.fpclass(x, ~fcZero & ~fcNan) -> fcmp one x, 0.0
    // is.fpclass(x, ~fcZero)         -> fcmp une x, 0.0
    //
    // is.fpclass(x, fcPosSubnormal | fcPosNormal | fcPosInf) -> fcmp ogt x, 0.0
    // is.fpclass(x, fcPositive | fcNegZero) -> fcmp oge x, 0.0
    //
    // is.fpclass(x, fcNegSubnormal | fcNegNormal | fcNegInf) -> fcmp olt x, 0.0
    // is.fpclass(x, fcNegative | fcPosZero) -> fcmp ole x, 0.0
    if (UniformNan) {
      FCmpInst::Predicate ZeroPred =
          fpclassTestIsFCmp0(OrderedMask, *II.getFunction(), ValTy);
      if (ZeroPred != FCmpInst::BAD_FCMP_PREDICATE) {
        Constant *Zero = ConstantFP::getZero(ValTy);
        // Switch to the unordered flavour when NaN is part of the mask.
        if (IsUnordered)
          ZeroPred = FCmpInst::getUnorderedPredicate(ZeroPred);
        Value *CmpZero = Builder.CreateFCmp(ZeroPred, Val, Zero);
        CmpZero->takeName(&II);
        return replaceInstUsesWith(II, CmpZero);
      }
    }
  }

  const KnownFPClass Known = computeKnownFPClass(Val, Mask, &II);

  // Clear test bits we know must be false from the source value.
  // fp_class (nnan x), qnan|snan|other -> fp_class (nnan x), other
  // fp_class (ninf x), ninf|pinf|other -> fp_class (ninf x), other
  const FPClassTest PossibleMask = Mask & Known.KnownFPClasses;
  if (PossibleMask != Mask) {
    II.setArgOperand(1, ConstantInt::get(MaskArg->getType(), PossibleMask));
    return &II;
  }

  // If none of the tests which can return false are possible, fold to true.
  // fp_class (nnan x), ~(qnan|snan) -> true
  // fp_class (ninf x), ~(ninf|pinf) -> true
  if (Mask == Known.KnownFPClasses)
    return replaceInstUsesWith(II, ConstantInt::get(II.getType(), true));

  return nullptr;
}


/// Try to determine the sign of \p Op.
/// \returns false if the known bits say \p Op is non-negative, true if they
/// say it is negative. For "sub nsw X, Y" the result of asking whether
/// X <s Y is implied by a dominating condition is returned. Otherwise
/// std::nullopt.
static std::optional<bool> getKnownSign(Value *Op, const SimplifyQuery &SQ) {
  const KnownBits Bits = computeKnownBits(Op, SQ);
  const bool NonNegative = Bits.isNonNegative();
  // The non-negative answer takes precedence, as it is queried first.
  if (NonNegative || Bits.isNegative())
    return !NonNegative;

  Value *LHS, *RHS;
  if (!match(Op, m_NSWSub(m_Value(LHS), m_Value(RHS))))
    return std::nullopt;

  return isImpliedByDomCondition(ICmpInst::ICMP_SLT, LHS, RHS, SQ.CxtI, SQ.DL);
}


/// Like getKnownSign, but when that yields no answer and \p Op is
/// "sub nsw X, Y", additionally asks whether X <=s Y is implied by a
/// dominating condition and returns that result.
static std::optional<bool> getKnownSignOrZero(Value *Op,
                                              const SimplifyQuery &SQ) {
  // A definite sign answer is used as is.
  std::optional<bool> Sign = getKnownSign(Op, SQ);
  if (Sign.has_value())
    return Sign;

  Value *LHS, *RHS;
  if (!match(Op, m_NSWSub(m_Value(LHS), m_Value(RHS))))
    return std::nullopt;

  return isImpliedByDomCondition(ICmpInst::ICMP_SLE, LHS, RHS, SQ.CxtI, SQ.DL);
}


/// Return true if the signs of both \p Op0 and \p Op1 can be determined with
/// getKnownSign and they agree. An undeterminable sign yields false.
static bool signBitMustBeTheSame(Value *Op0, Value *Op1,
                                 const SimplifyQuery &SQ) {
  // Op1 is queried first; Op0 is only analysed when Op1's sign is known.
  if (std::optional<bool> Sign1 = getKnownSign(Op1, SQ))
    if (std::optional<bool> Sign0 = getKnownSign(Op0, SQ))
      return *Sign0 == *Sign1;
  return false;
}


/// Try to canonicalize min/max(X + C0, C1) as min/max(X, C1 - C0) + C0. This
/// can trigger other combines. The add must have a single use and carry the
/// no-wrap flag matching the signedness of the min/max.
static Instruction *moveAddAfterMinMax(IntrinsicInst *II,
                                       InstCombiner::BuilderTy &Builder) {
  const Intrinsic::ID MinMaxID = II->getIntrinsicID();
  const bool IsSigned =
      MinMaxID == Intrinsic::smax || MinMaxID == Intrinsic::smin;
  assert((IsSigned || MinMaxID == Intrinsic::umax ||
          MinMaxID == Intrinsic::umin) &&
         "Expected a min or max intrinsic");

  // TODO: Match vectors with undef elements, but undef may not propagate.
  Value *AddOp = II->getArgOperand(0);
  Value *X;
  const APInt *AddC, *BoundC;
  if (!match(AddOp, m_OneUse(m_Add(m_Value(X), m_APInt(AddC)))) ||
      !match(II->getArgOperand(1), m_APInt(BoundC)))
    return nullptr;

  // The add needs nsw for signed min/max and nuw for unsigned min/max.
  auto *Add = cast<BinaryOperator>(AddOp);
  const bool HasRequiredNoWrap =
      IsSigned ? Add->hasNoSignedWrap() : Add->hasNoUnsignedWrap();
  if (!HasRequiredNoWrap)
    return nullptr;

  // If the constant difference overflows, then instsimplify should reduce the
  // min/max to the add or C1.
  bool Overflow;
  APInt CDiff = IsSigned ? BoundC->ssub_ov(*AddC, Overflow)
                         : BoundC->usub_ov(*AddC, Overflow);
  assert(!Overflow && "Expected simplify of min/max");

  // min/max (add X, C0), C1 --> add (min/max X, C1 - C0), C0
  // Note: the "mismatched" no-overflow setting does not propagate.
  Constant *NewBound = ConstantInt::get(II->getType(), CDiff);
  Value *NewMinMax = Builder.CreateBinaryIntrinsic(MinMaxID, X, NewBound);
  Value *AddRHS = Add->getOperand(1);
  if (IsSigned)
    return BinaryOperator::CreateNSWAdd(NewMinMax, AddRHS);
  return BinaryOperator::CreateNUWAdd(NewMinMax, AddRHS);
}


/// Match a sadd_sat or ssub_sat which is using min/max to clamp the value.
/// On success the add/sub is redone as a saturating intrinsic in a narrower
/// type and the result is sign-extended back to the original type.
Instruction *InstCombinerImpl::matchSAddSubSat(IntrinsicInst &MinMax1) {
  Type *Ty = MinMax1.getType();

  // We are looking for a tree of:
  //   max(INT_MIN, min(INT_MAX, add(sext(A), sext(B))))
  // where the min and the max may appear in either order.
  Instruction *InnerMinMax;
  BinaryOperator *AddSub;
  const APInt *LowBound, *HighBound;
  if (match(&MinMax1,
            m_SMin(m_Instruction(InnerMinMax), m_APInt(HighBound)))) {
    if (!match(InnerMinMax, m_SMax(m_BinOp(AddSub), m_APInt(LowBound))))
      return nullptr;
  } else if (!match(&MinMax1,
                    m_SMax(m_Instruction(InnerMinMax), m_APInt(LowBound))) ||
             !match(InnerMinMax,
                    m_SMin(m_BinOp(AddSub), m_APInt(HighBound)))) {
    return nullptr;
  }

  // Check that the constants clamp a saturate, and that the new type would be
  // sensible to convert to.
  const APInt HighPlusOne = *HighBound + 1;
  if (!HighPlusOne.isPowerOf2() || -*LowBound != HighPlusOne)
    return nullptr;

  // In what bitwidth can this be treated as saturating arithmetics?
  const unsigned NewBitWidth = HighPlusOne.logBase2() + 1;

  // FIXME: This isn't quite right for vectors, but using the scalar type is a
  // good first approximation for what should be done there.
  if (!shouldChangeType(Ty->getScalarType()->getIntegerBitWidth(), NewBitWidth))
    return nullptr;

  // Also make sure that the inner min/max and the add/sub have one use.
  if (!InnerMinMax->hasOneUse() || !AddSub->hasOneUse())
    return nullptr;

  // Create the new type (which can be a vector type)
  Type *NewTy = Ty->getWithNewBitWidth(NewBitWidth);

  // Only add and sub have a saturating counterpart.
  Intrinsic::ID SatID;
  switch (AddSub->getOpcode()) {
  case Instruction::Add:
    SatID = Intrinsic::sadd_sat;
    break;
  case Instruction::Sub:
    SatID = Intrinsic::ssub_sat;
    break;
  default:
    return nullptr;
  }

  // The two operands of the add/sub must be nsw-truncatable to the NewTy. This
  // is usually achieved via a sext from a smaller type.
  Value *LHS = AddSub->getOperand(0);
  Value *RHS = AddSub->getOperand(1);
  if (ComputeMaxSignificantBits(LHS, AddSub) > NewBitWidth ||
      ComputeMaxSignificantBits(RHS, AddSub) > NewBitWidth)
    return nullptr;

  // Finally create and return the sat intrinsic, truncated to the new type
  Value *NarrowLHS = Builder.CreateTrunc(LHS, NewTy);
  Value *NarrowRHS = Builder.CreateTrunc(RHS, NewTy);
  Value *Sat = Builder.CreateIntrinsic(SatID, NewTy, {NarrowLHS, NarrowRHS});
  return CastInst::Create(Instruction::SExt, Sat, Ty);
}


/// If we have a clamp pattern like max (min X, 42), 41 -- where the output
/// can only be one of two possible constant values -- turn that into a select
/// of constants. The inner min/max must have a single use.
static Instruction *foldClampRangeOfTwo(IntrinsicInst *II,
                                        InstCombiner::BuilderTy &Builder) {
  Value *Inner = II->getArgOperand(0);
  Value *Outer = II->getArgOperand(1);
  const APInt *InnerC, *OuterC;
  if (!match(Outer, m_APInt(OuterC)) || !Inner->hasOneUse())
    return nullptr;

  // For each outer intrinsic, look for the opposite inner intrinsic whose
  // constant is adjacent to the outer constant, and pick the compare that
  // decides between the two possible results.
  Value *X;
  bool IsClampOfTwo = false;
  CmpInst::Predicate Pred = CmpInst::BAD_ICMP_PREDICATE;
  switch (II->getIntrinsicID()) {
  case Intrinsic::smax:
    Pred = ICmpInst::ICMP_SGT;
    IsClampOfTwo = match(Inner, m_SMin(m_Value(X), m_APInt(InnerC))) &&
                   *InnerC == *OuterC + 1;
    break;
  case Intrinsic::smin:
    Pred = ICmpInst::ICMP_SLT;
    IsClampOfTwo = match(Inner, m_SMax(m_Value(X), m_APInt(InnerC))) &&
                   *OuterC == *InnerC + 1;
    break;
  case Intrinsic::umax:
    Pred = ICmpInst::ICMP_UGT;
    IsClampOfTwo = match(Inner, m_UMin(m_Value(X), m_APInt(InnerC))) &&
                   *InnerC == *OuterC + 1;
    break;
  case Intrinsic::umin:
    Pred = ICmpInst::ICMP_ULT;
    IsClampOfTwo = match(Inner, m_UMax(m_Value(X), m_APInt(InnerC))) &&
                   *OuterC == *InnerC + 1;
    break;
  default:
    llvm_unreachable("Expected min/max intrinsic");
  }
  if (!IsClampOfTwo)
    return nullptr;

  // max (min X, 42), 41 --> X > 41 ? 42 : 41
  // min (max X, 42), 43 --> X < 43 ? 42 : 43
  Value *Cmp = Builder.CreateICmp(Pred, X, Outer);
  Constant *InnerVal = ConstantInt::get(II->getType(), *InnerC);
  return SelectInst::Create(Cmp, InnerVal, Outer);
}


/// If this min/max has a constant operand and an operand that is a matching
/// min/max with a constant operand, constant-fold the 2 constant operands.
/// A umax-of-smax or smin-of-umin pair is also accepted when both constants
/// are known non-negative.
static Value *reassociateMinMaxWithConstants(IntrinsicInst *II,
                                             IRBuilderBase &Builder,
                                             const SimplifyQuery &SQ) {
  auto *InnerMM = dyn_cast<MinMaxIntrinsic>(II->getArgOperand(0));
  if (!InnerMM)
    return nullptr;

  Constant *InnerC, *OuterC;
  if (!match(InnerMM->getArgOperand(1), m_ImmConstant(InnerC)) ||
      !match(II->getArgOperand(1), m_ImmConstant(OuterC)))
    return nullptr;

  // max (max X, C0), C1 --> max X, (max C0, C1)
  // min (min X, C0), C1 --> min X, (min C0, C1)
  // umax (smax X, nneg C0), nneg C1 --> smax X, (umax C0, C1)
  // smin (umin X, nneg C0), nneg C1 --> umin X, (smin C0, C1)
  const Intrinsic::ID OuterID = II->getIntrinsicID();
  const Intrinsic::ID InnerID = InnerMM->getIntrinsicID();
  if (InnerID != OuterID) {
    const bool IsAllowedMix =
        (OuterID == Intrinsic::umax && InnerID == Intrinsic::smax) ||
        (OuterID == Intrinsic::smin && InnerID == Intrinsic::umin);
    if (!IsAllowedMix || !isKnownNonNegative(InnerC, SQ) ||
        !isKnownNonNegative(OuterC, SQ))
      return nullptr;
  }

  // Combine the two constants with the outer min/max, expressed as
  // compare + select, and apply the inner intrinsic to X and the result.
  ICmpInst::Predicate Pred = MinMaxIntrinsic::getPredicate(OuterID);
  Value *PickInner = Builder.CreateICmp(Pred, InnerC, OuterC);
  Value *MergedC = Builder.CreateSelect(PickInner, InnerC, OuterC);
  return Builder.CreateIntrinsic(InnerID, II->getType(),
                                 {InnerMM->getArgOperand(0), MergedC});
}


/// If this min/max has a matching min/max operand with a constant, try to push
/// the constant operand into this instruction. This can enable more folds.
/// The inner min/max must have a single use and the same intrinsic ID.
static Instruction *
reassociateMinMaxWithConstantInOperand(IntrinsicInst *II,
                                       InstCombiner::BuilderTy &Builder) {
  // Match and capture a min/max operand candidate (in either operand slot).
  Value *X, *Y;
  Constant *C;
  Instruction *Inner;
  auto InnerPattern =
      m_OneUse(m_CombineAnd(m_Instruction(Inner),
                            m_MaxOrMin(m_Value(X), m_ImmConstant(C))));
  if (!match(II, m_c_MaxOrMin(InnerPattern, m_Value(Y))))
    return nullptr;

  // The inner op must match.
  const Intrinsic::ID MinMaxID = II->getIntrinsicID();
  auto *InnerMM = dyn_cast<IntrinsicInst>(Inner);
  if (!InnerMM || InnerMM->getIntrinsicID() != MinMaxID)
    return nullptr;

  // Check for constants to avoid infinite loops.
  if (match(X, m_ImmConstant()) || match(Y, m_ImmConstant()))
    return nullptr;

  // max (max X, C), Y --> max (max X, Y), C
  Function *MinMaxDecl = Intrinsic::getOrInsertDeclaration(
      II->getModule(), MinMaxID, II->getType());
  Value *NewInner = Builder.CreateBinaryIntrinsic(MinMaxID, X, Y);
  NewInner->takeName(Inner);
  return CallInst::Create(MinMaxDecl, {NewInner, C});
}


/// Reduce a sequence of min/max intrinsics with a common operand: when both
/// operands of \p II are the same kind of min/max as \p II and share an
/// operand, one of them is reused and combined with the remaining operand of
/// the other. At least one of the two operands must have a single use.
static Instruction *factorizeMinMaxTree(IntrinsicInst *II) {
  // Match 3 of the same min/max ops. Example: umin(umin(), umin()).
  const Intrinsic::ID MinMaxID = II->getIntrinsicID();
  auto *LHS = dyn_cast<IntrinsicInst>(II->getArgOperand(0));
  auto *RHS = dyn_cast<IntrinsicInst>(II->getArgOperand(1));
  if (!LHS || !RHS)
    return nullptr;
  if (LHS->getIntrinsicID() != MinMaxID || RHS->getIntrinsicID() != MinMaxID)
    return nullptr;
  if (!LHS->hasOneUse() && !RHS->hasOneUse())
    return nullptr;

  Value *A = LHS->getArgOperand(0);
  Value *B = LHS->getArgOperand(1);
  Value *C = RHS->getArgOperand(0);
  Value *D = RHS->getArgOperand(1);

  // Look for a common operand.
  Value *ReusedMinMax = nullptr;
  Value *RemainingOp = nullptr;
  if (LHS->hasOneUse()) {
    // If the LHS is only used in this chain and the RHS is used outside of it,
    // reuse the RHS min/max because that will eliminate the LHS.
    auto IsRHSOperand = [&](Value *V) { return V == D || V == C; };
    if (IsRHSOperand(A)) {
      // min(min(a, b), min(c, a)) --> min(min(c, a), b)
      // min(min(a, b), min(a, d)) --> min(min(a, d), b)
      ReusedMinMax = RHS;
      RemainingOp = B;
    } else if (IsRHSOperand(B)) {
      // min(min(a, b), min(c, b)) --> min(min(c, b), a)
      // min(min(a, b), min(b, d)) --> min(min(b, d), a)
      ReusedMinMax = RHS;
      RemainingOp = A;
    }
  } else {
    assert(RHS->hasOneUse() && "Expected one-use operand");
    // Reuse the LHS. This will eliminate the RHS.
    auto IsLHSOperand = [&](Value *V) { return V == A || V == B; };
    if (IsLHSOperand(D)) {
      // min(min(a, b), min(c, a)) --> min(min(a, b), c)
      // min(min(a, b), min(c, b)) --> min(min(a, b), c)
      ReusedMinMax = LHS;
      RemainingOp = C;
    } else if (IsLHSOperand(C)) {
      // min(min(a, b), min(a, d)) --> min(min(a, b), d)
      // min(min(a, b), min(b, d)) --> min(min(a, b), d)
      ReusedMinMax = LHS;
      RemainingOp = D;
    }
  }

  if (!ReusedMinMax || !RemainingOp)
    return nullptr;

  Function *MinMaxDecl = Intrinsic::getOrInsertDeclaration(
      II->getModule(), MinMaxID, II->getType());
  return CallInst::Create(MinMaxDecl, {ReusedMinMax, RemainingOp});
}


/// If all arguments of the intrinsic are unary shuffles with the same mask,
/// try to shuffle after the intrinsic.
///
/// Arguments in a scalar-operand position of the intrinsic are passed through
/// unchanged. Immediate constant arguments are accepted when
/// unshuffleConstant() can produce a constant to use before the shuffle.
///
/// \returns a new (not yet inserted) shuffle of the rebuilt intrinsic call,
/// or nullptr if the fold does not apply.
Instruction *
InstCombinerImpl::foldShuffledIntrinsicOperands(IntrinsicInst *II) {
  if (!isTriviallyVectorizable(II->getIntrinsicID()) ||
      !II->getCalledFunction()->isSpeculatable())
    return nullptr;

  Value *X;
  Constant *C;
  ArrayRef<int> Mask;

  // Find the first argument that is neither a constant nor a scalar operand of
  // the intrinsic; it provides the reference mask and source type.
  auto *NonConstArg = find_if_not(II->args(), [&II](Use &Arg) {
    return isa<Constant>(Arg.get()) ||
           isVectorIntrinsicWithScalarOpAtArg(II->getIntrinsicID(),
                                              Arg.getOperandNo(), nullptr);
  });
  // find_if_not returns the end iterator (never a null pointer) when no
  // argument qualifies. Compare against arg_end() so that we never run the
  // matcher on an operand that is not a call argument.
  if (NonConstArg == II->arg_end() ||
      !match(NonConstArg, m_Shuffle(m_Value(X), m_Poison(), m_Mask(Mask))))
    return nullptr;

  // At least 1 operand must be a shuffle with 1 use because we are creating 2
  // instructions.
  if (none_of(II->args(), match_fn(m_OneUse(m_Shuffle(m_Value(), m_Value())))))
    return nullptr;

  // See if all arguments are shuffled with the same mask.
  SmallVector<Value *, 4> NewArgs;
  Type *SrcTy = X->getType();
  for (Use &Arg : II->args()) {
    if (isVectorIntrinsicWithScalarOpAtArg(II->getIntrinsicID(),
                                           Arg.getOperandNo(), nullptr))
      // Scalar operands are not affected by the shuffle.
      NewArgs.push_back(Arg);
    else if (match(&Arg,
                   m_Shuffle(m_Value(X), m_Poison(), m_SpecificMask(Mask))) &&
             X->getType() == SrcTy)
      // Same mask and same source type: use the unshuffled source.
      NewArgs.push_back(X);
    else if (match(&Arg, m_ImmConstant(C))) {
      // If it's a constant, try find the constant that would be shuffled to C.
      if (Constant *ShuffledC =
              unshuffleConstant(Mask, C, cast<VectorType>(SrcTy)))
        NewArgs.push_back(ShuffledC);
      else
        return nullptr;
    } else
      return nullptr;
  }

  // intrinsic (shuf X, M), (shuf Y, M), ... --> shuf (intrinsic X, Y, ...), M
  // Pass the original call as FP source only if it is an FP math operation.
  Instruction *FPI = isa<FPMathOperator>(II) ? II : nullptr;
  // Result type might be a different vector width.
  // TODO: Check that the result type isn't widened?
  VectorType *ResTy =
      VectorType::get(II->getType()->getScalarType(), cast<VectorType>(SrcTy));
  Value *NewIntrinsic =
      Builder.CreateIntrinsic(ResTy, II->getIntrinsicID(), NewArgs, FPI);
  return new ShuffleVectorInst(NewIntrinsic, Mask);
}


/// If all arguments of the intrinsic are reverses, try to pull the reverse
/// after the intrinsic. Scalar operands of the intrinsic and splat values are
/// passed through unchanged; other immediate constants are reversed.
Value *InstCombinerImpl::foldReversedIntrinsicOperands(IntrinsicInst *II) {
  const Intrinsic::ID IID = II->getIntrinsicID();
  if (!isTriviallyVectorizable(IID))
    return nullptr;

  // At least 1 operand must be a reverse with 1 use because we are creating 2
  // instructions.
  auto IsOneUseReverse = [](Value *V) {
    return match(V, m_OneUse(m_VecReverse(m_Value())));
  };
  if (none_of(II->args(), IsOneUseReverse))
    return nullptr;

  SmallVector<Value *> NewArgs;
  for (Use &Arg : II->args()) {
    // Scalar operands of the intrinsic are kept as they are.
    if (isVectorIntrinsicWithScalarOpAtArg(IID, Arg.getOperandNo(), nullptr)) {
      NewArgs.push_back(Arg);
      continue;
    }

    // A reversed argument contributes its unreversed source.
    Value *Unreversed;
    if (match(&Arg, m_VecReverse(m_Value(Unreversed)))) {
      NewArgs.push_back(Unreversed);
      continue;
    }

    // Splat values are passed through without a reverse.
    if (isSplatValue(Arg)) {
      NewArgs.push_back(Arg);
      continue;
    }

    // Any other argument must be an immediate constant, which is reversed.
    Constant *ImmC;
    if (!match(&Arg, m_ImmConstant(ImmC)))
      return nullptr;
    NewArgs.push_back(Builder.CreateVectorReverse(ImmC));
  }

  // intrinsic (reverse X), (reverse Y), ... --> reverse (intrinsic X, Y, ...)
  Instruction *FPI = isa<FPMathOperator>(II) ? II : nullptr;
  Instruction *NewIntrinsic =
      Builder.CreateIntrinsic(II->getType(), IID, NewArgs, FPI);
  return Builder.CreateVectorReverse(NewIntrinsic);
}


/// Fold the following cases and accepts bswap and bitreverse intrinsics:
///   bswap(logic_op(bswap(x), y)) --> logic_op(x, bswap(y))
///   bswap(logic_op(bswap(x), bswap(y))) --> logic_op(x, y) (ignores multiuse)
/// \p V is the operand of the outer bswap/bitreverse; it must be a single-use
/// bitwise logic BinaryOperator for the fold to apply.
template <Intrinsic::ID IntrID>
static Instruction *foldBitOrderCrossLogicOp(Value *V,
                                             InstCombiner::BuilderTy &Builder) {
  static_assert(IntrID == Intrinsic::bswap || IntrID == Intrinsic::bitreverse,
                "This helper only supports BSWAP and BITREVERSE intrinsics");

  // Find bitwise logic op. Check that it is a BinaryOperator explicitly so we
  // don't match ConstantExpr that aren't meaningful for this transform.
  Value *LogicLHS, *LogicRHS;
  if (!match(V, m_OneUse(m_BitwiseLogic(m_Value(LogicLHS),
                                        m_Value(LogicRHS)))) ||
      !isa<BinaryOperator>(V))
    return nullptr;

  const BinaryOperator::BinaryOps Opcode =
      cast<BinaryOperator>(V)->getOpcode();
  Value *InnerLHS, *InnerRHS;

  // If both operands are bswap/bitreverse, the transform reduces the number
  // of instructions even if there's multiuse.
  if (match(LogicLHS, m_Intrinsic<IntrID>(m_Value(InnerLHS))) &&
      match(LogicRHS, m_Intrinsic<IntrID>(m_Value(InnerRHS))))
    return BinaryOperator::Create(Opcode, InnerLHS, InnerRHS);

  // If only one operand is bswap/bitreverse, that operand must have a single
  // use; the other operand gets a new bswap/bitreverse.
  if (match(LogicLHS, m_OneUse(m_Intrinsic<IntrID>(m_Value(InnerLHS))))) {
    Value *ReorderedRHS = Builder.CreateUnaryIntrinsic(IntrID, LogicRHS);
    return BinaryOperator::Create(Opcode, InnerLHS, ReorderedRHS);
  }

  if (match(LogicRHS, m_OneUse(m_Intrinsic<IntrID>(m_Value(InnerRHS))))) {
    Value *ReorderedLHS = Builder.CreateUnaryIntrinsic(IntrID, LogicLHS);
    return BinaryOperator::Create(Opcode, ReorderedLHS, InnerRHS);
  }

  return nullptr;
}


/// Helper to match idempotent binary intrinsics, namely, intrinsics where
/// `f(f(x, y), y) == f(x, y)` holds. These are the integer and floating-point
/// min/max intrinsics listed below.
static bool isIdempotentBinaryIntrinsic(Intrinsic::ID IID) {
  static constexpr Intrinsic::ID IdempotentIDs[] = {
      Intrinsic::smax,       Intrinsic::smin,       Intrinsic::umax,
      Intrinsic::umin,       Intrinsic::maximum,    Intrinsic::minimum,
      Intrinsic::maximumnum, Intrinsic::minimumnum, Intrinsic::maxnum,
      Intrinsic::minnum,
  };
  return is_contained(IdempotentIDs, IID);
}


/// Attempt to simplify value-accumulating recurrences of kind:
///   %umax.acc = phi i8 [ %umax, %backedge ], [ %a, %entry ]
///   %umax = call i8 @llvm.umax.i8(i8 %umax.acc, i8 %b)
/// And let the idempotent binary intrinsic be hoisted, when the operands are
/// known to be loop-invariant.
/// \returns the replacement call on the initial value and the other operand,
/// or nullptr if the pattern does not match.
static Value *foldIdempotentBinaryIntrinsicRecurrence(InstCombinerImpl &IC,
                                                      IntrinsicInst *II) {
  const Intrinsic::ID IID = II->getIntrinsicID();
  if (!isIdempotentBinaryIntrinsic(IID))
    return nullptr;

  PHINode *PN;
  Value *Init, *OtherOp;
  if (!matchSimpleBinaryIntrinsicRecurrence(II, PN, Init, OtherOp))
    return nullptr;

  // The non-recurrent operand must dominate the phi.
  if (!IC.getDominatorTree().dominates(OtherOp, PN))
    return nullptr;

  // A binary intrinsic recurrence with loop-invariant operands is equivalent
  // to `call @llvm.binary.intrinsic(Init, OtherOp)`.
  auto *Hoisted = IC.Builder.CreateBinaryIntrinsic(IID, Init, OtherOp);
  // Carry over the fast-math flags for floating-point intrinsics.
  if (isa<FPMathOperator>(Hoisted))
    cast<Instruction>(Hoisted)->copyFastMathFlags(II);
  return Hoisted;
}


/// Try to look through a lane permutation feeding a reduction.
///
/// \param Arg the vector operand of the reduction.
/// \param CanReorderLanes whether the reduction tolerates reordered lanes;
///        nothing is done when this is false.
/// \returns the source vector if \p Arg is a vector reverse, or a
/// single-source fixed-width shuffle whose mask uses every source lane exactly
/// once; nullptr otherwise.
static Value *simplifyReductionOperand(Value *Arg, bool CanReorderLanes) {
  if (!CanReorderLanes)
    return nullptr;

  Value *V;
  if (match(Arg, m_VecReverse(m_Value(V))))
    return V;

  ArrayRef<int> Mask;
  if (!isa<FixedVectorType>(Arg->getType()) ||
      !match(Arg, m_Shuffle(m_Value(V), m_Undef(), m_Mask(Mask))) ||
      !cast<ShuffleVectorInst>(Arg)->isSingleSource())
    return nullptr;

  int Sz = Mask.size();
  SmallBitVector UsedIndices(Sz);
  for (int Idx : Mask) {
    // UsedIndices only has Sz bits. An index of Sz or more would select a
    // lane of the second (undef) shuffle operand and must not be used to
    // index the bit vector, so bail out on it like on poison and repeats.
    if (Idx == PoisonMaskElem || Idx >= Sz || UsedIndices.test(Idx))
      return nullptr;
    UsedIndices.set(Idx);
  }

  // Can remove shuffle iff just shuffled elements, no repeats, undefs, or
  // other changes.
  return UsedIndices.all() ? V : nullptr;
}


/// Fold an unsigned minimum of trailing or leading zero bits counts:
///   umin(cttz(CtOp, ZeroUndef), ConstOp) --> cttz(CtOp | (1 << ConstOp))
///   umin(ctlz(CtOp, ZeroUndef), ConstOp) --> ctlz(CtOp | (SignedMin
///                                              >> ConstOp))
/// \p I0 must be a single-use cttz/ctlz call and \p I1 a constant whose
/// elements are all smaller than the bit width. The new count is emitted with
/// its second argument set to true.
template <Intrinsic::ID IntrID>
static Value *
foldMinimumOverTrailingOrLeadingZeroCount(Value *I0, Value *I1,
                                          const DataLayout &DL,
                                          InstCombiner::BuilderTy &Builder) {
  static_assert(IntrID == Intrinsic::cttz || IntrID == Intrinsic::ctlz,
                "This helper only supports cttz and ctlz intrinsics");
  constexpr bool IsCttz = IntrID == Intrinsic::cttz;

  Value *CtOp;
  Value *ZeroUndef;
  if (!match(I0,
             m_OneUse(m_Intrinsic<IntrID>(m_Value(CtOp), m_Value(ZeroUndef)))))
    return nullptr;

  Type *Ty = I1->getType();
  const unsigned BitWidth = Ty->getScalarSizeInBits();
  auto LessBitWidth = [BitWidth](auto &C) { return C.ult(BitWidth); };
  // We have a constant >= BitWidth (which can be handled by CVP)
  // or a non-splat vector with elements < and >= BitWidth
  if (!match(I1, m_CheckedInt(LessBitWidth)))
    return nullptr;

  // cttz: shift the lowest bit left; ctlz: shift the sign bit right
  // (logically). The shifted bit caps the count at the constant.
  Constant *ShiftBase =
      IsCttz ? ConstantInt::get(Ty, 1)
             : ConstantInt::get(Ty, APInt::getSignedMinValue(BitWidth));
  Constant *NewConst = ConstantFoldBinaryOpOperands(
      IsCttz ? Instruction::Shl : Instruction::LShr, ShiftBase,
      cast<Constant>(I1), DL);

  Value *Capped = Builder.CreateOr(CtOp, NewConst);
  return Builder.CreateBinaryIntrinsic(
      IntrID, Capped, ConstantInt::getTrue(ZeroUndef->getType()));
}


/// Return whether "X LOp (Y ROp Z)" is always equal to
/// "(X LOp Y) ROp (X LOp Z)".
///
/// \p LOp is the binary operator, \p ROp the min/max intrinsic, and
/// \p HasNUW / \p HasNSW say which no-wrap flags are available for \p LOp.
static bool leftDistributesOverRight(Instruction::BinaryOps LOp, bool HasNUW,
                                     bool HasNSW, Intrinsic::ID ROp) {
  const bool IsAdd = LOp == Instruction::Add;
  const bool IsShl = LOp == Instruction::Shl;

  // Unsigned min/max: needs nuw, and works for both add and shl.
  if (ROp == Intrinsic::umax || ROp == Intrinsic::umin)
    return HasNUW && (IsAdd || IsShl);

  // Signed min/max: needs nsw, and only add is accepted.
  if (ROp == Intrinsic::smax || ROp == Intrinsic::smin)
    return HasNSW && IsAdd;

  // Any other intrinsic is not handled.
  return false;
}


/// Attempts to factorise a common term in an instruction that has the form
/// "(A op' B) op (C op' D)", where op is an intrinsic and op' is a binop.
///
/// Both operands of \p II must be single-use overflowing binary operators
/// with the same opcode, and leftDistributesOverRight() must accept that
/// opcode (with the wrap flags common to both operands) together with the
/// intrinsic ID of \p II.
///
/// \returns The factorised value, "A op' (B op D)" or "(A op C) op' B", or
///          nullptr if the pattern does not apply.
static Value *
foldIntrinsicUsingDistributiveLaws(IntrinsicInst *II,
                                   InstCombiner::BuilderTy &Builder) {
  Value *LHS = II->getOperand(0), *RHS = II->getOperand(1);
  Intrinsic::ID TopLevelOpcode = II->getIntrinsicID();

  OverflowingBinaryOperator *Op0 = dyn_cast<OverflowingBinaryOperator>(LHS);
  OverflowingBinaryOperator *Op1 = dyn_cast<OverflowingBinaryOperator>(RHS);

  if (!Op0 || !Op1)
    return nullptr;

  if (Op0->getOpcode() != Op1->getOpcode())
    return nullptr;

  // Both inner operations are replaced by a single one, so they must not have
  // other users.
  if (!Op0->hasOneUse() || !Op1->hasOneUse())
    return nullptr;

  Instruction::BinaryOps InnerOpcode =
      static_cast<Instruction::BinaryOps>(Op0->getOpcode());
  // Only flags present on both inner operations may be relied upon.
  bool HasNUW = Op0->hasNoUnsignedWrap() && Op1->hasNoUnsignedWrap();
  bool HasNSW = Op0->hasNoSignedWrap() && Op1->hasNoSignedWrap();

  if (!leftDistributesOverRight(InnerOpcode, HasNUW, HasNSW, TopLevelOpcode))
    return nullptr;

  Value *A = Op0->getOperand(0);
  Value *B = Op0->getOperand(1);
  Value *C = Op1->getOperand(0);
  Value *D = Op1->getOperand(1);

  // Attempts to swap variables such that A equals C or B equals D,
  // if the inner operation is commutative.
  if (Op0->isCommutative() && A != C && B != D) {
    if (A == D || B == C)
      std::swap(C, D);
    else
      return nullptr;
  }

  Value *NewOp;
  if (A == C) {
    // (A op' B) op (A op' D) --> A op' (B op D)
    Value *NewIntrinsic = Builder.CreateBinaryIntrinsic(TopLevelOpcode, B, D);
    NewOp = Builder.CreateBinOp(InnerOpcode, A, NewIntrinsic);
  } else if (B == D) {
    // (A op' B) op (C op' B) --> (A op C) op' B
    Value *NewIntrinsic = Builder.CreateBinaryIntrinsic(TopLevelOpcode, A, C);
    NewOp = Builder.CreateBinOp(InnerOpcode, NewIntrinsic, B);
  } else {
    return nullptr;
  }

  // The builder may fold the operation to a constant when both operands are
  // constants, so only set the wrap flags if a real binary operator was
  // created.
  if (auto *NewBinop = dyn_cast<BinaryOperator>(NewOp)) {
    NewBinop->setHasNoUnsignedWrap(HasNUW);
    NewBinop->setHasNoSignedWrap(HasNSW);
  }

  return NewOp;
}


/// CallInst simplification. This mostly only handles folding of intrinsic

/// instructions. For normal calls, it allows visitCallBase to do the heavy

/// lifting.


Instruction *InstCombinerImpl::visitCallInst(CallInst &CI) {

  // Don't try to simplify calls without uses. It will not do anything useful,

  // but will result in the following folds being skipped.

  if (!CI.use_empty()) {

    SmallVector<Value *, 8> Args(CI.args());

    if (Value *V = simplifyCall(&CI, CI.getCalledOperand(), Args,

                                SQ.getWithInstruction(&CI)))

      return replaceInstUsesWith(CI, V);

  }


  if (Value *FreedOp = getFreedOperand(&CI, &TLI))

    return visitFree(CI, FreedOp);


  // If the caller function (i.e. us, the function that contains this CallInst)

  // is nounwind, mark the call as nounwind, even if the callee isn't.

  if (CI.getFunction()->doesNotThrow() && !CI.doesNotThrow()) {

    CI.setDoesNotThrow();

    return &CI;

  }


  IntrinsicInst *II = dyn_cast<IntrinsicInst>(&CI);

  if (!II)

    return visitCallBase(CI);


  // Intrinsics cannot occur in an invoke or a callbr, so handle them here

  // instead of in visitCallBase.

  if (auto *MI = dyn_cast<AnyMemIntrinsic>(II)) {

    if (auto NumBytes = MI->getLengthInBytes()) {

      // memmove/cpy/set of zero bytes is a noop.

      if (NumBytes->isZero())

        return eraseInstFromFunction(CI);


      // For atomic unordered mem intrinsics if len is not a positive or

      // not a multiple of element size then behavior is undefined.

      if (MI->isAtomic() &&

          (NumBytes->isNegative() ||

           (NumBytes->getZExtValue() % MI->getElementSizeInBytes() != 0))) {

        CreateNonTerminatorUnreachable(MI);

        assert(MI->getType()->isVoidTy() &&

               "non void atomic unordered mem intrinsic");

        return eraseInstFromFunction(*MI);

      }

    }


    // No other transformations apply to volatile transfers.

    if (MI->isVolatile())

      return nullptr;


    if (AnyMemTransferInst *MTI = dyn_cast<AnyMemTransferInst>(MI)) {

      // memmove(x,x,size) -> noop.

      if (MTI->getSource() == MTI->getDest())

        return eraseInstFromFunction(CI);

    }


    auto IsPointerUndefined = [MI](Value *Ptr) {

      return isa<ConstantPointerNull>(Ptr) &&

             !NullPointerIsDefined(

                 MI->getFunction(),

                 cast<PointerType>(Ptr->getType())->getAddressSpace());

    };

    bool SrcIsUndefined = false;

    // If we can determine a pointer alignment that is bigger than currently

    // set, update the alignment.

    if (auto *MTI = dyn_cast<AnyMemTransferInst>(MI)) {

      if (Instruction *I = SimplifyAnyMemTransfer(MTI))

        return I;

      SrcIsUndefined = IsPointerUndefined(MTI->getRawSource());

    } else if (auto *MSI = dyn_cast<AnyMemSetInst>(MI)) {

      if (Instruction *I = SimplifyAnyMemSet(MSI))

        return I;

    }


    // If src/dest is null, this memory intrinsic must be a noop.

    if (SrcIsUndefined || IsPointerUndefined(MI->getRawDest())) {

      Builder.CreateAssumption(Builder.CreateIsNull(MI->getLength()));

      return eraseInstFromFunction(CI);

    }


    // If we have a memmove and the source operation is a constant global,

    // then the source and dest pointers can't alias, so we can change this

    // into a call to memcpy.

    if (auto *MMI = dyn_cast<AnyMemMoveInst>(MI)) {

      if (GlobalVariable *GVSrc = dyn_cast<GlobalVariable>(MMI->getSource()))

        if (GVSrc->isConstant()) {

          Module *M = CI.getModule();

          Intrinsic::ID MemCpyID =

              MMI->isAtomic()

                  ? Intrinsic::memcpy_element_unordered_atomic

                  : Intrinsic::memcpy;

          Type *Tys[3] = { CI.getArgOperand(0)->getType(),

                           CI.getArgOperand(1)->getType(),

                           CI.getArgOperand(2)->getType() };

          CI.setCalledFunction(

              Intrinsic::getOrInsertDeclaration(M, MemCpyID, Tys));

          return II;

        }

    }

  }


  // For fixed width vector result intrinsics, use the generic demanded vector

  // support.

  if (auto *IIFVTy = dyn_cast<FixedVectorType>(II->getType())) {

    auto VWidth = IIFVTy->getNumElements();

    APInt PoisonElts(VWidth, 0);

    APInt AllOnesEltMask(APInt::getAllOnes(VWidth));

    if (Value *V = SimplifyDemandedVectorElts(II, AllOnesEltMask, PoisonElts)) {

      if (V != II)

        return replaceInstUsesWith(*II, V);

      return II;

    }

  }


  if (II->isCommutative()) {

    if (auto Pair = matchSymmetricPair(II->getOperand(0), II->getOperand(1))) {

      replaceOperand(*II, 0, Pair->first);

      replaceOperand(*II, 1, Pair->second);

      return II;

    }


    if (CallInst *NewCall = canonicalizeConstantArg0ToArg1(CI))

      return NewCall;

  }


  // Unused constrained FP intrinsic calls may have declared side effect, which

  // prevents it from being removed. In some cases however the side effect is

  // actually absent. To detect this case, call SimplifyConstrainedFPCall. If it

  // returns a replacement, the call may be removed.

  if (CI.use_empty() && isa<ConstrainedFPIntrinsic>(CI)) {

    if (simplifyConstrainedFPCall(&CI, SQ.getWithInstruction(&CI)))

      return eraseInstFromFunction(CI);

  }


  Intrinsic::ID IID = II->getIntrinsicID();

  switch (IID) {

  case Intrinsic::objectsize: {

    SmallVector<Instruction *> InsertedInstructions;

    if (Value *V = lowerObjectSizeCall(II, DL, &TLI, AA, /*MustSucceed=*/false,

                                       &InsertedInstructions)) {

      for (Instruction *Inserted : InsertedInstructions)

        Worklist.add(Inserted);

      return replaceInstUsesWith(CI, V);

    }

    return nullptr;

  }

  case Intrinsic::abs: {

    Value *IIOperand = II->getArgOperand(0);

    bool IntMinIsPoison = cast<Constant>(II->getArgOperand(1))->isOneValue();


    // abs(-x) -> abs(x)

    Value *X;

    if (match(IIOperand, m_Neg(m_Value(X)))) {

      if (cast<Instruction>(IIOperand)->hasNoSignedWrap() || IntMinIsPoison)

        replaceOperand(*II, 1, Builder.getTrue());

      return replaceOperand(*II, 0, X);

    }

    if (match(IIOperand, m_c_Select(m_Neg(m_Value(X)), m_Deferred(X))))

      return replaceOperand(*II, 0, X);


    Value *Y;

    // abs(a * abs(b)) -> abs(a * b)

    if (match(IIOperand,

              m_OneUse(m_c_Mul(m_Value(X),

                               m_Intrinsic<Intrinsic::abs>(m_Value(Y)))))) {

      bool NSW =

          cast<Instruction>(IIOperand)->hasNoSignedWrap() && IntMinIsPoison;

      auto *XY = NSW ? Builder.CreateNSWMul(X, Y) : Builder.CreateMul(X, Y);

      return replaceOperand(*II, 0, XY);

    }


    if (std::optional<bool> Known =

            getKnownSignOrZero(IIOperand, SQ.getWithInstruction(II))) {

      // abs(x) -> x if x >= 0 (include abs(x-y) --> x - y where x >= y)

      // abs(x) -> x if x > 0 (include abs(x-y) --> x - y where x > y)

      if (!*Known)

        return replaceInstUsesWith(*II, IIOperand);


      // abs(x) -> -x if x < 0

      // abs(x) -> -x if x < = 0 (include abs(x-y) --> y - x where x <= y)

      if (IntMinIsPoison)

        return BinaryOperator::CreateNSWNeg(IIOperand);

      return BinaryOperator::CreateNeg(IIOperand);

    }


    // abs (sext X) --> zext (abs X*)

    // Clear the IsIntMin (nsw) bit on the abs to allow narrowing.

    if (match(IIOperand, m_OneUse(m_SExt(m_Value(X))))) {

      Value *NarrowAbs =

          Builder.CreateBinaryIntrinsic(Intrinsic::abs, X, Builder.getFalse());

      return CastInst::Create(Instruction::ZExt, NarrowAbs, II->getType());

    }


    // Match a complicated way to check if a number is odd/even:

    // abs (srem X, 2) --> and X, 1

    const APInt *C;

    if (match(IIOperand, m_SRem(m_Value(X), m_APInt(C))) && *C == 2)

      return BinaryOperator::CreateAnd(X, ConstantInt::get(II->getType(), 1));


    break;

  }

  case Intrinsic::umin: {

    Value *I0 = II->getArgOperand(0), *I1 = II->getArgOperand(1);

    // umin(x, 1) == zext(x != 0)

    if (match(I1, m_One())) {

      assert(II->getType()->getScalarSizeInBits() != 1 &&

             "Expected simplify of umin with max constant");

      Value *Zero = Constant::getNullValue(I0->getType());

      Value *Cmp = Builder.CreateICmpNE(I0, Zero);

      return CastInst::Create(Instruction::ZExt, Cmp, II->getType());

    }

    // umin(cttz(x), const) --> cttz(x | (1 << const))

    if (Value *FoldedCttz =

            foldMinimumOverTrailingOrLeadingZeroCount<Intrinsic::cttz>(

                I0, I1, DL, Builder))

      return replaceInstUsesWith(*II, FoldedCttz);

    // umin(ctlz(x), const) --> ctlz(x | (SignedMin >> const))

    if (Value *FoldedCtlz =

            foldMinimumOverTrailingOrLeadingZeroCount<Intrinsic::ctlz>(

                I0, I1, DL, Builder))

      return replaceInstUsesWith(*II, FoldedCtlz);

    [[fallthrough]];

  }

  case Intrinsic::umax: {

    Value *I0 = II->getArgOperand(0), *I1 = II->getArgOperand(1);

    Value *X, *Y;

    if (match(I0, m_ZExt(m_Value(X))) && match(I1, m_ZExt(m_Value(Y))) &&

        (I0->hasOneUse() || I1->hasOneUse()) && X->getType() == Y->getType()) {

      Value *NarrowMaxMin = Builder.CreateBinaryIntrinsic(IID, X, Y);

      return CastInst::Create(Instruction::ZExt, NarrowMaxMin, II->getType());

    }

    Constant *C;

    if (match(I0, m_ZExt(m_Value(X))) && match(I1, m_Constant(C)) &&

        I0->hasOneUse()) {

      if (Constant *NarrowC = getLosslessUnsignedTrunc(C, X->getType(), DL)) {

        Value *NarrowMaxMin = Builder.CreateBinaryIntrinsic(IID, X, NarrowC);

        return CastInst::Create(Instruction::ZExt, NarrowMaxMin, II->getType());

      }

    }

    // If C is not 0:

    //   umax(nuw_shl(x, C), x + 1) -> x == 0 ? 1 : nuw_shl(x, C)

    // If C is not 0 or 1:

    //   umax(nuw_mul(x, C), x + 1) -> x == 0 ? 1 : nuw_mul(x, C)

    auto foldMaxMulShift = [&](Value *A, Value *B) -> Instruction * {

      const APInt *C;

      Value *X;

      if (!match(A, m_NUWShl(m_Value(X), m_APInt(C))) &&

          !(match(A, m_NUWMul(m_Value(X), m_APInt(C))) && !C->isOne()))

        return nullptr;

      if (C->isZero())

        return nullptr;

      if (!match(B, m_OneUse(m_Add(m_Specific(X), m_One()))))

        return nullptr;


      Value *Cmp = Builder.CreateICmpEQ(X, ConstantInt::get(X->getType(), 0));

      Value *NewSelect =

          Builder.CreateSelect(Cmp, ConstantInt::get(X->getType(), 1), A);

      return replaceInstUsesWith(*II, NewSelect);

    };


    if (IID == Intrinsic::umax) {

      if (Instruction *I = foldMaxMulShift(I0, I1))

        return I;

      if (Instruction *I = foldMaxMulShift(I1, I0))

        return I;

    }


    // If both operands of unsigned min/max are sign-extended, it is still ok

    // to narrow the operation.

    [[fallthrough]];

  }

  case Intrinsic::smax:

  case Intrinsic::smin: {

    Value *I0 = II->getArgOperand(0), *I1 = II->getArgOperand(1);

    Value *X, *Y;

    if (match(I0, m_SExt(m_Value(X))) && match(I1, m_SExt(m_Value(Y))) &&

        (I0->hasOneUse() || I1->hasOneUse()) && X->getType() == Y->getType()) {

      Value *NarrowMaxMin = Builder.CreateBinaryIntrinsic(IID, X, Y);

      return CastInst::Create(Instruction::SExt, NarrowMaxMin, II->getType());

    }


    Constant *C;

    if (match(I0, m_SExt(m_Value(X))) && match(I1, m_Constant(C)) &&

        I0->hasOneUse()) {

      if (Constant *NarrowC = getLosslessSignedTrunc(C, X->getType(), DL)) {

        Value *NarrowMaxMin = Builder.CreateBinaryIntrinsic(IID, X, NarrowC);

        return CastInst::Create(Instruction::SExt, NarrowMaxMin, II->getType());

      }

    }


    // smax(smin(X, MinC), MaxC) -> smin(smax(X, MaxC), MinC) if MinC s>= MaxC

    // umax(umin(X, MinC), MaxC) -> umin(umax(X, MaxC), MinC) if MinC u>= MaxC

    const APInt *MinC, *MaxC;

    auto CreateCanonicalClampForm = [&](bool IsSigned) {

      auto MaxIID = IsSigned ? Intrinsic::smax : Intrinsic::umax;

      auto MinIID = IsSigned ? Intrinsic::smin : Intrinsic::umin;

      Value *NewMax = Builder.CreateBinaryIntrinsic(

          MaxIID, X, ConstantInt::get(X->getType(), *MaxC));

      return replaceInstUsesWith(

          *II, Builder.CreateBinaryIntrinsic(

                   MinIID, NewMax, ConstantInt::get(X->getType(), *MinC)));

    };

    if (IID == Intrinsic::smax &&

        match(I0, m_OneUse(m_Intrinsic<Intrinsic::smin>(m_Value(X),

                                                        m_APInt(MinC)))) &&

        match(I1, m_APInt(MaxC)) && MinC->sgt(*MaxC))

      return CreateCanonicalClampForm(true);

    if (IID == Intrinsic::umax &&

        match(I0, m_OneUse(m_Intrinsic<Intrinsic::umin>(m_Value(X),

                                                        m_APInt(MinC)))) &&

        match(I1, m_APInt(MaxC)) && MinC->ugt(*MaxC))

      return CreateCanonicalClampForm(false);


    // umin(i1 X, i1 Y) -> and i1 X, Y

    // smax(i1 X, i1 Y) -> and i1 X, Y

    if ((IID == Intrinsic::umin || IID == Intrinsic::smax) &&

        II->getType()->isIntOrIntVectorTy(1)) {

      return BinaryOperator::CreateAnd(I0, I1);

    }


    // umax(i1 X, i1 Y) -> or i1 X, Y

    // smin(i1 X, i1 Y) -> or i1 X, Y

    if ((IID == Intrinsic::umax || IID == Intrinsic::smin) &&

        II->getType()->isIntOrIntVectorTy(1)) {

      return BinaryOperator::CreateOr(I0, I1);

    }


    // smin(smax(X, -1), 1) -> scmp(X, 0)

    // smax(smin(X, 1), -1) -> scmp(X, 0)

    // At this point, smax(smin(X, 1), -1) is changed to smin(smax(X, -1)

    // And i1's have been changed to and/ors

    // So we only need to check for smin

    if (IID == Intrinsic::smin) {

      if (match(I0, m_OneUse(m_SMax(m_Value(X), m_AllOnes()))) &&

          match(I1, m_One())) {

        Value *Zero = ConstantInt::get(X->getType(), 0);

        return replaceInstUsesWith(

            CI,

            Builder.CreateIntrinsic(II->getType(), Intrinsic::scmp, {X, Zero}));

      }

    }


    if (IID == Intrinsic::smax || IID == Intrinsic::smin) {

      // smax (neg nsw X), (neg nsw Y) --> neg nsw (smin X, Y)

      // smin (neg nsw X), (neg nsw Y) --> neg nsw (smax X, Y)

      // TODO: Canonicalize neg after min/max if I1 is constant.

      if (match(I0, m_NSWNeg(m_Value(X))) && match(I1, m_NSWNeg(m_Value(Y))) &&

          (I0->hasOneUse() || I1->hasOneUse())) {

        Intrinsic::ID InvID = getInverseMinMaxIntrinsic(IID);

        Value *InvMaxMin = Builder.CreateBinaryIntrinsic(InvID, X, Y);

        return BinaryOperator::CreateNSWNeg(InvMaxMin);

      }

    }


    // (umax X, (xor X, Pow2))

    //      -> (or X, Pow2)

    // (umin X, (xor X, Pow2))

    //      -> (and X, ~Pow2)

    // (smax X, (xor X, Pos_Pow2))

    //      -> (or X, Pos_Pow2)

    // (smin X, (xor X, Pos_Pow2))

    //      -> (and X, ~Pos_Pow2)

    // (smax X, (xor X, Neg_Pow2))

    //      -> (and X, ~Neg_Pow2)

    // (smin X, (xor X, Neg_Pow2))

    //      -> (or X, Neg_Pow2)

    if ((match(I0, m_c_Xor(m_Specific(I1), m_Value(X))) ||

         match(I1, m_c_Xor(m_Specific(I0), m_Value(X)))) &&

        isKnownToBeAPowerOfTwo(X, /* OrZero */ true)) {

      bool UseOr = IID == Intrinsic::smax || IID == Intrinsic::umax;

      bool UseAndN = IID == Intrinsic::smin || IID == Intrinsic::umin;


      if (IID == Intrinsic::smax || IID == Intrinsic::smin) {

        auto KnownSign = getKnownSign(X, SQ.getWithInstruction(II));

        if (KnownSign == std::nullopt) {

          UseOr = false;

          UseAndN = false;

        } else if (*KnownSign /* true is Signed. */) {

          UseOr ^= true;

          UseAndN ^= true;

          Type *Ty = I0->getType();

          // Negative power of 2 must be IntMin. It's possible to be able to

          // prove negative / power of 2 without actually having known bits, so

          // just get the value by hand.

          X = Constant::getIntegerValue(

              Ty, APInt::getSignedMinValue(Ty->getScalarSizeInBits()));

        }

      }

      if (UseOr)

        return BinaryOperator::CreateOr(I0, X);

      else if (UseAndN)

        return BinaryOperator::CreateAnd(I0, Builder.CreateNot(X));

    }


    // If we can eliminate ~A and Y is free to invert:

    // max ~A, Y --> ~(min A, ~Y)

    //

    // Examples:

    // max ~A, ~Y --> ~(min A, Y)

    // max ~A, C --> ~(min A, ~C)

    // max ~A, (max ~Y, ~Z) --> ~min( A, (min Y, Z))

    auto moveNotAfterMinMax = [&](Value *X, Value *Y) -> Instruction * {

      Value *A;

      if (match(X, m_OneUse(m_Not(m_Value(A)))) &&

          !isFreeToInvert(A, A->hasOneUse())) {

        if (Value *NotY = getFreelyInverted(Y, Y->hasOneUse(), &Builder)) {

          Intrinsic::ID InvID = getInverseMinMaxIntrinsic(IID);

          Value *InvMaxMin = Builder.CreateBinaryIntrinsic(InvID, A, NotY);

          return BinaryOperator::CreateNot(InvMaxMin);

        }

      }

      return nullptr;

    };


    if (Instruction *I = moveNotAfterMinMax(I0, I1))

      return I;

    if (Instruction *I = moveNotAfterMinMax(I1, I0))

      return I;


    if (Instruction *I = moveAddAfterMinMax(II, Builder))

      return I;


    // minmax (X & NegPow2C, Y & NegPow2C) --> minmax(X, Y) & NegPow2C

    const APInt *RHSC;

    if (match(I0, m_OneUse(m_And(m_Value(X), m_NegatedPower2(RHSC)))) &&

        match(I1, m_OneUse(m_And(m_Value(Y), m_SpecificInt(*RHSC)))))

      return BinaryOperator::CreateAnd(Builder.CreateBinaryIntrinsic(IID, X, Y),

                                       ConstantInt::get(II->getType(), *RHSC));


    // smax(X, -X) --> abs(X)

    // smin(X, -X) --> -abs(X)

    // umax(X, -X) --> -abs(X)

    // umin(X, -X) --> abs(X)

    if (isKnownNegation(I0, I1)) {

      // We can choose either operand as the input to abs(), but if we can

      // eliminate the only use of a value, that's better for subsequent

      // transforms/analysis.

      if (I0->hasOneUse() && !I1->hasOneUse())

        std::swap(I0, I1);


      // This is some variant of abs(). See if we can propagate 'nsw' to the abs

      // operation and potentially its negation.

      bool IntMinIsPoison = isKnownNegation(I0, I1, /* NeedNSW */ true);

      Value *Abs = Builder.CreateBinaryIntrinsic(

          Intrinsic::abs, I0,

          ConstantInt::getBool(II->getContext(), IntMinIsPoison));


      // We don't have a "nabs" intrinsic, so negate if needed based on the

      // max/min operation.

      if (IID == Intrinsic::smin || IID == Intrinsic::umax)

        Abs = Builder.CreateNeg(Abs, "nabs", IntMinIsPoison);

      return replaceInstUsesWith(CI, Abs);

    }


    if (Instruction *Sel = foldClampRangeOfTwo(II, Builder))

      return Sel;


    if (Instruction *SAdd = matchSAddSubSat(*II))

      return SAdd;


    if (Value *NewMinMax = reassociateMinMaxWithConstants(II, Builder, SQ))

      return replaceInstUsesWith(*II, NewMinMax);


    if (Instruction *R = reassociateMinMaxWithConstantInOperand(II, Builder))

      return R;


    if (Instruction *NewMinMax = factorizeMinMaxTree(II))

       return NewMinMax;


    // Try to fold minmax with constant RHS based on range information

    if (match(I1, m_APIntAllowPoison(RHSC))) {

      ICmpInst::Predicate Pred =

          ICmpInst::getNonStrictPredicate(MinMaxIntrinsic::getPredicate(IID));

      bool IsSigned = MinMaxIntrinsic::isSigned(IID);

      ConstantRange LHS_CR = computeConstantRangeIncludingKnownBits(

          I0, IsSigned, SQ.getWithInstruction(II));

      if (!LHS_CR.isFullSet()) {

        if (LHS_CR.icmp(Pred, *RHSC))

          return replaceInstUsesWith(*II, I0);

        if (LHS_CR.icmp(ICmpInst::getSwappedPredicate(Pred), *RHSC))

          return replaceInstUsesWith(*II,

                                     ConstantInt::get(II->getType(), *RHSC));

      }

    }


    if (Value *V = foldIntrinsicUsingDistributiveLaws(II, Builder))

      return replaceInstUsesWith(*II, V);


    break;

  }

  case Intrinsic::scmp: {

    Value *I0 = II->getArgOperand(0), *I1 = II->getArgOperand(1);

    Value *LHS, *RHS;

    if (match(I0, m_NSWSub(m_Value(LHS), m_Value(RHS))) && match(I1, m_Zero()))

      return replaceInstUsesWith(

          CI,

          Builder.CreateIntrinsic(II->getType(), Intrinsic::scmp, {LHS, RHS}));

    break;

  }

  case Intrinsic::bitreverse: {

    Value *IIOperand = II->getArgOperand(0);

    // bitrev (zext i1 X to ?) --> X ? SignBitC : 0

    Value *X;

    if (match(IIOperand, m_ZExt(m_Value(X))) &&

        X->getType()->isIntOrIntVectorTy(1)) {

      Type *Ty = II->getType();

      APInt SignBit = APInt::getSignMask(Ty->getScalarSizeInBits());

      return SelectInst::Create(X, ConstantInt::get(Ty, SignBit),

                                ConstantInt::getNullValue(Ty));

    }


    if (Instruction *crossLogicOpFold =

        foldBitOrderCrossLogicOp<Intrinsic::bitreverse>(IIOperand, Builder))

      return crossLogicOpFold;


    break;

  }

  case Intrinsic::bswap: {

    Value *IIOperand = II->getArgOperand(0);


    // Try to canonicalize bswap-of-logical-shift-by-8-bit-multiple as

    // inverse-shift-of-bswap:

    // bswap (shl X, Y) --> lshr (bswap X), Y

    // bswap (lshr X, Y) --> shl (bswap X), Y

    Value *X, *Y;

    if (match(IIOperand, m_OneUse(m_LogicalShift(m_Value(X), m_Value(Y))))) {

      unsigned BitWidth = IIOperand->getType()->getScalarSizeInBits();

      if (MaskedValueIsZero(Y, APInt::getLowBitsSet(BitWidth, 3))) {

        Value *NewSwap = Builder.CreateUnaryIntrinsic(Intrinsic::bswap, X);

        BinaryOperator::BinaryOps InverseShift =

            cast<BinaryOperator>(IIOperand)->getOpcode() == Instruction::Shl

                ? Instruction::LShr

                : Instruction::Shl;

        return BinaryOperator::Create(InverseShift, NewSwap, Y);

      }

    }


    KnownBits Known = computeKnownBits(IIOperand, II);

    uint64_t LZ = alignDown(Known.countMinLeadingZeros(), 8);

    uint64_t TZ = alignDown(Known.countMinTrailingZeros(), 8);

    unsigned BW = Known.getBitWidth();


    // bswap(x) -> shift(x) if x has exactly one "active byte"

    if (BW - LZ - TZ == 8) {

      assert(LZ != TZ && "active byte cannot be in the middle");

      if (LZ > TZ)  // -> shl(x) if the "active byte" is in the low part of x

        return BinaryOperator::CreateNUWShl(

            IIOperand, ConstantInt::get(IIOperand->getType(), LZ - TZ));

      // -> lshr(x) if the "active byte" is in the high part of x

      return BinaryOperator::CreateExactLShr(

            IIOperand, ConstantInt::get(IIOperand->getType(), TZ - LZ));

    }


    // bswap(trunc(bswap(x))) -> trunc(lshr(x, c))

    if (match(IIOperand, m_Trunc(m_BSwap(m_Value(X))))) {

      unsigned C = X->getType()->getScalarSizeInBits() - BW;

      Value *CV = ConstantInt::get(X->getType(), C);

      Value *V = Builder.CreateLShr(X, CV);

      return new TruncInst(V, IIOperand->getType());

    }


    if (Instruction *crossLogicOpFold =

            foldBitOrderCrossLogicOp<Intrinsic::bswap>(IIOperand, Builder)) {

      return crossLogicOpFold;

    }


    // Try to fold into bitreverse if bswap is the root of the expression tree.

    if (Instruction *BitOp = matchBSwapOrBitReverse(*II, /*MatchBSwaps*/ false,

                                                    /*MatchBitReversals*/ true))

      return BitOp;

    break;

  }

  case Intrinsic::masked_load:

    if (Value *SimplifiedMaskedOp = simplifyMaskedLoad(*II))

      return replaceInstUsesWith(CI, SimplifiedMaskedOp);

    break;

  case Intrinsic::masked_store:

    return simplifyMaskedStore(*II);

  case Intrinsic::masked_gather:

    return simplifyMaskedGather(*II);

  case Intrinsic::masked_scatter:

    return simplifyMaskedScatter(*II);

  case Intrinsic::launder_invariant_group:

  case Intrinsic::strip_invariant_group:

    if (auto *SkippedBarrier = simplifyInvariantGroupIntrinsic(*II, *this))

      return replaceInstUsesWith(*II, SkippedBarrier);

    break;

  case Intrinsic::powi:

    if (ConstantInt *Power = dyn_cast<ConstantInt>(II->getArgOperand(1))) {

      // 0 and 1 are handled in instsimplify

      // powi(x, -1) -> 1/x

      if (Power->isMinusOne())

        return BinaryOperator::CreateFDivFMF(ConstantFP::get(CI.getType(), 1.0),

                                             II->getArgOperand(0), II);

      // powi(x, 2) -> x*x

      if (Power->equalsInt(2))

        return BinaryOperator::CreateFMulFMF(II->getArgOperand(0),

                                             II->getArgOperand(0), II);


      if (!Power->getValue()[0]) {

        Value *X;

        // If power is even:

        // powi(-x, p) -> powi(x, p)

        // powi(fabs(x), p) -> powi(x, p)

        // powi(copysign(x, y), p) -> powi(x, p)

        if (match(II->getArgOperand(0), m_FNeg(m_Value(X))) ||

            match(II->getArgOperand(0), m_FAbs(m_Value(X))) ||

            match(II->getArgOperand(0),

                  m_Intrinsic<Intrinsic::copysign>(m_Value(X), m_Value())))

          return replaceOperand(*II, 0, X);

      }

    }

    break;


  case Intrinsic::cttz:

  case Intrinsic::ctlz:

    if (auto *I = foldCttzCtlz(*II, *this))

      return I;

    break;


  case Intrinsic::ctpop:

    if (auto *I = foldCtpop(*II, *this))

      return I;

    break;


  case Intrinsic::fshl:

  case Intrinsic::fshr: {

    Value *Op0 = II->getArgOperand(0), *Op1 = II->getArgOperand(1);

    Type *Ty = II->getType();

    unsigned BitWidth = Ty->getScalarSizeInBits();

    Constant *ShAmtC;

    if (match(II->getArgOperand(2), m_ImmConstant(ShAmtC))) {

      // Canonicalize a shift amount constant operand to modulo the bit-width.

      Constant *WidthC = ConstantInt::get(Ty, BitWidth);

      Constant *ModuloC =

          ConstantFoldBinaryOpOperands(Instruction::URem, ShAmtC, WidthC, DL);

      if (!ModuloC)

        return nullptr;

      if (ModuloC != ShAmtC)

        return replaceOperand(*II, 2, ModuloC);


      assert(match(ConstantFoldCompareInstOperands(ICmpInst::ICMP_UGT, WidthC,

                                                   ShAmtC, DL),

                   m_One()) &&

             "Shift amount expected to be modulo bitwidth");


      // Canonicalize funnel shift right by constant to funnel shift left. This

      // is not entirely arbitrary. For historical reasons, the backend may

      // recognize rotate left patterns but miss rotate right patterns.

      if (IID == Intrinsic::fshr) {

        // fshr X, Y, C --> fshl X, Y, (BitWidth - C) if C is not zero.

        if (!isKnownNonZero(ShAmtC, SQ.getWithInstruction(II)))

          return nullptr;


        Constant *LeftShiftC = ConstantExpr::getSub(WidthC, ShAmtC);

        Module *Mod = II->getModule();

        Function *Fshl =

            Intrinsic::getOrInsertDeclaration(Mod, Intrinsic::fshl, Ty);

        return CallInst::Create(Fshl, { Op0, Op1, LeftShiftC });

      }

      assert(IID == Intrinsic::fshl &&

             "All funnel shifts by simple constants should go left");


      // fshl(X, 0, C) --> shl X, C

      // fshl(X, undef, C) --> shl X, C

      if (match(Op1, m_ZeroInt()) || match(Op1, m_Undef()))

        return BinaryOperator::CreateShl(Op0, ShAmtC);


      // fshl(0, X, C) --> lshr X, (BW-C)

      // fshl(undef, X, C) --> lshr X, (BW-C)

      if (match(Op0, m_ZeroInt()) || match(Op0, m_Undef()))

        return BinaryOperator::CreateLShr(Op1,

                                          ConstantExpr::getSub(WidthC, ShAmtC));


      // fshl i16 X, X, 8 --> bswap i16 X (reduce to more-specific form)

      if (Op0 == Op1 && BitWidth == 16 && match(ShAmtC, m_SpecificInt(8))) {

        Module *Mod = II->getModule();

        Function *Bswap =

            Intrinsic::getOrInsertDeclaration(Mod, Intrinsic::bswap, Ty);

        return CallInst::Create(Bswap, { Op0 });

      }

      if (Instruction *BitOp =

              matchBSwapOrBitReverse(*II, /*MatchBSwaps*/ true,

                                     /*MatchBitReversals*/ true))

        return BitOp;


      // R = fshl(X, X, C2)

      // fshl(R, R, C1) --> fshl(X, X, (C1 + C2) % bitsize)

      Value *InnerOp;

      const APInt *ShAmtInnerC, *ShAmtOuterC;

      if (match(Op0, m_FShl(m_Value(InnerOp), m_Deferred(InnerOp),

                            m_APInt(ShAmtInnerC))) &&

          match(ShAmtC, m_APInt(ShAmtOuterC)) && Op0 == Op1) {

        APInt Sum = *ShAmtOuterC + *ShAmtInnerC;

        APInt Modulo = Sum.urem(APInt(Sum.getBitWidth(), BitWidth));

        if (Modulo.isZero())

          return replaceInstUsesWith(*II, InnerOp);

        Constant *ModuloC = ConstantInt::get(Ty, Modulo);

        return CallInst::Create(cast<IntrinsicInst>(Op0)->getCalledFunction(),

                                {InnerOp, InnerOp, ModuloC});

      }

    }


    // fshl(X, X, Neg(Y)) --> fshr(X, X, Y)

    // fshr(X, X, Neg(Y)) --> fshl(X, X, Y)

    // if BitWidth is a power-of-2

    Value *Y;

    if (Op0 == Op1 && isPowerOf2_32(BitWidth) &&

        match(II->getArgOperand(2), m_Neg(m_Value(Y)))) {

      Module *Mod = II->getModule();

      Function *OppositeShift = Intrinsic::getOrInsertDeclaration(

          Mod, IID == Intrinsic::fshl ? Intrinsic::fshr : Intrinsic::fshl, Ty);

      return CallInst::Create(OppositeShift, {Op0, Op1, Y});

    }


    // fshl(X, 0, Y) --> shl(X, and(Y, BitWidth - 1)) if bitwidth is a

    // power-of-2

    if (IID == Intrinsic::fshl && isPowerOf2_32(BitWidth) &&

        match(Op1, m_ZeroInt())) {

      Value *Op2 = II->getArgOperand(2);

      Value *And = Builder.CreateAnd(Op2, ConstantInt::get(Ty, BitWidth - 1));

      return BinaryOperator::CreateShl(Op0, And);

    }


    // Left or right might be masked.

    if (SimplifyDemandedInstructionBits(*II))

      return &CI;


    // The shift amount (operand 2) of a funnel shift is modulo the bitwidth,

    // so only the low bits of the shift amount are demanded if the bitwidth is

    // a power-of-2.

    if (!isPowerOf2_32(BitWidth))

      break;

    APInt Op2Demanded = APInt::getLowBitsSet(BitWidth, Log2_32_Ceil(BitWidth));

    KnownBits Op2Known(BitWidth);

    if (SimplifyDemandedBits(II, 2, Op2Demanded, Op2Known))

      return &CI;

    break;

  }

  case Intrinsic::ptrmask: {

    unsigned BitWidth = DL.getPointerTypeSizeInBits(II->getType());

    KnownBits Known(BitWidth);

    if (SimplifyDemandedInstructionBits(*II, Known))

      return II;


    Value *InnerPtr, *InnerMask;

    bool Changed = false;

    // Combine:

    // (ptrmask (ptrmask p, A), B)

    //    -> (ptrmask p, (and A, B))

    if (match(II->getArgOperand(0),

              m_OneUse(m_Intrinsic<Intrinsic::ptrmask>(m_Value(InnerPtr),

                                                       m_Value(InnerMask))))) {

      assert(II->getArgOperand(1)->getType() == InnerMask->getType() &&

             "Mask types must match");

      // TODO: If InnerMask == Op1, we could copy attributes from inner

      // callsite -> outer callsite.

      Value *NewMask = Builder.CreateAnd(II->getArgOperand(1), InnerMask);

      replaceOperand(CI, 0, InnerPtr);

      replaceOperand(CI, 1, NewMask);

      Changed = true;

    }


    // See if we can deduce non-null.

    if (!CI.hasRetAttr(Attribute::NonNull) &&

        (Known.isNonZero() ||

         isKnownNonZero(II, getSimplifyQuery().getWithInstruction(II)))) {

      CI.addRetAttr(Attribute::NonNull);

      Changed = true;

    }


    unsigned NewAlignmentLog =

        std::min(Value::MaxAlignmentExponent,

                 std::min(BitWidth - 1, Known.countMinTrailingZeros()));

    // Known bits will capture if we had alignment information associated with

    // the pointer argument.

    if (NewAlignmentLog > Log2(CI.getRetAlign().valueOrOne())) {

      CI.addRetAttr(Attribute::getWithAlignment(

          CI.getContext(), Align(uint64_t(1) << NewAlignmentLog)));

      Changed = true;

    }

    if (Changed)

      return &CI;

    break;

  }

  case Intrinsic::uadd_with_overflow:

  case Intrinsic::sadd_with_overflow: {

    if (Instruction *I = foldIntrinsicWithOverflowCommon(II))

      return I;


    // Given 2 constant operands whose sum does not overflow:

    // uaddo (X +nuw C0), C1 -> uaddo X, C0 + C1

    // saddo (X +nsw C0), C1 -> saddo X, C0 + C1

    Value *X;

    const APInt *C0, *C1;

    Value *Arg0 = II->getArgOperand(0);

    Value *Arg1 = II->getArgOperand(1);

    bool IsSigned = IID == Intrinsic::sadd_with_overflow;

    bool HasNWAdd = IsSigned

                        ? match(Arg0, m_NSWAddLike(m_Value(X), m_APInt(C0)))

                        : match(Arg0, m_NUWAddLike(m_Value(X), m_APInt(C0)));

    if (HasNWAdd && match(Arg1, m_APInt(C1))) {

      bool Overflow;

      APInt NewC =

          IsSigned ? C1->sadd_ov(*C0, Overflow) : C1->uadd_ov(*C0, Overflow);

      if (!Overflow)

        return replaceInstUsesWith(

            *II, Builder.CreateBinaryIntrinsic(

                     IID, X, ConstantInt::get(Arg1->getType(), NewC)));

    }

    break;

  }


  case Intrinsic::umul_with_overflow:

  case Intrinsic::smul_with_overflow:

  case Intrinsic::usub_with_overflow:

    if (Instruction *I = foldIntrinsicWithOverflowCommon(II))

      return I;

    break;


  case Intrinsic::ssub_with_overflow: {

    if (Instruction *I = foldIntrinsicWithOverflowCommon(II))

      return I;


    Constant *C;

    Value *Arg0 = II->getArgOperand(0);

    Value *Arg1 = II->getArgOperand(1);

    // Given a constant C that is not the minimum signed value

    // for an integer of a given bit width:

    //

    // ssubo X, C -> saddo X, -C

    if (match(Arg1, m_Constant(C)) && C->isNotMinSignedValue()) {

      Value *NegVal = ConstantExpr::getNeg(C);

      // Build a saddo call that is equivalent to the discovered

      // ssubo call.

      return replaceInstUsesWith(

          *II, Builder.CreateBinaryIntrinsic(Intrinsic::sadd_with_overflow,

                                             Arg0, NegVal));

    }


    break;

  }


  case Intrinsic::uadd_sat:

  case Intrinsic::sadd_sat:

  case Intrinsic::usub_sat:

  case Intrinsic::ssub_sat: {

    SaturatingInst *SI = cast<SaturatingInst>(II);

    Type *Ty = SI->getType();

    Value *Arg0 = SI->getLHS();

    Value *Arg1 = SI->getRHS();


    // Make use of known overflow information.

    OverflowResult OR = computeOverflow(SI->getBinaryOp(), SI->isSigned(),

                                        Arg0, Arg1, SI);

    switch (OR) {

      case OverflowResult::MayOverflow:

        break;

      case OverflowResult::NeverOverflows:

        if (SI->isSigned())

          return BinaryOperator::CreateNSW(SI->getBinaryOp(), Arg0, Arg1);

        else

          return BinaryOperator::CreateNUW(SI->getBinaryOp(), Arg0, Arg1);

      case OverflowResult::AlwaysOverflowsLow: {

        unsigned BitWidth = Ty->getScalarSizeInBits();

        APInt Min = APSInt::getMinValue(BitWidth, !SI->isSigned());

        return replaceInstUsesWith(*SI, ConstantInt::get(Ty, Min));

      }

      case OverflowResult::AlwaysOverflowsHigh: {

        unsigned BitWidth = Ty->getScalarSizeInBits();

        APInt Max = APSInt::getMaxValue(BitWidth, !SI->isSigned());

        return replaceInstUsesWith(*SI, ConstantInt::get(Ty, Max));

      }

    }


    // usub_sat((sub nuw C, A), C1) -> usub_sat(usub_sat(C, C1), A)

    // which is subsequently folded to:

    // usub_sat((sub nuw C, A), C1) -> usub_sat(C - C1, A) if C1 u< C

    // usub_sat((sub nuw C, A), C1) -> 0 otherwise

    Constant *C, *C1;

    Value *A;

    if (IID == Intrinsic::usub_sat &&

        match(Arg0, m_NUWSub(m_ImmConstant(C), m_Value(A))) &&

        match(Arg1, m_ImmConstant(C1))) {

      auto *NewC = Builder.CreateBinaryIntrinsic(Intrinsic::usub_sat, C, C1);

      auto *NewSub =

          Builder.CreateBinaryIntrinsic(Intrinsic::usub_sat, NewC, A);

      return replaceInstUsesWith(*SI, NewSub);

    }


    // ssub.sat(X, C) -> sadd.sat(X, -C) if C != MIN

    if (IID == Intrinsic::ssub_sat && match(Arg1, m_Constant(C)) &&

        C->isNotMinSignedValue()) {

      Value *NegVal = ConstantExpr::getNeg(C);

      return replaceInstUsesWith(

          *II, Builder.CreateBinaryIntrinsic(

              Intrinsic::sadd_sat, Arg0, NegVal));

    }


    // sat(sat(X + Val2) + Val) -> sat(X + (Val+Val2))

    // sat(sat(X - Val2) - Val) -> sat(X - (Val+Val2))

    // if Val and Val2 have the same sign

    if (auto *Other = dyn_cast<IntrinsicInst>(Arg0)) {

      Value *X;

      const APInt *Val, *Val2;

      APInt NewVal;

      bool IsUnsigned =

          IID == Intrinsic::uadd_sat || IID == Intrinsic::usub_sat;

      if (Other->getIntrinsicID() == IID &&

          match(Arg1, m_APInt(Val)) &&

          match(Other->getArgOperand(0), m_Value(X)) &&

          match(Other->getArgOperand(1), m_APInt(Val2))) {

        if (IsUnsigned)

          NewVal = Val->uadd_sat(*Val2);

        else if (Val->isNonNegative() == Val2->isNonNegative()) {

          bool Overflow;

          NewVal = Val->sadd_ov(*Val2, Overflow);

          if (Overflow) {

            // Both adds together may add more than SignedMaxValue

            // without saturating the final result.

            break;

          }

        } else {

          // Cannot fold saturated addition with different signs.

          break;

        }


        return replaceInstUsesWith(

            *II, Builder.CreateBinaryIntrinsic(

                     IID, X, ConstantInt::get(II->getType(), NewVal)));

      }

    }

    break;

  }


  case Intrinsic::minnum:

  case Intrinsic::maxnum:

  case Intrinsic::minimum:

  case Intrinsic::maximum: {

    Value *Arg0 = II->getArgOperand(0);

    Value *Arg1 = II->getArgOperand(1);

    Value *X, *Y;

    if (match(Arg0, m_FNeg(m_Value(X))) && match(Arg1, m_FNeg(m_Value(Y))) &&

        (Arg0->hasOneUse() || Arg1->hasOneUse())) {

      // If both operands are negated, invert the call and negate the result:

      // min(-X, -Y) --> -(max(X, Y))

      // max(-X, -Y) --> -(min(X, Y))

      Intrinsic::ID NewIID;

      switch (IID) {

      case Intrinsic::maxnum:

        NewIID = Intrinsic::minnum;

        break;

      case Intrinsic::minnum:

        NewIID = Intrinsic::maxnum;

        break;

      case Intrinsic::maximum:

        NewIID = Intrinsic::minimum;

        break;

      case Intrinsic::minimum:

        NewIID = Intrinsic::maximum;

        break;

      default:

        llvm_unreachable("unexpected intrinsic ID");

      }

      Value *NewCall = Builder.CreateBinaryIntrinsic(NewIID, X, Y, II);

      Instruction *FNeg = UnaryOperator::CreateFNeg(NewCall);

      FNeg->copyIRFlags(II);

      return FNeg;

    }


    // m(m(X, C2), C1) -> m(X, C)

    const APFloat *C1, *C2;

    if (auto *M = dyn_cast<IntrinsicInst>(Arg0)) {

      if (M->getIntrinsicID() == IID && match(Arg1, m_APFloat(C1)) &&

          ((match(M->getArgOperand(0), m_Value(X)) &&

            match(M->getArgOperand(1), m_APFloat(C2))) ||

           (match(M->getArgOperand(1), m_Value(X)) &&

            match(M->getArgOperand(0), m_APFloat(C2))))) {

        APFloat Res(0.0);

        switch (IID) {

        case Intrinsic::maxnum:

          Res = maxnum(*C1, *C2);

          break;

        case Intrinsic::minnum:

          Res = minnum(*C1, *C2);

          break;

        case Intrinsic::maximum:

          Res = maximum(*C1, *C2);

          break;

        case Intrinsic::minimum:

          Res = minimum(*C1, *C2);

          break;

        default:

          llvm_unreachable("unexpected intrinsic ID");

        }

        // TODO: Conservatively intersecting FMF. If Res == C2, the transform

        //       was a simplification (so Arg0 and its original flags could

        //       propagate?)

        Value *V = Builder.CreateBinaryIntrinsic(

            IID, X, ConstantFP::get(Arg0->getType(), Res),

            FMFSource::intersect(II, M));

        return replaceInstUsesWith(*II, V);

      }

    }


    // m((fpext X), (fpext Y)) -> fpext (m(X, Y))

    if (match(Arg0, m_OneUse(m_FPExt(m_Value(X)))) &&

        match(Arg1, m_OneUse(m_FPExt(m_Value(Y)))) &&

        X->getType() == Y->getType()) {

      Value *NewCall =

          Builder.CreateBinaryIntrinsic(IID, X, Y, II, II->getName());

      return new FPExtInst(NewCall, II->getType());

    }


    // max X, -X --> fabs X

    // min X, -X --> -(fabs X)

    // TODO: Remove one-use limitation? That is obviously better for max,

    // hence why we don't check for one-use for that. However,

    // it would be an extra instruction for min (fnabs), but

    // that is still likely better for analysis and codegen.

    auto IsMinMaxOrXNegX = [IID, &X](Value *Op0, Value *Op1) {

      if (match(Op0, m_FNeg(m_Value(X))) && match(Op1, m_Specific(X)))

        return Op0->hasOneUse() ||

               (IID != Intrinsic::minimum && IID != Intrinsic::minnum);

      return false;

    };


    if (IsMinMaxOrXNegX(Arg0, Arg1) || IsMinMaxOrXNegX(Arg1, Arg0)) {

      Value *R = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, X, II);

      if (IID == Intrinsic::minimum || IID == Intrinsic::minnum)

        R = Builder.CreateFNegFMF(R, II);

      return replaceInstUsesWith(*II, R);

    }


    break;

  }

  case Intrinsic::matrix_multiply: {

    // Optimize negation in matrix multiplication.


    // -A * -B -> A * B

    Value *A, *B;

    if (match(II->getArgOperand(0), m_FNeg(m_Value(A))) &&

        match(II->getArgOperand(1), m_FNeg(m_Value(B)))) {

      replaceOperand(*II, 0, A);

      replaceOperand(*II, 1, B);

      return II;

    }


    Value *Op0 = II->getOperand(0);

    Value *Op1 = II->getOperand(1);

    Value *OpNotNeg, *NegatedOp;

    unsigned NegatedOpArg, OtherOpArg;

    if (match(Op0, m_FNeg(m_Value(OpNotNeg)))) {

      NegatedOp = Op0;

      NegatedOpArg = 0;

      OtherOpArg = 1;

    } else if (match(Op1, m_FNeg(m_Value(OpNotNeg)))) {

      NegatedOp = Op1;

      NegatedOpArg = 1;

      OtherOpArg = 0;

    } else

      // Multiplication doesn't have a negated operand.

      break;


    // Only optimize if the negated operand has only one use.

    if (!NegatedOp->hasOneUse())

      break;


    Value *OtherOp = II->getOperand(OtherOpArg);

    VectorType *RetTy = cast<VectorType>(II->getType());

    VectorType *NegatedOpTy = cast<VectorType>(NegatedOp->getType());

    VectorType *OtherOpTy = cast<VectorType>(OtherOp->getType());

    ElementCount NegatedCount = NegatedOpTy->getElementCount();

    ElementCount OtherCount = OtherOpTy->getElementCount();

    ElementCount RetCount = RetTy->getElementCount();

    // (-A) * B -> A * (-B), if it is cheaper to negate B and vice versa.

    if (ElementCount::isKnownGT(NegatedCount, OtherCount) &&

        ElementCount::isKnownLT(OtherCount, RetCount)) {

      Value *InverseOtherOp = Builder.CreateFNeg(OtherOp);

      replaceOperand(*II, NegatedOpArg, OpNotNeg);

      replaceOperand(*II, OtherOpArg, InverseOtherOp);

      return II;

    }

    // (-A) * B -> -(A * B), if it is cheaper to negate the result

    if (ElementCount::isKnownGT(NegatedCount, RetCount)) {

      SmallVector<Value *, 5> NewArgs(II->args());

      NewArgs[NegatedOpArg] = OpNotNeg;

      Instruction *NewMul =

          Builder.CreateIntrinsic(II->getType(), IID, NewArgs, II);

      return replaceInstUsesWith(*II, Builder.CreateFNegFMF(NewMul, II));

    }

    break;

  }

  case Intrinsic::fmuladd: {

    // Try to simplify the underlying FMul.

    if (Value *V =

            simplifyFMulInst(II->getArgOperand(0), II->getArgOperand(1),

                             II->getFastMathFlags(), SQ.getWithInstruction(II)))

      return BinaryOperator::CreateFAddFMF(V, II->getArgOperand(2),

                                           II->getFastMathFlags());


    [[fallthrough]];

  }

  case Intrinsic::fma: {

    // fma fneg(x), fneg(y), z -> fma x, y, z

    Value *Src0 = II->getArgOperand(0);

    Value *Src1 = II->getArgOperand(1);

    Value *Src2 = II->getArgOperand(2);

    Value *X, *Y;

    if (match(Src0, m_FNeg(m_Value(X))) && match(Src1, m_FNeg(m_Value(Y)))) {

      replaceOperand(*II, 0, X);

      replaceOperand(*II, 1, Y);

      return II;

    }


    // fma fabs(x), fabs(x), z -> fma x, x, z

    if (match(Src0, m_FAbs(m_Value(X))) &&

        match(Src1, m_FAbs(m_Specific(X)))) {

      replaceOperand(*II, 0, X);

      replaceOperand(*II, 1, X);

      return II;

    }


    // Try to simplify the underlying FMul. We can only apply simplifications

    // that do not require rounding.

    if (Value *V = simplifyFMAFMul(Src0, Src1, II->getFastMathFlags(),

                                   SQ.getWithInstruction(II)))

      return BinaryOperator::CreateFAddFMF(V, Src2, II->getFastMathFlags());


    // fma x, y, 0 -> fmul x, y

    // This is always valid for -0.0, but requires nsz for +0.0 as

    // -0.0 + 0.0 = 0.0, which would not be the same as the fmul on its own.

    if (match(Src2, m_NegZeroFP()) ||

        (match(Src2, m_PosZeroFP()) && II->getFastMathFlags().noSignedZeros()))

      return BinaryOperator::CreateFMulFMF(Src0, Src1, II);


    // fma x, -1.0, y -> fsub y, x

    if (match(Src1, m_SpecificFP(-1.0)))

      return BinaryOperator::CreateFSubFMF(Src2, Src0, II);


    break;

  }

  case Intrinsic::copysign: {

    Value *Mag = II->getArgOperand(0), *Sign = II->getArgOperand(1);

    if (std::optional<bool> KnownSignBit = computeKnownFPSignBit(

            Sign, getSimplifyQuery().getWithInstruction(II))) {

      if (*KnownSignBit) {

        // If we know that the sign argument is negative, reduce to FNABS:

        // copysign Mag, -Sign --> fneg (fabs Mag)

        Value *Fabs = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, Mag, II);

        return replaceInstUsesWith(*II, Builder.CreateFNegFMF(Fabs, II));

      }


      // If we know that the sign argument is positive, reduce to FABS:

      // copysign Mag, +Sign --> fabs Mag

      Value *Fabs = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, Mag, II);

      return replaceInstUsesWith(*II, Fabs);

    }


    // Propagate sign argument through nested calls:

    // copysign Mag, (copysign ?, X) --> copysign Mag, X

    Value *X;

    if (match(Sign, m_Intrinsic<Intrinsic::copysign>(m_Value(), m_Value(X)))) {

      Value *CopySign =

          Builder.CreateCopySign(Mag, X, FMFSource::intersect(II, Sign));

      return replaceInstUsesWith(*II, CopySign);

    }


    // Clear sign-bit of constant magnitude:

    // copysign -MagC, X --> copysign MagC, X

    // TODO: Support constant folding for fabs

    const APFloat *MagC;

    if (match(Mag, m_APFloat(MagC)) && MagC->isNegative()) {

      APFloat PosMagC = *MagC;

      PosMagC.clearSign();

      return replaceOperand(*II, 0, ConstantFP::get(Mag->getType(), PosMagC));

    }


    // Peek through changes of magnitude's sign-bit. This call rewrites those:

    // copysign (fabs X), Sign --> copysign X, Sign

    // copysign (fneg X), Sign --> copysign X, Sign

    if (match(Mag, m_FAbs(m_Value(X))) || match(Mag, m_FNeg(m_Value(X))))

      return replaceOperand(*II, 0, X);


    break;

  }

  case Intrinsic::fabs: {

    Value *Cond, *TVal, *FVal;

    Value *Arg = II->getArgOperand(0);

    Value *X;

    // fabs (-X) --> fabs (X)

    if (match(Arg, m_FNeg(m_Value(X)))) {

        CallInst *Fabs = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, X, II);

        return replaceInstUsesWith(CI, Fabs);

    }


    if (match(Arg, m_Select(m_Value(Cond), m_Value(TVal), m_Value(FVal)))) {

      // fabs (select Cond, TrueC, FalseC) --> select Cond, AbsT, AbsF

      if (Arg->hasOneUse() ? (isa<Constant>(TVal) || isa<Constant>(FVal))

                           : (isa<Constant>(TVal) && isa<Constant>(FVal))) {

        CallInst *AbsT = Builder.CreateCall(II->getCalledFunction(), {TVal});

        CallInst *AbsF = Builder.CreateCall(II->getCalledFunction(), {FVal});

        SelectInst *SI = SelectInst::Create(Cond, AbsT, AbsF);

        FastMathFlags FMF1 = II->getFastMathFlags();

        FastMathFlags FMF2 = cast<SelectInst>(Arg)->getFastMathFlags();

        FMF2.setNoSignedZeros(false);

        SI->setFastMathFlags(FMF1 | FMF2);

        return SI;

      }

      // fabs (select Cond, -FVal, FVal) --> fabs FVal

      if (match(TVal, m_FNeg(m_Specific(FVal))))

        return replaceOperand(*II, 0, FVal);

      // fabs (select Cond, TVal, -TVal) --> fabs TVal

      if (match(FVal, m_FNeg(m_Specific(TVal))))

        return replaceOperand(*II, 0, TVal);

    }


    Value *Magnitude, *Sign;

    if (match(II->getArgOperand(0),

              m_CopySign(m_Value(Magnitude), m_Value(Sign)))) {

      // fabs (copysign x, y) -> (fabs x)

      CallInst *AbsSign =

          Builder.CreateUnaryIntrinsic(Intrinsic::fabs, Magnitude, II);

      return replaceInstUsesWith(*II, AbsSign);

    }


    [[fallthrough]];

  }

  case Intrinsic::ceil:

  case Intrinsic::floor:

  case Intrinsic::round:

  case Intrinsic::roundeven:

  case Intrinsic::nearbyint:

  case Intrinsic::rint:

  case Intrinsic::trunc: {

    Value *ExtSrc;

    if (match(II->getArgOperand(0), m_OneUse(m_FPExt(m_Value(ExtSrc))))) {

      // Narrow the call: intrinsic (fpext x) -> fpext (intrinsic x)

      Value *NarrowII = Builder.CreateUnaryIntrinsic(IID, ExtSrc, II);

      return new FPExtInst(NarrowII, II->getType());

    }

    break;

  }

  case Intrinsic::cos:

  case Intrinsic::amdgcn_cos: {

    Value *X, *Sign;

    Value *Src = II->getArgOperand(0);

    if (match(Src, m_FNeg(m_Value(X))) || match(Src, m_FAbs(m_Value(X))) ||

        match(Src, m_CopySign(m_Value(X), m_Value(Sign)))) {

      // cos(-x) --> cos(x)

      // cos(fabs(x)) --> cos(x)

      // cos(copysign(x, y)) --> cos(x)

      return replaceOperand(*II, 0, X);

    }

    break;

  }

  case Intrinsic::sin:

  case Intrinsic::amdgcn_sin: {

    Value *X;

    if (match(II->getArgOperand(0), m_OneUse(m_FNeg(m_Value(X))))) {

      // sin(-x) --> -sin(x)

      Value *NewSin = Builder.CreateUnaryIntrinsic(IID, X, II);

      return UnaryOperator::CreateFNegFMF(NewSin, II);

    }

    break;

  }

  case Intrinsic::ldexp: {

    // ldexp(ldexp(x, a), b) -> ldexp(x, a + b)

    //

    // The danger is if the first ldexp would overflow to infinity or underflow

    // to zero, but the combined exponent avoids it. We ignore this with

    // reassoc.

    //

    // It's also safe to fold if we know both exponents are >= 0 or <= 0 since

    // it would just double down on the overflow/underflow which would occur

    // anyway.

    //

    // TODO: Could do better if we had range tracking for the input value

    // exponent. Also could broaden sign check to cover == 0 case.

    Value *Src = II->getArgOperand(0);

    Value *Exp = II->getArgOperand(1);

    Value *InnerSrc;

    Value *InnerExp;

    if (match(Src, m_OneUse(m_Intrinsic<Intrinsic::ldexp>(

                       m_Value(InnerSrc), m_Value(InnerExp)))) &&

        Exp->getType() == InnerExp->getType()) {

      FastMathFlags FMF = II->getFastMathFlags();

      FastMathFlags InnerFlags = cast<FPMathOperator>(Src)->getFastMathFlags();


      if ((FMF.allowReassoc() && InnerFlags.allowReassoc()) ||

          signBitMustBeTheSame(Exp, InnerExp, SQ.getWithInstruction(II))) {

        // TODO: Adding nsw/nuw is probably safe if the integer type exceeds the

        // exponent width.

        Value *NewExp = Builder.CreateAdd(InnerExp, Exp);

        II->setArgOperand(1, NewExp);

        II->setFastMathFlags(InnerFlags); // Or the inner flags.

        return replaceOperand(*II, 0, InnerSrc);

      }

    }


    // ldexp(x, zext(i1 y)) -> fmul x, (select y, 2.0, 1.0)

    // ldexp(x, sext(i1 y)) -> fmul x, (select y, 0.5, 1.0)

    Value *ExtSrc;

    if (match(Exp, m_ZExt(m_Value(ExtSrc))) &&

        ExtSrc->getType()->getScalarSizeInBits() == 1) {

      Value *Select =

          Builder.CreateSelect(ExtSrc, ConstantFP::get(II->getType(), 2.0),

                               ConstantFP::get(II->getType(), 1.0));

      return BinaryOperator::CreateFMulFMF(Src, Select, II);

    }

    if (match(Exp, m_SExt(m_Value(ExtSrc))) &&

        ExtSrc->getType()->getScalarSizeInBits() == 1) {

      Value *Select =

          Builder.CreateSelect(ExtSrc, ConstantFP::get(II->getType(), 0.5),

                               ConstantFP::get(II->getType(), 1.0));

      return BinaryOperator::CreateFMulFMF(Src, Select, II);

    }


    // ldexp(x, c ? exp : 0) -> c ? ldexp(x, exp) : x

    // ldexp(x, c ? 0 : exp) -> c ? x : ldexp(x, exp)

    //

    // TODO: If we cared, should insert a canonicalize for x

    Value *SelectCond, *SelectLHS, *SelectRHS;

    if (match(II->getArgOperand(1),

              m_OneUse(m_Select(m_Value(SelectCond), m_Value(SelectLHS),

                                m_Value(SelectRHS))))) {

      Value *NewLdexp = nullptr;

      Value *Select = nullptr;

      if (match(SelectRHS, m_ZeroInt())) {

        NewLdexp = Builder.CreateLdexp(Src, SelectLHS, II);

        Select = Builder.CreateSelect(SelectCond, NewLdexp, Src);

      } else if (match(SelectLHS, m_ZeroInt())) {

        NewLdexp = Builder.CreateLdexp(Src, SelectRHS, II);

        Select = Builder.CreateSelect(SelectCond, Src, NewLdexp);

      }


      if (NewLdexp) {

        Select->takeName(II);

        return replaceInstUsesWith(*II, Select);

      }

    }


    break;

  }

  case Intrinsic::ptrauth_auth:

  case Intrinsic::ptrauth_resign: {

    // (sign|resign) + (auth|resign) can be folded by omitting the middle

    // sign+auth component if the key and discriminator match.

    bool NeedSign = II->getIntrinsicID() == Intrinsic::ptrauth_resign;

    Value *Ptr = II->getArgOperand(0);

    Value *Key = II->getArgOperand(1);

    Value *Disc = II->getArgOperand(2);


    // AuthKey will be the key we need to end up authenticating against in

    // whatever we replace this sequence with.

    Value *AuthKey = nullptr, *AuthDisc = nullptr, *BasePtr;

    if (const auto *CI = dyn_cast<CallBase>(Ptr)) {

      BasePtr = CI->getArgOperand(0);

      if (CI->getIntrinsicID() == Intrinsic::ptrauth_sign) {

        if (CI->getArgOperand(1) != Key || CI->getArgOperand(2) != Disc)

          break;

      } else if (CI->getIntrinsicID() == Intrinsic::ptrauth_resign) {

        if (CI->getArgOperand(3) != Key || CI->getArgOperand(4) != Disc)

          break;

        AuthKey = CI->getArgOperand(1);

        AuthDisc = CI->getArgOperand(2);

      } else

        break;

    } else if (const auto *PtrToInt = dyn_cast<PtrToIntOperator>(Ptr)) {

      // ptrauth constants are equivalent to a call to @llvm.ptrauth.sign for

      // our purposes, so check for that too.

      const auto *CPA = dyn_cast<ConstantPtrAuth>(PtrToInt->getOperand(0));

      if (!CPA || !CPA->isKnownCompatibleWith(Key, Disc, DL))

        break;


      // resign(ptrauth(p,ks,ds),ks,ds,kr,dr) -> ptrauth(p,kr,dr)

      if (NeedSign && isa<ConstantInt>(II->getArgOperand(4))) {

        auto *SignKey = cast<ConstantInt>(II->getArgOperand(3));

        auto *SignDisc = cast<ConstantInt>(II->getArgOperand(4));

        auto *SignAddrDisc = ConstantPointerNull::get(Builder.getPtrTy());

        auto *NewCPA = ConstantPtrAuth::get(CPA->getPointer(), SignKey,

                                            SignDisc, SignAddrDisc);

        replaceInstUsesWith(

            *II, ConstantExpr::getPointerCast(NewCPA, II->getType()));

        return eraseInstFromFunction(*II);

      }


      // auth(ptrauth(p,k,d),k,d) -> p

      BasePtr = Builder.CreatePtrToInt(CPA->getPointer(), II->getType());

    } else

      break;


    unsigned NewIntrin;

    if (AuthKey && NeedSign) {

      // resign(0,1) + resign(1,2) = resign(0, 2)

      NewIntrin = Intrinsic::ptrauth_resign;

    } else if (AuthKey) {

      // resign(0,1) + auth(1) = auth(0)

      NewIntrin = Intrinsic::ptrauth_auth;

    } else if (NeedSign) {

      // sign(0) + resign(0, 1) = sign(1)

      NewIntrin = Intrinsic::ptrauth_sign;

    } else {

      // sign(0) + auth(0) = nop

      replaceInstUsesWith(*II, BasePtr);

      return eraseInstFromFunction(*II);

    }


    SmallVector<Value *, 4> CallArgs;

    CallArgs.push_back(BasePtr);

    if (AuthKey) {

      CallArgs.push_back(AuthKey);

      CallArgs.push_back(AuthDisc);

    }


    if (NeedSign) {

      CallArgs.push_back(II->getArgOperand(3));

      CallArgs.push_back(II->getArgOperand(4));

    }


    Function *NewFn =

        Intrinsic::getOrInsertDeclaration(II->getModule(), NewIntrin);

    return CallInst::Create(NewFn, CallArgs);

  }

  case Intrinsic::arm_neon_vtbl1:

  case Intrinsic::aarch64_neon_tbl1:

    if (Value *V = simplifyNeonTbl1(*II, Builder))

      return replaceInstUsesWith(*II, V);

    break;


  case Intrinsic::arm_neon_vmulls:

  case Intrinsic::arm_neon_vmullu:

  case Intrinsic::aarch64_neon_smull:

  case Intrinsic::aarch64_neon_umull: {

    Value *Arg0 = II->getArgOperand(0);

    Value *Arg1 = II->getArgOperand(1);


    // Handle mul by zero first:

    if (isa<ConstantAggregateZero>(Arg0) || isa<ConstantAggregateZero>(Arg1)) {

      return replaceInstUsesWith(CI, ConstantAggregateZero::get(II->getType()));

    }


    // Check for constant LHS & RHS - in this case we just simplify.

    bool Zext = (IID == Intrinsic::arm_neon_vmullu ||

                 IID == Intrinsic::aarch64_neon_umull);

    VectorType *NewVT = cast<VectorType>(II->getType());

    if (Constant *CV0 = dyn_cast<Constant>(Arg0)) {

      if (Constant *CV1 = dyn_cast<Constant>(Arg1)) {

        Value *V0 = Builder.CreateIntCast(CV0, NewVT, /*isSigned=*/!Zext);

        Value *V1 = Builder.CreateIntCast(CV1, NewVT, /*isSigned=*/!Zext);

        return replaceInstUsesWith(CI, Builder.CreateMul(V0, V1));

      }


      // Couldn't simplify - canonicalize constant to the RHS.

      std::swap(Arg0, Arg1);

    }


    // Handle mul by one:

    if (Constant *CV1 = dyn_cast<Constant>(Arg1))

      if (ConstantInt *Splat =

              dyn_cast_or_null<ConstantInt>(CV1->getSplatValue()))

        if (Splat->isOne())

          return CastInst::CreateIntegerCast(Arg0, II->getType(),

                                             /*isSigned=*/!Zext);


    break;

  }

  case Intrinsic::arm_neon_aesd:

  case Intrinsic::arm_neon_aese:

  case Intrinsic::aarch64_crypto_aesd:

  case Intrinsic::aarch64_crypto_aese:

  case Intrinsic::aarch64_sve_aesd:

  case Intrinsic::aarch64_sve_aese: {

    Value *DataArg = II->getArgOperand(0);

    Value *KeyArg  = II->getArgOperand(1);


    // Accept zero on either operand.

    if (!match(KeyArg, m_ZeroInt()))

      std::swap(KeyArg, DataArg);


    // Try to use the builtin XOR in AESE and AESD to eliminate a prior XOR

    Value *Data, *Key;

    if (match(KeyArg, m_ZeroInt()) &&

        match(DataArg, m_Xor(m_Value(Data), m_Value(Key)))) {

      replaceOperand(*II, 0, Data);

      replaceOperand(*II, 1, Key);

      return II;

    }

    break;

  }

  case Intrinsic::hexagon_V6_vandvrt:

  case Intrinsic::hexagon_V6_vandvrt_128B: {

    // Simplify Q -> V -> Q conversion.

    if (auto Op0 = dyn_cast<IntrinsicInst>(II->getArgOperand(0))) {

      Intrinsic::ID ID0 = Op0->getIntrinsicID();

      if (ID0 != Intrinsic::hexagon_V6_vandqrt &&

          ID0 != Intrinsic::hexagon_V6_vandqrt_128B)

        break;

      Value *Bytes = Op0->getArgOperand(1), *Mask = II->getArgOperand(1);

      uint64_t Bytes1 = computeKnownBits(Bytes, Op0).One.getZExtValue();

      uint64_t Mask1 = computeKnownBits(Mask, II).One.getZExtValue();

      // Check if every byte has common bits in Bytes and Mask.

      uint64_t C = Bytes1 & Mask1;

      if ((C & 0xFF) && (C & 0xFF00) && (C & 0xFF0000) && (C & 0xFF000000))

        return replaceInstUsesWith(*II, Op0->getArgOperand(0));

    }

    break;

  }

  case Intrinsic::stackrestore: {

    enum class ClassifyResult {

      None,

      Alloca,

      StackRestore,

      CallWithSideEffects,

    };

    auto Classify = [](const Instruction *I) {

      if (isa<AllocaInst>(I))

        return ClassifyResult::Alloca;


      if (auto *CI = dyn_cast<CallInst>(I)) {

        if (auto *II = dyn_cast<IntrinsicInst>(CI)) {

          if (II->getIntrinsicID() == Intrinsic::stackrestore)

            return ClassifyResult::StackRestore;


          if (II->mayHaveSideEffects())

            return ClassifyResult::CallWithSideEffects;

        } else {

          // Consider all non-intrinsic calls to be side effects

          return ClassifyResult::CallWithSideEffects;

        }

      }


      return ClassifyResult::None;

    };


    // If the stacksave and the stackrestore are in the same BB, and there is

    // no intervening call, alloca, or stackrestore of a different stacksave,

    // remove the restore. This can happen when variable allocas are DCE'd.

    if (IntrinsicInst *SS = dyn_cast<IntrinsicInst>(II->getArgOperand(0))) {

      if (SS->getIntrinsicID() == Intrinsic::stacksave &&

          SS->getParent() == II->getParent()) {

        BasicBlock::iterator BI(SS);

        bool CannotRemove = false;

        for (++BI; &*BI != II; ++BI) {

          switch (Classify(&*BI)) {

          case ClassifyResult::None:

            // So far so good, look at next instructions.

            break;


          case ClassifyResult::StackRestore:

            // If we found an intervening stackrestore for a different

            // stacksave, we can't remove the stackrestore. Otherwise, continue.

            if (cast<IntrinsicInst>(*BI).getArgOperand(0) != SS)

              CannotRemove = true;

            break;


          case ClassifyResult::Alloca:

          case ClassifyResult::CallWithSideEffects:

            // If we found an alloca, a non-intrinsic call, or an intrinsic

            // call with side effects, we can't remove the stackrestore.

            CannotRemove = true;

            break;

          }

          if (CannotRemove)

            break;

        }


        if (!CannotRemove)

          return eraseInstFromFunction(CI);

      }

    }


    // Scan down this block to see if there is another stack restore in the

    // same block without an intervening call/alloca.

    BasicBlock::iterator BI(II);

    Instruction *TI = II->getParent()->getTerminator();

    bool CannotRemove = false;

    for (++BI; &*BI != TI; ++BI) {

      switch (Classify(&*BI)) {

      case ClassifyResult::None:

        // So far so good, look at next instructions.

        break;


      case ClassifyResult::StackRestore:

        // If there is a stackrestore below this one, remove this one.

        return eraseInstFromFunction(CI);


      case ClassifyResult::Alloca:

      case ClassifyResult::CallWithSideEffects:

        // If we found an alloca, a non-intrinsic call, or an intrinsic call

        // with side effects (such as llvm.stacksave and llvm.read_register),

        // we can't remove the stack restore.

        CannotRemove = true;

        break;

      }

      if (CannotRemove)

        break;

    }


    // If the stack restore is in a return, resume, or unwind block and if there

    // are no allocas or calls between the restore and the return, nuke the

    // restore.

    if (!CannotRemove && (isa<ReturnInst>(TI) || isa<ResumeInst>(TI)))

      return eraseInstFromFunction(CI);

    break;

  }

  case Intrinsic::lifetime_end:

    // Asan needs to poison memory to detect invalid access which is possible

    // even for empty lifetime range.

    if (II->getFunction()->hasFnAttribute(Attribute::SanitizeAddress) ||

        II->getFunction()->hasFnAttribute(Attribute::SanitizeMemory) ||

        II->getFunction()->hasFnAttribute(Attribute::SanitizeHWAddress))

      break;


    if (removeTriviallyEmptyRange(*II, *this, [](const IntrinsicInst &I) {

          return I.getIntrinsicID() == Intrinsic::lifetime_start;

        }))

      return nullptr;

    break;

  case Intrinsic::assume: {

    Value *IIOperand = II->getArgOperand(0);

    SmallVector<OperandBundleDef, 4> OpBundles;

    II->getOperandBundlesAsDefs(OpBundles);


    /// This will remove the boolean Condition from the assume given as

    /// argument and remove the assume if it becomes useless.

    /// always returns nullptr for use as a return values.

    auto RemoveConditionFromAssume = [&](Instruction *Assume) -> Instruction * {

      assert(isa<AssumeInst>(Assume));

      if (isAssumeWithEmptyBundle(*cast<AssumeInst>(II)))

        return eraseInstFromFunction(CI);

      replaceUse(II->getOperandUse(0), ConstantInt::getTrue(II->getContext()));

      return nullptr;

    };

    // Remove an assume if it is followed by an identical assume.

    // TODO: Do we need this? Unless there are conflicting assumptions, the

    // computeKnownBits(IIOperand) below here eliminates redundant assumes.

    Instruction *Next = II->getNextNode();

    if (match(Next, m_Intrinsic<Intrinsic::assume>(m_Specific(IIOperand))))

      return RemoveConditionFromAssume(Next);


    // Canonicalize assume(a && b) -> assume(a); assume(b);

    // Note: New assumption intrinsics created here are registered by

    // the InstCombineIRInserter object.

    FunctionType *AssumeIntrinsicTy = II->getFunctionType();

    Value *AssumeIntrinsic = II->getCalledOperand();

    Value *A, *B;

    if (match(IIOperand, m_LogicalAnd(m_Value(A), m_Value(B)))) {

      Builder.CreateCall(AssumeIntrinsicTy, AssumeIntrinsic, A, OpBundles,

                         II->getName());

      Builder.CreateCall(AssumeIntrinsicTy, AssumeIntrinsic, B, II->getName());

      return eraseInstFromFunction(*II);

    }

    // assume(!(a || b)) -> assume(!a); assume(!b);

    if (match(IIOperand, m_Not(m_LogicalOr(m_Value(A), m_Value(B))))) {

      Builder.CreateCall(AssumeIntrinsicTy, AssumeIntrinsic,

                         Builder.CreateNot(A), OpBundles, II->getName());

      Builder.CreateCall(AssumeIntrinsicTy, AssumeIntrinsic,

                         Builder.CreateNot(B), II->getName());

      return eraseInstFromFunction(*II);

    }


    // assume( (load addr) != null ) -> add 'nonnull' metadata to load

    // (if assume is valid at the load)

    Instruction *LHS;

    if (match(IIOperand, m_SpecificICmp(ICmpInst::ICMP_NE, m_Instruction(LHS),

                                        m_Zero())) &&

        LHS->getOpcode() == Instruction::Load &&

        LHS->getType()->isPointerTy() &&

        isValidAssumeForContext(II, LHS, &DT)) {

      MDNode *MD = MDNode::get(II->getContext(), {});

      LHS->setMetadata(LLVMContext::MD_nonnull, MD);

      LHS->setMetadata(LLVMContext::MD_noundef, MD);

      return RemoveConditionFromAssume(II);


      // TODO: apply nonnull return attributes to calls and invokes

      // TODO: apply range metadata for range check patterns?

    }


    for (unsigned Idx = 0; Idx < II->getNumOperandBundles(); Idx++) {

      OperandBundleUse OBU = II->getOperandBundleAt(Idx);


      // Separate storage assumptions apply to the underlying allocations, not

      // any particular pointer within them. When evaluating the hints for AA

      // purposes we getUnderlyingObject them; by precomputing the answers here

      // we can avoid having to do so repeatedly there.

      if (OBU.getTagName() == "separate_storage") {

        assert(OBU.Inputs.size() == 2);

        auto MaybeSimplifyHint = [&](const Use &U) {

          Value *Hint = U.get();

          // Not having a limit is safe because InstCombine removes unreachable

          // code.

          Value *UnderlyingObject = getUnderlyingObject(Hint, /*MaxLookup*/ 0);

          if (Hint != UnderlyingObject)

            replaceUse(const_cast<Use &>(U), UnderlyingObject);

        };

        MaybeSimplifyHint(OBU.Inputs[0]);

        MaybeSimplifyHint(OBU.Inputs[1]);

      }


      // Try to remove redundant alignment assumptions.

      if (OBU.getTagName() == "align" && OBU.Inputs.size() == 2) {

        RetainedKnowledge RK = getKnowledgeFromOperandInAssume(

            *cast<AssumeInst>(II), II->arg_size() + Idx);

        if (!RK || RK.AttrKind != Attribute::Alignment ||

            !isPowerOf2_64(RK.ArgValue) || !isa<ConstantInt>(RK.IRArgValue))

          continue;


        // Remove align 1 bundles; they don't add any useful information.

        if (RK.ArgValue == 1)

          return CallBase::removeOperandBundle(II, OBU.getTagID());


        // Don't try to remove align assumptions for pointers derived from

        // arguments. We might lose information if the function gets inline and

        // the align argument attribute disappears.

        Value *UO = getUnderlyingObject(RK.WasOn);

        if (!UO || isa<Argument>(UO))

          continue;


        // Compute known bits for the pointer, passing nullptr as context to

        // avoid computeKnownBits using the assumption we are about to remove

        // for reasoning.

        KnownBits Known = computeKnownBits(RK.WasOn, /*CtxI=*/nullptr);

        unsigned TZ = std::min(Known.countMinTrailingZeros(),

                               Value::MaxAlignmentExponent);

        if ((1ULL << TZ) < RK.ArgValue)

          continue;

        return CallBase::removeOperandBundle(II, OBU.getTagID());

      }

    }


    // Convert nonnull assume like:

    // %A = icmp ne i32* %PTR, null

    // call void @llvm.assume(i1 %A)

    // into

    // call void @llvm.assume(i1 true) [ "nonnull"(i32* %PTR) ]

    if (EnableKnowledgeRetention &&

        match(IIOperand,

              m_SpecificICmp(ICmpInst::ICMP_NE, m_Value(A), m_Zero())) &&

        A->getType()->isPointerTy()) {

      if (auto *Replacement = buildAssumeFromKnowledge(

              {RetainedKnowledge{Attribute::NonNull, 0, A}}, Next, &AC, &DT)) {


        Replacement->insertBefore(Next->getIterator());

        AC.registerAssumption(Replacement);

        return RemoveConditionFromAssume(II);

      }

    }


    // Convert alignment assume like:

    // %B = ptrtoint i32* %A to i64

    // %C = and i64 %B, Constant

    // %D = icmp eq i64 %C, 0

    // call void @llvm.assume(i1 %D)

    // into

    // call void @llvm.assume(i1 true) [ "align"(i32* [[A]], i64  Constant + 1)]

    uint64_t AlignMask = 1;

    if (EnableKnowledgeRetention &&

        (match(IIOperand, m_Not(m_Trunc(m_Value(A)))) ||

         match(IIOperand,

               m_SpecificICmp(ICmpInst::ICMP_EQ,

                              m_And(m_Value(A), m_ConstantInt(AlignMask)),

                              m_Zero())))) {

      if (isPowerOf2_64(AlignMask + 1)) {

        uint64_t Offset = 0;

        match(A, m_Add(m_Value(A), m_ConstantInt(Offset)));

        if (match(A, m_PtrToIntOrAddr(m_Value(A)))) {

          /// Note: this doesn't preserve the offset information but merges

          /// offset and alignment.

          /// TODO: we can generate a GEP instead of merging the alignment with

          /// the offset.

          RetainedKnowledge RK{Attribute::Alignment,

                               (unsigned)MinAlign(Offset, AlignMask + 1), A};

          if (auto *Replacement =

                  buildAssumeFromKnowledge(RK, Next, &AC, &DT)) {


            Replacement->insertAfter(II->getIterator());

            AC.registerAssumption(Replacement);

          }

          return RemoveConditionFromAssume(II);

        }

      }

    }


    /// Canonicalize Knowledge in operand bundles.

    if (EnableKnowledgeRetention && II->hasOperandBundles()) {

      for (unsigned Idx = 0; Idx < II->getNumOperandBundles(); Idx++) {

        auto &BOI = II->bundle_op_info_begin()[Idx];

        RetainedKnowledge RK =

          llvm::getKnowledgeFromBundle(cast<AssumeInst>(*II), BOI);

        if (BOI.End - BOI.Begin > 2)

          continue; // Prevent reducing knowledge in an align with offset since

                    // extracting a RetainedKnowledge from them looses offset

                    // information

        RetainedKnowledge CanonRK =

          llvm::simplifyRetainedKnowledge(cast<AssumeInst>(II), RK,

                                          &getAssumptionCache(),

                                          &getDominatorTree());

        if (CanonRK == RK)

          continue;

        if (!CanonRK) {

          if (BOI.End - BOI.Begin > 0) {

            Worklist.pushValue(II->op_begin()[BOI.Begin]);

            Value::dropDroppableUse(II->op_begin()[BOI.Begin]);

          }

          continue;

        }

        assert(RK.AttrKind == CanonRK.AttrKind);

        if (BOI.End - BOI.Begin > 0)

          II->op_begin()[BOI.Begin].set(CanonRK.WasOn);

        if (BOI.End - BOI.Begin > 1)

          II->op_begin()[BOI.Begin + 1].set(ConstantInt::get(

              Type::getInt64Ty(II->getContext()), CanonRK.ArgValue));

        if (RK.WasOn)

          Worklist.pushValue(RK.WasOn);

        return II;

      }

    }


    // If there is a dominating assume with the same condition as this one,

    // then this one is redundant, and should be removed.

    KnownBits Known(1);

    computeKnownBits(IIOperand, Known, II);

    if (Known.isAllOnes() && isAssumeWithEmptyBundle(cast<AssumeInst>(*II)))

      return eraseInstFromFunction(*II);


    // assume(false) is unreachable.

    if (match(IIOperand, m_CombineOr(m_Zero(), m_Undef()))) {

      CreateNonTerminatorUnreachable(II);

      return eraseInstFromFunction(*II);

    }


    // Update the cache of affected values for this assumption (we might be

    // here because we just simplified the condition).

    AC.updateAffectedValues(cast<AssumeInst>(II));

    break;

  }

  case Intrinsic::experimental_guard: {

    // Is this guard followed by another guard?  We scan forward over a small

    // fixed window of instructions to handle common cases with conditions

    // computed between guards.

    Instruction *NextInst = II->getNextNode();

    for (unsigned i = 0; i < GuardWideningWindow; i++) {

      // Note: Using context-free form to avoid compile time blow up

      if (!isSafeToSpeculativelyExecute(NextInst))

        break;

      NextInst = NextInst->getNextNode();

    }

    Value *NextCond = nullptr;

    if (match(NextInst,

              m_Intrinsic<Intrinsic::experimental_guard>(m_Value(NextCond)))) {

      Value *CurrCond = II->getArgOperand(0);


      // Remove a guard that it is immediately preceded by an identical guard.

      // Otherwise canonicalize guard(a); guard(b) -> guard(a & b).

      if (CurrCond != NextCond) {

        Instruction *MoveI = II->getNextNode();

        while (MoveI != NextInst) {

          auto *Temp = MoveI;

          MoveI = MoveI->getNextNode();

          Temp->moveBefore(II->getIterator());

        }

        replaceOperand(*II, 0, Builder.CreateAnd(CurrCond, NextCond));

      }

      eraseInstFromFunction(*NextInst);

      return II;

    }

    break;

  }

  case Intrinsic::vector_insert: {

    Value *Vec = II->getArgOperand(0);

    Value *SubVec = II->getArgOperand(1);

    Value *Idx = II->getArgOperand(2);

    auto *DstTy = dyn_cast<FixedVectorType>(II->getType());

    auto *VecTy = dyn_cast<FixedVectorType>(Vec->getType());

    auto *SubVecTy = dyn_cast<FixedVectorType>(SubVec->getType());


    // Only canonicalize if the destination vector, Vec, and SubVec are all

    // fixed vectors.

    if (DstTy && VecTy && SubVecTy) {

      unsigned DstNumElts = DstTy->getNumElements();

      unsigned VecNumElts = VecTy->getNumElements();

      unsigned SubVecNumElts = SubVecTy->getNumElements();

      unsigned IdxN = cast<ConstantInt>(Idx)->getZExtValue();


      // An insert that entirely overwrites Vec with SubVec is a nop.

      if (VecNumElts == SubVecNumElts)

        return replaceInstUsesWith(CI, SubVec);


      // Widen SubVec into a vector of the same width as Vec, since

      // shufflevector requires the two input vectors to be the same width.

      // Elements beyond the bounds of SubVec within the widened vector are

      // undefined.

      SmallVector<int, 8> WidenMask;

      unsigned i;

      for (i = 0; i != SubVecNumElts; ++i)

        WidenMask.push_back(i);

      for (; i != VecNumElts; ++i)

        WidenMask.push_back(PoisonMaskElem);


      Value *WidenShuffle = Builder.CreateShuffleVector(SubVec, WidenMask);


      SmallVector<int, 8> Mask;

      for (unsigned i = 0; i != IdxN; ++i)

        Mask.push_back(i);

      for (unsigned i = DstNumElts; i != DstNumElts + SubVecNumElts; ++i)

        Mask.push_back(i);

      for (unsigned i = IdxN + SubVecNumElts; i != DstNumElts; ++i)

        Mask.push_back(i);


      Value *Shuffle = Builder.CreateShuffleVector(Vec, WidenShuffle, Mask);

      return replaceInstUsesWith(CI, Shuffle);

    }

    break;

  }

  case Intrinsic::vector_extract: {

    Value *Vec = II->getArgOperand(0);

    Value *Idx = II->getArgOperand(1);


    Type *ReturnType = II->getType();

    // (extract_vector (insert_vector InsertTuple, InsertValue, InsertIdx),

    // ExtractIdx)

    unsigned ExtractIdx = cast<ConstantInt>(Idx)->getZExtValue();

    Value *InsertTuple, *InsertIdx, *InsertValue;

    if (match(Vec, m_Intrinsic<Intrinsic::vector_insert>(m_Value(InsertTuple),

                                                         m_Value(InsertValue),

                                                         m_Value(InsertIdx))) &&

        InsertValue->getType() == ReturnType) {

      unsigned Index = cast<ConstantInt>(InsertIdx)->getZExtValue();

      // Case where we get the same index right after setting it.

      // extract.vector(insert.vector(InsertTuple, InsertValue, Idx), Idx) -->

      // InsertValue

      if (ExtractIdx == Index)

        return replaceInstUsesWith(CI, InsertValue);

      // If we are getting a different index than what was set in the

      // insert.vector intrinsic. We can just set the input tuple to the one up

      // in the chain. extract.vector(insert.vector(InsertTuple, InsertValue,

      // InsertIndex), ExtractIndex)

      // --> extract.vector(InsertTuple, ExtractIndex)

      else

        return replaceOperand(CI, 0, InsertTuple);

    }


    auto *DstTy = dyn_cast<VectorType>(ReturnType);

    auto *VecTy = dyn_cast<VectorType>(Vec->getType());


    if (DstTy && VecTy) {

      auto DstEltCnt = DstTy->getElementCount();

      auto VecEltCnt = VecTy->getElementCount();

      unsigned IdxN = cast<ConstantInt>(Idx)->getZExtValue();


      // Extracting the entirety of Vec is a nop.

      if (DstEltCnt == VecTy->getElementCount()) {

        replaceInstUsesWith(CI, Vec);

        return eraseInstFromFunction(CI);

      }


      // Only canonicalize to shufflevector if the destination vector and

      // Vec are fixed vectors.

      if (VecEltCnt.isScalable() || DstEltCnt.isScalable())

        break;


      SmallVector<int, 8> Mask;

      for (unsigned i = 0; i != DstEltCnt.getKnownMinValue(); ++i)

        Mask.push_back(IdxN + i);


      Value *Shuffle = Builder.CreateShuffleVector(Vec, Mask);

      return replaceInstUsesWith(CI, Shuffle);

    }

    break;

  }

  case Intrinsic::experimental_vp_reverse: {

    Value *X;

    Value *Vec = II->getArgOperand(0);

    Value *Mask = II->getArgOperand(1);

    if (!match(Mask, m_AllOnes()))

      break;

    Value *EVL = II->getArgOperand(2);

    // TODO: Canonicalize experimental.vp.reverse after unop/binops?

    // rev(unop rev(X)) --> unop X

    if (match(Vec,

              m_OneUse(m_UnOp(m_Intrinsic<Intrinsic::experimental_vp_reverse>(

                  m_Value(X), m_AllOnes(), m_Specific(EVL)))))) {

      auto *OldUnOp = cast<UnaryOperator>(Vec);

      auto *NewUnOp = UnaryOperator::CreateWithCopiedFlags(

          OldUnOp->getOpcode(), X, OldUnOp, OldUnOp->getName(),

          II->getIterator());

      return replaceInstUsesWith(CI, NewUnOp);

    }

    break;

  }

  case Intrinsic::vector_reduce_or:

  case Intrinsic::vector_reduce_and: {

    // Canonicalize logical or/and reductions:

    // Or reduction for i1 is represented as:

    // %val = bitcast <ReduxWidth x i1> to iReduxWidth

    // %res = cmp ne iReduxWidth %val, 0

    // And reduction for i1 is represented as:

    // %val = bitcast <ReduxWidth x i1> to iReduxWidth

    // %res = cmp eq iReduxWidth %val, 11111

    Value *Arg = II->getArgOperand(0);

    Value *Vect;


    if (Value *NewOp =

            simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

      replaceUse(II->getOperandUse(0), NewOp);

      return II;

    }


    if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

      if (auto *FTy = dyn_cast<FixedVectorType>(Vect->getType()))

        if (FTy->getElementType() == Builder.getInt1Ty()) {

          Value *Res = Builder.CreateBitCast(

              Vect, Builder.getIntNTy(FTy->getNumElements()));

          if (IID == Intrinsic::vector_reduce_and) {

            Res = Builder.CreateICmpEQ(

                Res, ConstantInt::getAllOnesValue(Res->getType()));

          } else {

            assert(IID == Intrinsic::vector_reduce_or &&

                   "Expected or reduction.");

            Res = Builder.CreateIsNotNull(Res);

          }

          if (Arg != Vect)

            Res = Builder.CreateCast(cast<CastInst>(Arg)->getOpcode(), Res,

                                     II->getType());

          return replaceInstUsesWith(CI, Res);

        }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_add: {

    if (IID == Intrinsic::vector_reduce_add) {

      // Convert vector_reduce_add(ZExt(<n x i1>)) to

      // ZExtOrTrunc(ctpop(bitcast <n x i1> to in)).

      // Convert vector_reduce_add(SExt(<n x i1>)) to

      // -ZExtOrTrunc(ctpop(bitcast <n x i1> to in)).

      // Convert vector_reduce_add(<n x i1>) to

      // Trunc(ctpop(bitcast <n x i1> to in)).

      Value *Arg = II->getArgOperand(0);

      Value *Vect;


      if (Value *NewOp =

              simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

        replaceUse(II->getOperandUse(0), NewOp);

        return II;

      }


      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *FTy = dyn_cast<FixedVectorType>(Vect->getType()))

          if (FTy->getElementType() == Builder.getInt1Ty()) {

            Value *V = Builder.CreateBitCast(

                Vect, Builder.getIntNTy(FTy->getNumElements()));

            Value *Res = Builder.CreateUnaryIntrinsic(Intrinsic::ctpop, V);

            if (Res->getType() != II->getType())

              Res = Builder.CreateZExtOrTrunc(Res, II->getType());

            if (Arg != Vect &&

                cast<Instruction>(Arg)->getOpcode() == Instruction::SExt)

              Res = Builder.CreateNeg(Res);

            return replaceInstUsesWith(CI, Res);

          }

      }


      // vector.reduce.add.vNiM(splat(%x)) -> mul(%x, N)

      if (Value *Splat = getSplatValue(Arg)) {

        ElementCount VecToReduceCount =

            cast<VectorType>(Arg->getType())->getElementCount();

        if (VecToReduceCount.isFixed()) {

          unsigned VectorSize = VecToReduceCount.getFixedValue();

          return BinaryOperator::CreateMul(

              Splat, ConstantInt::get(Splat->getType(), VectorSize));

        }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_xor: {

    if (IID == Intrinsic::vector_reduce_xor) {

      // Exclusive disjunction reduction over the vector with

      // (potentially-extended) i1 element type is actually a

      // (potentially-extended) arithmetic `add` reduction over the original

      // non-extended value:

      //   vector_reduce_xor(?ext(<n x i1>))

      //     -->

      //   ?ext(vector_reduce_add(<n x i1>))

      Value *Arg = II->getArgOperand(0);

      Value *Vect;


      if (Value *NewOp =

              simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

        replaceUse(II->getOperandUse(0), NewOp);

        return II;

      }


      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *VTy = dyn_cast<VectorType>(Vect->getType()))

          if (VTy->getElementType() == Builder.getInt1Ty()) {

            Value *Res = Builder.CreateAddReduce(Vect);

            if (Arg != Vect)

              Res = Builder.CreateCast(cast<CastInst>(Arg)->getOpcode(), Res,

                                       II->getType());

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_mul: {

    if (IID == Intrinsic::vector_reduce_mul) {

      // Multiplicative reduction over the vector with (potentially-extended)

      // i1 element type is actually a (potentially zero-extended)

      // logical `and` reduction over the original non-extended value:

      //   vector_reduce_mul(?ext(<n x i1>))

      //     -->

      //   zext(vector_reduce_and(<n x i1>))

      Value *Arg = II->getArgOperand(0);

      Value *Vect;


      if (Value *NewOp =

              simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

        replaceUse(II->getOperandUse(0), NewOp);

        return II;

      }


      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *VTy = dyn_cast<VectorType>(Vect->getType()))

          if (VTy->getElementType() == Builder.getInt1Ty()) {

            Value *Res = Builder.CreateAndReduce(Vect);

            if (Res->getType() != II->getType())

              Res = Builder.CreateZExt(Res, II->getType());

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_umin:

  case Intrinsic::vector_reduce_umax: {

    if (IID == Intrinsic::vector_reduce_umin ||

        IID == Intrinsic::vector_reduce_umax) {

      // UMin/UMax reduction over the vector with (potentially-extended)

      // i1 element type is actually a (potentially-extended)

      // logical `and`/`or` reduction over the original non-extended value:

      //   vector_reduce_u{min,max}(?ext(<n x i1>))

      //     -->

      //   ?ext(vector_reduce_{and,or}(<n x i1>))

      Value *Arg = II->getArgOperand(0);

      Value *Vect;


      if (Value *NewOp =

              simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

        replaceUse(II->getOperandUse(0), NewOp);

        return II;

      }


      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *VTy = dyn_cast<VectorType>(Vect->getType()))

          if (VTy->getElementType() == Builder.getInt1Ty()) {

            Value *Res = IID == Intrinsic::vector_reduce_umin

                             ? Builder.CreateAndReduce(Vect)

                             : Builder.CreateOrReduce(Vect);

            if (Arg != Vect)

              Res = Builder.CreateCast(cast<CastInst>(Arg)->getOpcode(), Res,

                                       II->getType());

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_smin:

  case Intrinsic::vector_reduce_smax: {

    if (IID == Intrinsic::vector_reduce_smin ||

        IID == Intrinsic::vector_reduce_smax) {

      // SMin/SMax reduction over the vector with (potentially-extended)

      // i1 element type is actually a (potentially-extended)

      // logical `and`/`or` reduction over the original non-extended value:

      //   vector_reduce_s{min,max}(<n x i1>)

      //     -->

      //   vector_reduce_{or,and}(<n x i1>)

      // and

      //   vector_reduce_s{min,max}(sext(<n x i1>))

      //     -->

      //   sext(vector_reduce_{or,and}(<n x i1>))

      // and

      //   vector_reduce_s{min,max}(zext(<n x i1>))

      //     -->

      //   zext(vector_reduce_{and,or}(<n x i1>))

      Value *Arg = II->getArgOperand(0);

      Value *Vect;


      if (Value *NewOp =

              simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

        replaceUse(II->getOperandUse(0), NewOp);

        return II;

      }


      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *VTy = dyn_cast<VectorType>(Vect->getType()))

          if (VTy->getElementType() == Builder.getInt1Ty()) {

            Instruction::CastOps ExtOpc = Instruction::CastOps::CastOpsEnd;

            if (Arg != Vect)

              ExtOpc = cast<CastInst>(Arg)->getOpcode();

            Value *Res = ((IID == Intrinsic::vector_reduce_smin) ==

                          (ExtOpc == Instruction::CastOps::ZExt))

                             ? Builder.CreateAndReduce(Vect)

                             : Builder.CreateOrReduce(Vect);

            if (Arg != Vect)

              Res = Builder.CreateCast(ExtOpc, Res, II->getType());

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_fmax:

  case Intrinsic::vector_reduce_fmin:

  case Intrinsic::vector_reduce_fadd:

  case Intrinsic::vector_reduce_fmul: {

    bool CanReorderLanes = (IID != Intrinsic::vector_reduce_fadd &&

                            IID != Intrinsic::vector_reduce_fmul) ||

                           II->hasAllowReassoc();

    const unsigned ArgIdx = (IID == Intrinsic::vector_reduce_fadd ||

                             IID == Intrinsic::vector_reduce_fmul)

                                ? 1

                                : 0;

    Value *Arg = II->getArgOperand(ArgIdx);

    if (Value *NewOp = simplifyReductionOperand(Arg, CanReorderLanes)) {

      replaceUse(II->getOperandUse(ArgIdx), NewOp);

      return nullptr;

    }

    break;

  }

  case Intrinsic::is_fpclass: {

    if (Instruction *I = foldIntrinsicIsFPClass(*II))

      return I;

    break;

  }

  case Intrinsic::threadlocal_address: {

    Align MinAlign = getKnownAlignment(II->getArgOperand(0), DL, II, &AC, &DT);

    MaybeAlign Align = II->getRetAlign();

    if (MinAlign > Align.valueOrOne()) {

      II->addRetAttr(Attribute::getWithAlignment(II->getContext(), MinAlign));

      return II;

    }

    break;

  }

  case Intrinsic::frexp: {

    Value *X;

    // The first result is idempotent with the added complication of the struct

    // return, and the second result is zero because the value is already

    // normalized.

    if (match(II->getArgOperand(0), m_ExtractValue<0>(m_Value(X)))) {

      if (match(X, m_Intrinsic<Intrinsic::frexp>(m_Value()))) {

        X = Builder.CreateInsertValue(

            X, Constant::getNullValue(II->getType()->getStructElementType(1)),

            1);

        return replaceInstUsesWith(*II, X);

      }

    }

    break;

  }

  case Intrinsic::get_active_lane_mask: {

    const APInt *Op0, *Op1;

    if (match(II->getOperand(0), m_StrictlyPositive(Op0)) &&

        match(II->getOperand(1), m_APInt(Op1))) {

      Type *OpTy = II->getOperand(0)->getType();

      return replaceInstUsesWith(

          *II, Builder.CreateIntrinsic(

                   II->getType(), Intrinsic::get_active_lane_mask,

                   {Constant::getNullValue(OpTy),

                    ConstantInt::get(OpTy, Op1->usub_sat(*Op0))}));

    }

    break;

  }

  default: {

    // Handle target specific intrinsics

    std::optional<Instruction *> V = targetInstCombineIntrinsic(*II);

    if (V)

      return *V;

    break;

  }

  }


  // Try to fold intrinsic into select/phi operands. This is legal if:

  //  * The intrinsic is speculatable.

  //  * The operand is one of the following:

  //    - a phi.

  //    - a select with a scalar condition.

  //    - a select with a vector condition and II is not a cross lane operation.

  if (isSafeToSpeculativelyExecuteWithVariableReplaced(&CI)) {

    for (Value *Op : II->args()) {

      if (auto *Sel = dyn_cast<SelectInst>(Op)) {

        bool IsVectorCond = Sel->getCondition()->getType()->isVectorTy();

        if (IsVectorCond && !isNotCrossLaneOperation(II))

          continue;

        // Don't replace a scalar select with a more expensive vector select if

        // we can't simplify both arms of the select.

        bool SimplifyBothArms =

            !Op->getType()->isVectorTy() && II->getType()->isVectorTy();

        if (Instruction *R = FoldOpIntoSelect(

                *II, Sel, /*FoldWithMultiUse=*/false, SimplifyBothArms))

          return R;

      }

      if (auto *Phi = dyn_cast<PHINode>(Op))

        if (Instruction *R = foldOpIntoPhi(*II, Phi))

          return R;

    }

  }


  if (Instruction *Shuf = foldShuffledIntrinsicOperands(II))

    return Shuf;


  if (Value *Reverse = foldReversedIntrinsicOperands(II))

    return replaceInstUsesWith(*II, Reverse);


  if (Value *Res = foldIdempotentBinaryIntrinsicRecurrence(*this, II))

    return replaceInstUsesWith(*II, Res);


  // Some intrinsics (like experimental_gc_statepoint) can be used in invoke

  // context, so it is handled in visitCallBase and we should trigger it.

  return visitCallBase(*II);

}


/// Fence instruction simplification.
///
/// Erases \p FI when a directly adjacent fence already covers it:
///  * the next instruction is a fence identical to \p FI, or
///  * the next or the previous instruction is a fence with the same sync
///    scope (system or single-thread only) and an ordering that is at least
///    as strong as the one on \p FI.
///
/// \returns the result of eraseInstFromFunction(FI) when the fence was
/// removed, nullptr otherwise.
Instruction *InstCombinerImpl::visitFenceInst(FenceInst &FI) {
  // True if Stronger is an identical or stronger fence than Weaker.
  auto Covers = [](FenceInst *Stronger, FenceInst *Weaker) {
    const auto Scope = Stronger->getSyncScopeID();
    // Only reason about two fences in the same scope, and only when that
    // scope is the global (system) or the single-thread one.
    const bool SameScope = Scope == Weaker->getSyncScopeID();
    const bool WellKnownScope =
        Scope == SyncScope::System || Scope == SyncScope::SingleThread;
    if (!SameScope || !WellKnownScope)
      return false;

    return isAtLeastOrStrongerThan(Stronger->getOrdering(),
                                   Weaker->getOrdering());
  };

  if (auto *Following = dyn_cast<FenceInst>(FI.getNextNode())) {
    // The identity check is solely here to handle arbitrary target-dependent
    // syncscopes, which the scope-aware comparison above refuses to handle.
    // TODO: Can remove if does not matter in practice.
    if (FI.isIdenticalTo(Following) || Covers(Following, &FI))
      return eraseInstFromFunction(FI);
  }

  auto *Preceding = dyn_cast_or_null<FenceInst>(FI.getPrevNode());
  if (Preceding && Covers(Preceding, &FI))
    return eraseInstFromFunction(FI);

  return nullptr;
}


// InvokeInst simplification
//
// Invokes get no invoke-specific handling here: the instruction is handed
// straight to visitCallBase, and whatever that returns is returned unchanged.
Instruction *InstCombinerImpl::visitInvokeInst(InvokeInst &II) {
  return visitCallBase(II);
}


// CallBrInst simplification
//
// CallBr instructions get no callbr-specific handling here: the instruction is
// handed straight to visitCallBase, and its result is returned unchanged.
Instruction *InstCombinerImpl::visitCallBrInst(CallBrInst &CBI) {
  return visitCallBase(CBI);
}


/// Run LibCallSimplifier on \p CI.
///
/// Nothing is attempted for calls without a directly called function, nor for
/// musttail / notail calls.
///
/// \returns nullptr if the simplifier produced no replacement value. Otherwise
/// returns \p CI itself when it has no uses, or the result of replacing all
/// uses of \p CI with the simplified value.
Instruction *InstCombinerImpl::tryOptimizeCall(CallInst *CI) {
  if (CI->getCalledFunction() == nullptr)
    return nullptr;

  // Skip optimizing notail and musttail calls so
  // LibCallSimplifier::optimizeCall doesn't have to preserve those invariants.
  // LibCallSimplifier::optimizeCall should try to preserve tail calls though.
  const bool HasTailConstraint = CI->isMustTailCall() || CI->isNoTailCall();
  if (HasTailConstraint)
    return nullptr;

  // Callbacks handed to the simplifier so that its use replacements and
  // erasures go through this combiner's own helpers.
  auto ReplaceUses = [this](Instruction *From, Value *With) {
    replaceInstUsesWith(*From, With);
  };
  auto EraseInst = [this](Instruction *I) { eraseInstFromFunction(*I); };

  LibCallSimplifier Simplifier(DL, &TLI, &DT, &DC, &AC, ORE, BFI, PSI,
                               ReplaceUses, EraseInst);
  Value *Simplified = Simplifier.optimizeCall(CI, Builder);
  if (!Simplified)
    return nullptr;

  ++NumSimplified;
  if (CI->use_empty())
    return CI;
  return replaceInstUsesWith(*CI, Simplified);
}


/// Look for the unique llvm.init.trampoline call that initialises the alloca
/// behind \p TrampMem.
///
/// Succeeds only if \p TrampMem is an alloca (possibly seen through pointer
/// casts, in which case the alloca's sole user must be \p TrampMem), every
/// user of \p TrampMem is an init.trampoline or adjust.trampoline intrinsic,
/// exactly one of them is init.trampoline, and that call takes \p TrampMem as
/// its first operand.
///
/// \returns that init.trampoline call, or nullptr.
static IntrinsicInst *findInitTrampolineFromAlloca(Value *TrampMem) {
  // Strip off at most one level of pointer casts, looking for an alloca.  This
  // is good enough in practice and simpler than handling any number of casts.
  Value *Base = TrampMem->stripPointerCasts();
  if (Base != TrampMem) {
    const bool OnlyUsedByTrampMem =
        Base->hasOneUse() && Base->user_back() == TrampMem;
    if (!OnlyUsedByTrampMem)
      return nullptr;
  }
  if (!isa<AllocaInst>(Base))
    return nullptr;

  IntrinsicInst *Init = nullptr;
  for (User *U : TrampMem->users()) {
    auto *Intr = dyn_cast<IntrinsicInst>(U);
    if (!Intr)
      return nullptr;

    switch (Intr->getIntrinsicID()) {
    case Intrinsic::init_trampoline:
      // More than one init_trampoline writes to this value.  Give up.
      if (Init)
        return nullptr;
      Init = Intr;
      break;
    case Intrinsic::adjust_trampoline:
      // Allow any number of calls to adjust.trampoline.
      break;
    default:
      // Any other intrinsic user defeats the analysis.
      return nullptr;
    }
  }

  // Either no call to init.trampoline was found, or the alloca is not being
  // used in the expected way (as the trampoline memory operand).
  if (!Init || Init->getOperand(0) != TrampMem)
    return nullptr;

  return Init;
}


/// Scan backwards from \p AdjustTramp, within its basic block, for an
/// llvm.init.trampoline call whose first operand is \p TrampMem.
///
/// The scan gives up at the first instruction that may write to memory (an
/// init.trampoline on \p TrampMem is tested for before that check) and when
/// the start of the block is reached.
///
/// \returns the matching init.trampoline call, or nullptr.
static IntrinsicInst *findInitTrampolineFromBB(IntrinsicInst *AdjustTramp,
                                               Value *TrampMem) {
  BasicBlock::iterator Cursor = AdjustTramp->getIterator();
  BasicBlock::iterator BlockStart = AdjustTramp->getParent()->begin();

  while (Cursor != BlockStart) {
    --Cursor;
    Instruction *Prev = &*Cursor;

    if (auto *Candidate = dyn_cast<IntrinsicInst>(Prev)) {
      const bool IsInit =
          Candidate->getIntrinsicID() == Intrinsic::init_trampoline;
      if (IsInit && Candidate->getOperand(0) == TrampMem)
        return Candidate;
    }

    // Anything that may write memory breaks the direct path between the
    // init.trampoline and the adjust.trampoline.
    if (Prev->mayWriteToMemory())
      return nullptr;
  }

  return nullptr;
}


// Given the callee of a call, which is expected to be (a pointer cast of) a
// call to llvm.adjust.trampoline, find and return the corresponding call to
// llvm.init.trampoline if the call to the trampoline can be optimized to a
// direct call to a function.  Otherwise return NULL.
//
// The alloca-based search is tried first; the same-basic-block backwards scan
// is the fallback.
static IntrinsicInst *findInitTrampoline(Value *Callee) {
  auto *Adjust = dyn_cast<IntrinsicInst>(Callee->stripPointerCasts());
  if (!Adjust)
    return nullptr;
  if (Adjust->getIntrinsicID() != Intrinsic::adjust_trampoline)
    return nullptr;

  Value *TrampMem = Adjust->getOperand(0);

  if (IntrinsicInst *Init = findInitTrampolineFromAlloca(TrampMem))
    return Init;
  return findInitTrampolineFromBB(Adjust, TrampMem);
}


/// Fold a call whose callee is a no-op inttoptr of llvm.ptrauth.sign or
/// llvm.ptrauth.resign and which carries a "ptrauth" operand bundle:
///
///   call(ptrauth.resign(p)), ["ptrauth"()] ->  call p, ["ptrauth"()]
///   call(ptrauth.sign(p)),   ["ptrauth"()] ->  call p
///
/// The fold only fires when the intrinsic operands match the bundle operands
/// as checked below.
///
/// \returns a newly created call (a copy of \p Call with the adjusted bundle
/// list and callee), or nullptr if the pattern does not match.
Instruction *InstCombinerImpl::foldPtrAuthIntrinsicCallee(CallBase &Call) {
  const Value *Callee = Call.getCalledOperand();
  const auto *Cast = dyn_cast<IntToPtrInst>(Callee);
  if (!Cast || !Cast->isNoopCast(DL))
    return nullptr;

  const auto *Signer = dyn_cast<IntrinsicInst>(Cast->getOperand(0));
  if (!Signer)
    return nullptr;

  const Intrinsic::ID SignerID = Signer->getIntrinsicID();
  const bool IsSignOrResign = SignerID == Intrinsic::ptrauth_resign ||
                              SignerID == Intrinsic::ptrauth_sign;
  if (!IsSignOrResign)
    return nullptr;

  // Isolate the ptrauth bundle from the others; the others are carried over
  // to the new call unchanged.
  std::optional<OperandBundleUse> PtrAuth;
  SmallVector<OperandBundleDef, 2> KeptBundles;
  const unsigned NumBundles = Call.getNumOperandBundles();
  for (unsigned Idx = 0; Idx != NumBundles; ++Idx) {
    OperandBundleUse Current = Call.getOperandBundleAt(Idx);
    if (Current.getTagID() != LLVMContext::OB_ptrauth) {
      KeptBundles.emplace_back(Current);
      continue;
    }
    PtrAuth = Current;
  }

  if (!PtrAuth)
    return nullptr;

  Value *NewCallee = nullptr;
  switch (SignerID) {
  case Intrinsic::ptrauth_resign: {
    // All of the following must hold, checked in this order:
    //  * the resign result key matches the bundle key,
    //  * the resign result discriminator matches the bundle discriminator,
    //  * the resign input (auth) key also matches the bundle key: we can't
    //    change the key on the new call we're generating, because we don't
    //    know what keys are valid.
    if (Signer->getOperand(3) != PtrAuth->Inputs[0] ||
        Signer->getOperand(4) != PtrAuth->Inputs[1] ||
        Signer->getOperand(1) != PtrAuth->Inputs[0])
      return nullptr;

    // The new call authenticates with the resign's *input* schema.
    Value *AuthOps[] = {Signer->getOperand(1), Signer->getOperand(2)};
    KeptBundles.emplace_back("ptrauth", AuthOps);
    NewCallee = Signer->getOperand(0);
    break;
  }

  case Intrinsic::ptrauth_sign: {
    // Sign key and sign discriminator must both match the bundle.
    // Non-ptrauth indirect calls are undesirable, but so is ptrauth.sign.
    if (Signer->getOperand(1) != PtrAuth->Inputs[0] ||
        Signer->getOperand(2) != PtrAuth->Inputs[1])
      return nullptr;

    // No ptrauth bundle is re-added: the new call is a plain call of p.
    NewCallee = Signer->getOperand(0);
    break;
  }

  default:
    llvm_unreachable("unexpected intrinsic ID");
  }

  if (!NewCallee)
    return nullptr;

  NewCallee = Builder.CreateBitOrPointerCast(NewCallee, Callee->getType());
  CallBase *Replacement = CallBase::Create(&Call, KeptBundles);
  Replacement->setCalledOperand(NewCallee);
  return Replacement;
}


/// Turn a call through a ptrauth constant that wraps a function into a direct
/// call of that function, dropping the call's "ptrauth" bundle.
///
/// Requires the call to carry a "ptrauth" bundle whose key and discriminator
/// are known to be compatible with the constant.
///
/// \returns the new call created without the ptrauth bundle, or nullptr if
/// the fold does not apply.
Instruction *InstCombinerImpl::foldPtrAuthConstantCallee(CallBase &Call) {
  auto *SignedCallee = dyn_cast<ConstantPtrAuth>(Call.getCalledOperand());
  // If the callee isn't a ptrauth constant, or the constant isn't based on a
  // function pointer, bail out.
  Function *Target =
      SignedCallee ? dyn_cast<Function>(SignedCallee->getPointer()) : nullptr;
  if (!Target)
    return nullptr;

  // Inspect the call ptrauth bundle to check it matches the ptrauth constant.
  auto AuthBundle = Call.getOperandBundle(LLVMContext::OB_ptrauth);
  if (!AuthBundle)
    return nullptr;

  auto *BundleKey = cast<ConstantInt>(AuthBundle->Inputs[0]);
  Value *BundleDiscriminator = AuthBundle->Inputs[1];

  // If the bundle doesn't match, this is probably going to fail to auth.
  const bool Compatible =
      SignedCallee->isKnownCompatibleWith(BundleKey, BundleDiscriminator, DL);
  if (!Compatible)
    return nullptr;

  // The bundle matches the constant: make this a direct call.
  auto *DirectCall =
      CallBase::removeOperandBundle(&Call, LLVMContext::OB_ptrauth);
  DirectCall->setCalledOperand(Target);
  return DirectCall;
}


/// Attach return attributes derived from allocation-function knowledge to
/// \p Call: dereferenceable / dereferenceable_or_null from a known non-zero
/// allocation size, and align from a constant power-of-two alignment argument.
///
/// Note: only cases which can't be driven from generic attributes are handled
/// here.  So, for example, nonnull and noalias (which are common properties of
/// some allocation functions) are expected to be handled via annotation of the
/// respective allocator declaration with generic attributes.
///
/// \returns the change flag computed below; always false for calls that do
/// not return a pointer.
bool InstCombinerImpl::annotateAnyAllocSite(CallBase &Call,
                                            const TargetLibraryInfo *TLI) {
  if (!Call.getType()->isPointerTy())
    return false;

  bool Changed = false;

  std::optional<APInt> Size = getAllocSize(&Call, TLI);
  if (Size && *Size != 0) {
    // TODO: We really should just emit deref_or_null here and then
    // let the generic inference code combine that with nonnull.
    const bool RetIsNonNull = Call.hasRetAttr(Attribute::NonNull);
    const Attribute::AttrKind DerefKind =
        RetIsNonNull ? Attribute::Dereferenceable
                     : Attribute::DereferenceableOrNull;

    // Count this as a change only if no attribute of that kind was present.
    Changed = !Call.hasRetAttr(DerefKind);
    if (RetIsNonNull)
      Call.addRetAttr(Attribute::getWithDereferenceableBytes(
          Call.getContext(), Size->getLimitedValue()));
    else
      Call.addRetAttr(Attribute::getWithDereferenceableOrNullBytes(
          Call.getContext(), Size->getLimitedValue()));
  }

  // Add alignment attribute if alignment is a power of two constant below the
  // maximum alignment.
  auto *AlignConst =
      dyn_cast_or_null<ConstantInt>(getAllocAlignment(&Call, TLI));
  if (!AlignConst ||
      !AlignConst->getValue().ult(llvm::Value::MaximumAlignment))
    return Changed;

  const uint64_t Requested = AlignConst->getZExtValue();
  if (!llvm::isPowerOf2_64(Requested))
    return Changed;

  // Only ever raise the alignment already recorded on the return value.
  Align Current = Call.getRetAlign().valueOrOne();
  Align Proposed = Align(Requested);
  if (Proposed > Current) {
    Call.addRetAttr(Attribute::getWithAlignment(Call.getContext(), Proposed));
    Changed = true;
  }

  return Changed;
}


/// Improvements for call, callbr and invoke instructions.
///
/// The steps below are tried in order; several of them return early:
///  1. Annotate allocation calls (annotateAnyAllocSite).
///  2. Simplify operands of parameters already known nonnull, and add the
///     nonnull attribute to pointer arguments proven non-zero.
///  3. Move function-pointer casts on the callee into the arguments
///     (transformConstExprCastCall).
///  4. For direct callees: drop a stale convergent attribute, and turn calls
///     with an incompatible calling convention into unreachable.
///  5. Turn calls of null (where null is not a defined address) or undef into
///     unreachable.
///  6. Fold calls through trampolines and through ptrauth intrinsics/constants.
///  7. Mark non-throwing inline asm calls nounwind.
///  8. Run the library call simplifier (tryOptimizeCall).
///  9. Forward a `returned` argument to the users of the call.
/// 10. Drop callee_type metadata and kcfi bundles from direct calls.
/// 11. Handle removable allocations (visitAllocSite).
/// 12. Clean up gc.relocates and the gc-live bundle of gc.statepoint.
///
/// \returns an instruction produced by one of the steps above, \p Call itself
/// when it was only modified in place, or nullptr.
Instruction *InstCombinerImpl::visitCallBase(CallBase &Call) {
  bool Changed = annotateAnyAllocSite(Call, &TLI);

  // Mark any parameters that are known to be non-null with the nonnull
  // attribute.  This is helpful for inlining calls to functions with null
  // checks on their arguments.
  SmallVector<unsigned, 4> ArgNos;
  unsigned ArgNo = 0;

  for (Value *V : Call.args()) {
    if (V->getType()->isPointerTy()) {
      // Simplify the nonnull operand if the parameter is known to be nonnull.
      // Otherwise, try to infer nonnull for it.
      bool HasDereferenceable = Call.getParamDereferenceableBytes(ArgNo) > 0;
      // dereferenceable(N > 0) only implies nonnull when null is not a defined
      // address in the pointer's address space.
      if (Call.paramHasAttr(ArgNo, Attribute::NonNull) ||
          (HasDereferenceable &&
           !NullPointerIsDefined(Call.getFunction(),
                                 V->getType()->getPointerAddressSpace()))) {
        if (Value *Res = simplifyNonNullOperand(V, HasDereferenceable)) {
          replaceOperand(Call, ArgNo, Res);
          Changed = true;
        }
      } else if (isKnownNonZero(V,
                                getSimplifyQuery().getWithInstruction(&Call))) {
        // Remember the index; all attributes are added in one go below.
        ArgNos.push_back(ArgNo);
      }
    }
    ArgNo++;
  }

  assert(ArgNo == Call.arg_size() && "Call arguments not processed correctly.");

  if (!ArgNos.empty()) {
    AttributeList AS = Call.getAttributes();
    LLVMContext &Ctx = Call.getContext();
    AS = AS.addParamAttribute(Ctx, ArgNos,
                              Attribute::get(Ctx, Attribute::NonNull));
    Call.setAttributes(AS);
    Changed = true;
  }

  // If the callee is a pointer to a function, attempt to move any casts to the
  // arguments of the call/callbr/invoke.
  Value *Callee = Call.getCalledOperand();
  Function *CalleeF = dyn_cast<Function>(Callee);
  // On success transformConstExprCastCall has already replaced and erased
  // Call, so there is nothing left to return here.
  if ((!CalleeF || CalleeF->getFunctionType() != Call.getFunctionType()) &&
      transformConstExprCastCall(Call))
    return nullptr;

  if (CalleeF) {
    // Remove the convergent attr on calls when the callee is not convergent.
    if (Call.isConvergent() && !CalleeF->isConvergent() &&
        !CalleeF->isIntrinsic()) {
      LLVM_DEBUG(dbgs() << "Removing convergent attr from instr " << Call
                        << "\n");
      Call.setNotConvergent();
      return &Call;
    }

    // If the call and callee calling conventions don't match, and neither one
    // of the calling conventions is compatible with C calling convention
    // this call must be unreachable, as the call is undefined.
    if ((CalleeF->getCallingConv() != Call.getCallingConv() &&
         !(CalleeF->getCallingConv() == llvm::CallingConv::C &&
           TargetLibraryInfoImpl::isCallingConvCCompatible(&Call)) &&
         !(Call.getCallingConv() == llvm::CallingConv::C &&
           TargetLibraryInfoImpl::isCallingConvCCompatible(CalleeF))) &&
        // Only do this for calls to a function with a body.  A prototype may
        // not actually end up matching the implementation's calling conv for a
        // variety of reasons (e.g. it may be written in assembly).
        !CalleeF->isDeclaration()) {
      Instruction *OldCall = &Call;
      CreateNonTerminatorUnreachable(OldCall);
      // If OldCall does not return void then replaceInstUsesWith poison.
      // This allows ValueHandlers and custom metadata to adjust itself.
      if (!OldCall->getType()->isVoidTy())
        replaceInstUsesWith(*OldCall, PoisonValue::get(OldCall->getType()));
      if (isa<CallInst>(OldCall))
        return eraseInstFromFunction(*OldCall);

      // We cannot remove an invoke or a callbr, because it would change the
      // CFG, just change the callee to a null pointer.
      cast<CallBase>(OldCall)->setCalledFunction(
          CalleeF->getFunctionType(),
          Constant::getNullValue(CalleeF->getType()));
      return nullptr;
    }
  }

  // Calling a null function pointer is undefined if a null address isn't
  // dereferenceable.
  if ((isa<ConstantPointerNull>(Callee) &&
       !NullPointerIsDefined(Call.getFunction())) ||
      isa<UndefValue>(Callee)) {
    // If Call does not return void then replaceInstUsesWith poison.
    // This allows ValueHandlers and custom metadata to adjust itself.
    if (!Call.getType()->isVoidTy())
      replaceInstUsesWith(Call, PoisonValue::get(Call.getType()));

    if (Call.isTerminator()) {
      // Can't remove an invoke or callbr because we cannot change the CFG.
      return nullptr;
    }

    // This instruction is not reachable, just remove it.
    CreateNonTerminatorUnreachable(&Call);
    return eraseInstFromFunction(Call);
  }

  // A callee produced by adjust.trampoline with a discoverable
  // init.trampoline is handled by transformCallThroughTrampoline.
  if (IntrinsicInst *II = findInitTrampoline(Callee))
    return transformCallThroughTrampoline(Call, *II);

  // Combine calls involving pointer authentication intrinsics.
  if (Instruction *NewCall = foldPtrAuthIntrinsicCallee(Call))
    return NewCall;

  // Combine calls to ptrauth constants.
  if (Instruction *NewCall = foldPtrAuthConstantCallee(Call))
    return NewCall;

  if (isa<InlineAsm>(Callee) && !Call.doesNotThrow()) {
    InlineAsm *IA = cast<InlineAsm>(Callee);
    if (!IA->canThrow()) {
      // Normal inline asm calls cannot throw - mark them
      // 'nounwind'.
      Call.setDoesNotThrow();
      Changed = true;
    }
  }

  // Try to optimize the call if possible, we require DataLayout for most of
  // this.  None of these calls are seen as possibly dead so go ahead and
  // delete the instruction now.
  if (CallInst *CI = dyn_cast<CallInst>(&Call)) {
    Instruction *I = tryOptimizeCall(CI);
    // If we changed something return the result, etc. Otherwise let
    // the fallthrough check.
    if (I) return eraseInstFromFunction(*I);
  }

  // If an argument is marked as returned by the call, users of the call can
  // use that argument directly (cast to the call's type when that is
  // lossless).  musttail calls are left alone.
  if (!Call.use_empty() && !Call.isMustTailCall())
    if (Value *ReturnedArg = Call.getReturnedArgOperand()) {
      Type *CallTy = Call.getType();
      Type *RetArgTy = ReturnedArg->getType();
      if (RetArgTy->canLosslesslyBitCastTo(CallTy))
        return replaceInstUsesWith(
            Call, Builder.CreateBitOrPointerCast(ReturnedArg, CallTy));
    }

  // Drop unnecessary callee_type metadata from calls that were converted
  // into direct calls.
  if (Call.getMetadata(LLVMContext::MD_callee_type) && !Call.isIndirectCall()) {
    Call.setMetadata(LLVMContext::MD_callee_type, nullptr);
    Changed = true;
  }

  // Drop unnecessary kcfi operand bundles from calls that were converted
  // into direct calls.
  auto Bundle = Call.getOperandBundle(LLVMContext::OB_kcfi);
  if (Bundle && !Call.isIndirectCall()) {
    // Debug-only diagnostic: report when the callee's kcfi_type metadata
    // disagrees with the type id the bundle expected.
    DEBUG_WITH_TYPE(DEBUG_TYPE "-kcfi", {
      if (CalleeF) {
        ConstantInt *FunctionType = nullptr;
        ConstantInt *ExpectedType = cast<ConstantInt>(Bundle->Inputs[0]);

        if (MDNode *MD = CalleeF->getMetadata(LLVMContext::MD_kcfi_type))
          FunctionType = mdconst::extract<ConstantInt>(MD->getOperand(0));

        if (FunctionType &&
            FunctionType->getZExtValue() != ExpectedType->getZExtValue())
          dbgs() << Call.getModule()->getName()
                 << ": warning: kcfi: " << Call.getCaller()->getName()
                 << ": call to " << CalleeF->getName()
                 << " using a mismatching function pointer type\n";
      }
    });

    return CallBase::removeOperandBundle(&Call, LLVMContext::OB_kcfi);
  }

  if (isRemovableAlloc(&Call, &TLI))
    return visitAllocSite(Call);

  // Handle intrinsics which can be used in both call and invoke context.
  switch (Call.getIntrinsicID()) {
  case Intrinsic::experimental_gc_statepoint: {
    GCStatepointInst &GCSP = *cast<GCStatepointInst>(&Call);
    // Base and derived pointers of every gc.relocate that survives the
    // cleanup loop below.
    SmallPtrSet<Value *, 32> LiveGcValues;
    for (const GCRelocateInst *Reloc : GCSP.getGCRelocates()) {
      GCRelocateInst &GCR = *const_cast<GCRelocateInst *>(Reloc);

      // Remove the relocation if unused.
      if (GCR.use_empty()) {
        eraseInstFromFunction(GCR);
        continue;
      }

      Value *DerivedPtr = GCR.getDerivedPtr();
      Value *BasePtr = GCR.getBasePtr();

      // Undef is undef, even after relocation.
      if (isa<UndefValue>(DerivedPtr) || isa<UndefValue>(BasePtr)) {
        replaceInstUsesWith(GCR, UndefValue::get(GCR.getType()));
        eraseInstFromFunction(GCR);
        continue;
      }

      if (auto *PT = dyn_cast<PointerType>(GCR.getType())) {
        // The relocation of null will be null for most any collector.
        // TODO: provide a hook for this in GCStrategy.  There might be some
        // weird collector this property does not hold for.
        if (isa<ConstantPointerNull>(DerivedPtr)) {
          // Use null-pointer of gc_relocate's type to replace it.
          replaceInstUsesWith(GCR, ConstantPointerNull::get(PT));
          eraseInstFromFunction(GCR);
          continue;
        }

        // isKnownNonNull -> nonnull attribute
        if (!GCR.hasRetAttr(Attribute::NonNull) &&
            isKnownNonZero(DerivedPtr,
                           getSimplifyQuery().getWithInstruction(&Call))) {
          GCR.addRetAttr(Attribute::NonNull);
          // We discovered new fact, re-check users.
          Worklist.pushUsersToWorkList(GCR);
        }
      }

      // If we have two copies of the same pointer in the statepoint argument
      // list, canonicalize to one.  This may let us common gc.relocates.
      if (GCR.getBasePtr() == GCR.getDerivedPtr() &&
          GCR.getBasePtrIndex() != GCR.getDerivedPtrIndex()) {
        auto *OpIntTy = GCR.getOperand(2)->getType();
        GCR.setOperand(2, ConstantInt::get(OpIntTy, GCR.getBasePtrIndex()));
      }

      // TODO: bitcast(relocate(p)) -> relocate(bitcast(p))
      // Canonicalize on the type from the uses to the defs

      // TODO: relocate((gep p, C, C2, ...)) -> gep(relocate(p), C, C2, ...)
      LiveGcValues.insert(BasePtr);
      LiveGcValues.insert(DerivedPtr);
    }
    std::optional<OperandBundleUse> Bundle =
        GCSP.getOperandBundle(LLVMContext::OB_gc_live);
    unsigned NumOfGCLives = LiveGcValues.size();
    // Nothing to shrink when there is no gc-live bundle or its size already
    // equals the number of live values.
    if (!Bundle || NumOfGCLives == Bundle->Inputs.size())
      break;
    // We can reduce the size of gc live bundle.
    // Val2Idx maps each distinct bundle input to its index in the new bundle;
    // inputs that are not live are mapped to the sentinel NumOfGCLives.
    DenseMap<Value *, unsigned> Val2Idx;
    std::vector<Value *> NewLiveGc;
    for (Value *V : Bundle->Inputs) {
      auto [It, Inserted] = Val2Idx.try_emplace(V);
      // Skip duplicates: only the first occurrence gets an index.
      if (!Inserted)
        continue;
      if (LiveGcValues.count(V)) {
        It->second = NewLiveGc.size();
        NewLiveGc.push_back(V);
      } else
        It->second = NumOfGCLives;
    }
    // Update all gc.relocates
    for (const GCRelocateInst *Reloc : GCSP.getGCRelocates()) {
      GCRelocateInst &GCR = *const_cast<GCRelocateInst *>(Reloc);
      Value *BasePtr = GCR.getBasePtr();
      assert(Val2Idx.count(BasePtr) && Val2Idx[BasePtr] != NumOfGCLives &&
             "Missed live gc for base pointer");
      // Operand 1 is rewritten to the base pointer's new index.
      auto *OpIntTy1 = GCR.getOperand(1)->getType();
      GCR.setOperand(1, ConstantInt::get(OpIntTy1, Val2Idx[BasePtr]));
      Value *DerivedPtr = GCR.getDerivedPtr();
      assert(Val2Idx.count(DerivedPtr) && Val2Idx[DerivedPtr] != NumOfGCLives &&
             "Missed live gc for derived pointer");
      // Operand 2 is rewritten to the derived pointer's new index.
      auto *OpIntTy2 = GCR.getOperand(2)->getType();
      GCR.setOperand(2, ConstantInt::get(OpIntTy2, Val2Idx[DerivedPtr]));
    }
    // Create new statepoint instruction.
    OperandBundleDef NewBundle("gc-live", NewLiveGc);
    return CallBase::Create(&Call, NewBundle);
  }
  default: { break; }
  }

  // Report in-place modifications by returning the call itself.
  return Changed ? &Call : nullptr;
}


/// If the callee is a constexpr cast of a function, attempt to move the cast to
/// the arguments of the call/invoke.
/// CallBrInst is not supported.
///
/// The function first runs a series of legality checks (callee kind, return
/// type, per-argument types and attributes) without touching the IR, and only
/// then builds a new direct call/invoke with casted arguments, redirects the
/// uses of \p Call to it (through a cast of the result if needed) and erases
/// \p Call.
///
/// \returns true if \p Call was replaced and erased, false if nothing was
/// changed.
bool InstCombinerImpl::transformConstExprCastCall(CallBase &Call) {
  auto *Callee =
      dyn_cast<Function>(Call.getCalledOperand()->stripPointerCasts());
  if (!Callee)
    return false;

  assert(!isa<CallBrInst>(Call) &&
         "CallBr's don't have a single point after a def to insert at");

  // Don't perform the transform for declarations, which may not be fully
  // accurate. For example, void @foo() is commonly used as a placeholder for
  // unknown prototypes.
  if (Callee->isDeclaration())
    return false;

  // If this is a call to a thunk function, don't remove the cast. Thunks are
  // used to transparently forward all incoming parameters and outgoing return
  // values, so it's important to leave the cast in place.
  if (Callee->hasFnAttribute("thunk"))
    return false;

  // If this is a call to a naked function, the assembly might be
  // using an argument, or otherwise rely on the frame layout,
  // the function prototype will mismatch.
  if (Callee->hasFnAttribute(Attribute::Naked))
    return false;

  // If this is a musttail call, the callee's prototype must match the caller's
  // prototype with the exception of pointee types. The code below doesn't
  // implement that, so we can't do this transform.
  // TODO: Do the transform if it only requires adding pointer casts.
  if (Call.isMustTailCall())
    return false;

  // Note: "Caller" is the call instruction being rewritten, not the function
  // that contains it.
  Instruction *Caller = &Call;
  const AttributeList &CallerPAL = Call.getAttributes();

  // Okay, this is a cast from a function to a different type.  Unless doing so
  // would cause a type conversion of one of our arguments, change this call to
  // be a direct call with arguments casted to the appropriate types.
  FunctionType *FT = Callee->getFunctionType();
  Type *OldRetTy = Caller->getType();
  Type *NewRetTy = FT->getReturnType();

  // Check to see if we are changing the return type...
  if (OldRetTy != NewRetTy) {

    if (NewRetTy->isStructTy())
      return false; // TODO: Handle multiple return values.

    // A non-castable return type is only acceptable if the result is unused.
    if (!CastInst::isBitOrNoopPointerCastable(NewRetTy, OldRetTy, DL)) {
      if (!Caller->use_empty())
        return false;   // Cannot transform this return value.
    }

    if (!CallerPAL.isEmpty() && !Caller->use_empty()) {
      AttrBuilder RAttrs(FT->getContext(), CallerPAL.getRetAttrs());
      if (RAttrs.overlaps(AttributeFuncs::typeIncompatible(
              NewRetTy, CallerPAL.getRetAttrs())))
        return false;   // Attribute not compatible with transformed value.
    }

    // If the callbase is an invoke instruction, and the return value is
    // used by a PHI node in a successor, we cannot change the return type of
    // the call because there is no place to put the cast instruction (without
    // breaking the critical edge).  Bail out in this case.
    if (!Caller->use_empty()) {
      BasicBlock *PhisNotSupportedBlock = nullptr;
      if (auto *II = dyn_cast<InvokeInst>(Caller))
        PhisNotSupportedBlock = II->getNormalDest();
      if (PhisNotSupportedBlock)
        for (User *U : Caller->users())
          if (PHINode *PN = dyn_cast<PHINode>(U))
            if (PN->getParent() == PhisNotSupportedBlock)
              return false;
    }
  }

  // Arguments with index below NumCommonArgs exist both at the call site and
  // in the callee's prototype.
  unsigned NumActualArgs = Call.arg_size();
  unsigned NumCommonArgs = std::min(FT->getNumParams(), NumActualArgs);

  // Prevent us turning:
  // declare void @takes_i32_inalloca(i32* inalloca)
  //  call void bitcast (void (i32*)* @takes_i32_inalloca to void (i32)*)(i32 0)
  //
  // into:
  //  call void @takes_i32_inalloca(i32* null)
  //
  //  Similarly, avoid folding away bitcasts of byval calls.
  if (Callee->getAttributes().hasAttrSomewhere(Attribute::InAlloca) ||
      Callee->getAttributes().hasAttrSomewhere(Attribute::Preallocated))
    return false;

  // Legality check for each common argument; nothing is modified yet.
  auto AI = Call.arg_begin();
  for (unsigned i = 0, e = NumCommonArgs; i != e; ++i, ++AI) {
    Type *ParamTy = FT->getParamType(i);
    Type *ActTy = (*AI)->getType();

    if (!CastInst::isBitOrNoopPointerCastable(ActTy, ParamTy, DL))
      return false;   // Cannot transform this parameter value.

    // Check if there are any incompatible attributes we cannot drop safely.
    if (AttrBuilder(FT->getContext(), CallerPAL.getParamAttrs(i))
            .overlaps(AttributeFuncs::typeIncompatible(
                ParamTy, CallerPAL.getParamAttrs(i),
                AttributeFuncs::ASK_UNSAFE_TO_DROP)))
      return false;   // Attribute not compatible with transformed value.

    if (Call.isInAllocaArgument(i) ||
        CallerPAL.hasParamAttr(i, Attribute::Preallocated))
      return false; // Cannot transform to and from inalloca/preallocated.

    if (CallerPAL.hasParamAttr(i, Attribute::SwiftError))
      return false;

    if (CallerPAL.hasParamAttr(i, Attribute::ByVal) !=
        Callee->getAttributes().hasParamAttr(i, Attribute::ByVal))
      return false; // Cannot transform to or from byval.
  }

  if (FT->getNumParams() < NumActualArgs && FT->isVarArg() &&
      !CallerPAL.isEmpty()) {
    // In this case we have more arguments than the new function type, but we
    // won't be dropping them.  Check that these extra arguments have attributes
    // that are compatible with being a vararg call argument.
    // Concretely: reject an sret attribute on one of the extra arguments.
    unsigned SRetIdx;
    if (CallerPAL.hasAttrSomewhere(Attribute::StructRet, &SRetIdx) &&
        SRetIdx - AttributeList::FirstArgIndex >= FT->getNumParams())
      return false;
  }

  // Okay, we decided that this is a safe thing to do: go ahead and start
  // inserting cast instructions as necessary.
  SmallVector<Value *, 8> Args;
  SmallVector<AttributeSet, 8> ArgAttrs;
  Args.reserve(NumActualArgs);
  ArgAttrs.reserve(NumActualArgs);

  // Get any return attributes.
  AttrBuilder RAttrs(FT->getContext(), CallerPAL.getRetAttrs());

  // If the return value is not being used, the type may not be compatible
  // with the existing attributes.  Wipe out any problematic attributes.
  RAttrs.remove(
      AttributeFuncs::typeIncompatible(NewRetTy, CallerPAL.getRetAttrs()));

  LLVMContext &Ctx = Call.getContext();
  AI = Call.arg_begin();
  for (unsigned i = 0; i != NumCommonArgs; ++i, ++AI) {
    Type *ParamTy = FT->getParamType(i);

    // Cast the actual argument to the parameter type where they differ.
    Value *NewArg = *AI;
    if ((*AI)->getType() != ParamTy)
      NewArg = Builder.CreateBitOrPointerCast(*AI, ParamTy);
    Args.push_back(NewArg);

    // Add any parameter attributes except the ones incompatible with the new
    // type. Note that we made sure all incompatible ones are safe to drop.
    AttributeMask IncompatibleAttrs = AttributeFuncs::typeIncompatible(
        ParamTy, CallerPAL.getParamAttrs(i), AttributeFuncs::ASK_SAFE_TO_DROP);
    ArgAttrs.push_back(
        CallerPAL.getParamAttrs(i).removeAttributes(Ctx, IncompatibleAttrs));
  }

  // If the function takes more arguments than the call was taking, add them
  // now.  The missing arguments are filled in with null values and carry no
  // attributes.
  for (unsigned i = NumCommonArgs; i != FT->getNumParams(); ++i) {
    Args.push_back(Constant::getNullValue(FT->getParamType(i)));
    ArgAttrs.push_back(AttributeSet());
  }

  // If the call passes more arguments than the callee declares: for a varargs
  // callee the surplus arguments are forwarded in promoted form; otherwise
  // they are simply not forwarded to the new call.
  if (FT->getNumParams() < NumActualArgs) {
    // TODO: if (!FT->isVarArg()) this call may be unreachable. PR14722
    if (FT->isVarArg()) {
      // Add all of the arguments in their promoted form to the arg list.
      // AI still points just past the last common argument here.
      for (unsigned i = FT->getNumParams(); i != NumActualArgs; ++i, ++AI) {
        Type *PTy = getPromotedType((*AI)->getType());
        Value *NewArg = *AI;
        if (PTy != (*AI)->getType()) {
          // Must promote to pass through va_arg area!
          Instruction::CastOps opcode =
            CastInst::getCastOpcode(*AI, false, PTy, false);
          NewArg = Builder.CreateCast(opcode, *AI, PTy);
        }
        Args.push_back(NewArg);

        // Add any parameter attributes.
        ArgAttrs.push_back(CallerPAL.getParamAttrs(i));
      }
    }
  }

  AttributeSet FnAttrs = CallerPAL.getFnAttrs();

  if (NewRetTy->isVoidTy())
    Caller->setName("");   // Void type should not have a name.

  assert((ArgAttrs.size() == FT->getNumParams() || FT->isVarArg()) &&
         "missing argument attributes");
  AttributeList NewCallerPAL = AttributeList::get(
      Ctx, FnAttrs, AttributeSet::get(Ctx, RAttrs), ArgAttrs);

  SmallVector<OperandBundleDef, 1> OpBundles;
  Call.getOperandBundlesAsDefs(OpBundles);

  // Build the replacement with the same instruction kind as the original
  // (invoke or call), keeping operand bundles and, for calls, the tail kind.
  CallBase *NewCall;
  if (InvokeInst *II = dyn_cast<InvokeInst>(Caller)) {
    NewCall = Builder.CreateInvoke(Callee, II->getNormalDest(),
                                   II->getUnwindDest(), Args, OpBundles);
  } else {
    NewCall = Builder.CreateCall(Callee, Args, OpBundles);
    cast<CallInst>(NewCall)->setTailCallKind(
        cast<CallInst>(Caller)->getTailCallKind());
  }
  NewCall->takeName(Caller);
  NewCall->setCallingConv(Call.getCallingConv());
  NewCall->setAttributes(NewCallerPAL);

  // Preserve prof metadata if any.
  NewCall->copyMetadata(*Caller, {LLVMContext::MD_prof});

  // Insert a cast of the return type as necessary.
  // NC is the last instruction created (new call or the cast of its result);
  // NV is the value that replaces the old call's result.
  Instruction *NC = NewCall;
  Value *NV = NC;
  if (OldRetTy != NV->getType() && !Caller->use_empty()) {
    assert(!NV->getType()->isVoidTy());
    NV = NC = CastInst::CreateBitOrPointerCast(NC, OldRetTy);
    NC->setDebugLoc(Caller->getDebugLoc());

    auto OptInsertPt = NewCall->getInsertionPointAfterDef();
    assert(OptInsertPt && "No place to insert cast");
    InsertNewInstBefore(NC, *OptInsertPt);
    Worklist.pushUsersToWorkList(*Caller);
  }

  if (!Caller->use_empty())
    replaceInstUsesWith(*Caller, NV);
  else if (Caller->hasValueHandle()) {
    // No uses to rewrite, but value handles tracking the old call still need
    // to be notified.
    if (OldRetTy == NV->getType())
      ValueHandleBase::ValueIsRAUWd(Caller, NV);
    else
      // We cannot call ValueIsRAUWd with a different type, and the
      // actual tracked value will disappear.
      ValueHandleBase::ValueIsDeleted(Caller);
  }

  eraseInstFromFunction(*Caller);
  return true;
}


/// Turn a call to a function created by init_trampoline / adjust_trampoline
/// intrinsic pair into a direct call to the underlying function.
///
/// \param Call  The call site to rewrite.
/// \param Tramp The trampoline intrinsic. Its operand 1 (after stripping
///              pointer casts) is the function that is called directly, and
///              its operand 2 is the chain value passed for the 'nest'
///              parameter.
///
/// \returns nullptr if \p Call already carries a 'nest' attribute; a newly
/// created call/invoke/callbr (created without an insertion position) when the
/// target function has a 'nest' parameter and the chain argument had to be
/// spliced in; otherwise \p Call itself, retargeted in place.
Instruction *
InstCombinerImpl::transformCallThroughTrampoline(CallBase &Call,
                                                 IntrinsicInst &Tramp) {
  FunctionType *FTy = Call.getFunctionType();
  AttributeList Attrs = Call.getAttributes();

  // If the call already has the 'nest' attribute somewhere then give up -
  // otherwise 'nest' would occur twice after splicing in the chain.
  if (Attrs.hasAttrSomewhere(Attribute::Nest))
    return nullptr;

  Function *NestF = cast<Function>(Tramp.getArgOperand(1)->stripPointerCasts());
  FunctionType *NestFTy = NestF->getFunctionType();
  AttributeList NestAttrs = NestF->getAttributes();

  // Look for a parameter marked with the 'nest' attribute.  On success,
  // NestArgNo is its index, NestTy its type and NestAttr its attribute set.
  unsigned NestArgNo = 0;
  Type *NestTy = nullptr;
  AttributeSet NestAttr;
  if (!NestAttrs.isEmpty()) {
    for (Type *ParamTy : NestFTy->params()) {
      AttributeSet AS = NestAttrs.getParamAttrs(NestArgNo);
      if (AS.hasAttribute(Attribute::Nest)) {
        // Record the parameter type and any other attributes.
        NestTy = ParamTy;
        NestAttr = AS;
        break;
      }
      ++NestArgNo;
    }
  }

  if (!NestTy) {
    // Replace the trampoline call with a direct call.  Since there is no
    // 'nest' parameter, there is no need to adjust the argument list.  Let the
    // generic code sort out any function type mismatches.
    Call.setCalledFunction(FTy, NestF);
    return &Call;
  }

  // Both lists may grow by one element for the chain argument.
  std::vector<Value *> NewArgs;
  std::vector<AttributeSet> NewArgAttrs;
  NewArgs.reserve(Call.arg_size() + 1);
  NewArgAttrs.reserve(Call.arg_size() + 1);

  // Appends the chain argument and its attributes.  The bitcast (if any) is
  // only created at the point where the chain is actually inserted.
  auto AppendNestArg = [&] {
    Value *NestVal = Tramp.getArgOperand(2);
    if (NestVal->getType() != NestTy)
      NestVal = Builder.CreateBitCast(NestVal, NestTy, "nest");
    NewArgs.push_back(NestVal);
    NewArgAttrs.push_back(NestAttr);
  };

  // Insert the nest argument into the call argument list, which may
  // mean appending it.  Likewise for attributes.
  {
    unsigned ArgNo = 0;
    for (Value *Arg : Call.args()) {
      if (ArgNo == NestArgNo)
        AppendNestArg();

      // Add the original argument and attributes.
      NewArgs.push_back(Arg);
      NewArgAttrs.push_back(Attrs.getParamAttrs(ArgNo));
      ++ArgNo;
    }
    // The chain goes last when its index equals the number of call arguments.
    if (ArgNo == NestArgNo)
      AppendNestArg();
  }

  // The trampoline may have been bitcast to a bogus type (FTy).
  // Handle this by synthesizing a new function type, equal to FTy
  // with the chain parameter inserted.
  std::vector<Type *> NewTypes;
  NewTypes.reserve(FTy->getNumParams() + 1);

  // Insert the chain's type into the list of parameter types, which may
  // mean appending it.
  {
    unsigned ParamNo = 0;
    for (Type *ParamTy : FTy->params()) {
      if (ParamNo == NestArgNo)
        NewTypes.push_back(NestTy);

      // Add the original type.
      NewTypes.push_back(ParamTy);
      ++ParamNo;
    }
    if (ParamNo == NestArgNo)
      NewTypes.push_back(NestTy);
  }

  // Replace the trampoline call with a direct call.  Let the generic
  // code sort out any function type mismatches.
  FunctionType *NewFTy =
      FunctionType::get(FTy->getReturnType(), NewTypes, FTy->isVarArg());
  AttributeList NewPAL =
      AttributeList::get(FTy->getContext(), Attrs.getFnAttrs(),
                         Attrs.getRetAttrs(), NewArgAttrs);

  SmallVector<OperandBundleDef, 1> OpBundles;
  Call.getOperandBundlesAsDefs(OpBundles);

  // Create the same kind of call-like instruction as the original.
  CallBase *NewCaller;
  if (auto *II = dyn_cast<InvokeInst>(&Call)) {
    NewCaller = InvokeInst::Create(NewFTy, NestF, II->getNormalDest(),
                                   II->getUnwindDest(), NewArgs, OpBundles);
  } else if (auto *CBI = dyn_cast<CallBrInst>(&Call)) {
    NewCaller =
        CallBrInst::Create(NewFTy, NestF, CBI->getDefaultDest(),
                           CBI->getIndirectDests(), NewArgs, OpBundles);
  } else {
    CallInst *NewCI = CallInst::Create(NewFTy, NestF, NewArgs, OpBundles);
    // Only plain calls carry a tail-call kind.
    NewCI->setTailCallKind(cast<CallInst>(Call).getTailCallKind());
    NewCaller = NewCI;
  }

  // Calling convention and attributes live on CallBase, so they are carried
  // over the same way for all three instruction kinds.
  NewCaller->setCallingConv(Call.getCallingConv());
  NewCaller->setAttributes(NewPAL);
  NewCaller->setDebugLoc(Call.getDebugLoc());

  return NewCaller;
}

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

Select
AMDGPU Register Bank Select
Definition AMDGPURegBankSelect.cpp:68

APFloat.h
This file declares a class to represent arbitrary precision floating point values and provide a varie...

APInt.h
This file implements a class to represent arbitrary precision integral constant values and operations...

APSInt.h
This file implements the APSInt class, which is a simple class that represents an arbitrary sized int...

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition ARMSLSHardening.cpp:73

IT
static cl::opt< ITMode > IT(cl::desc("IT block support"), cl::Hidden, cl::init(DefaultIT), cl::values(clEnumValN(DefaultIT, "arm-default-it", "Generate any type of IT block"), clEnumValN(RestrictedIT, "arm-restrict-it", "Disallow complex IT blocks")))

AliasAnalysis.h

ArrayRef.h

AssumeBundleBuilder.h

AssumeBundleQueries.h

AssumptionCache.h

AtomicOrdering.h
Atomic ordering constants.

AttributeMask.h

Attributes.h
This file contains the simple types necessary to represent the attributes associated with functions a...

BT
BitTracker BT
Definition BitTracker.cpp:68

A
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")

D
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")

E
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")

B
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")

Casting.h

CommandLine.h

Compiler.h

Constants.h
This file contains the declarations for the subclasses of Constant, which represent the different fla...

foldBitOrderCrossLogicOp
static SDValue foldBitOrderCrossLogicOp(SDNode *N, SelectionDAG &DAG)
Definition DAGCombiner.cpp:10901

DataLayout.h

DerivedTypes.h

DEBUG_TYPE
#define DEBUG_TYPE
Definition GenericCycleImpl.h:31

GlobalVariable.h

MI
IRTranslator LLVM IR MI
Definition IRTranslator.cpp:110

BasicBlock.h

Constant.h

Function.h

Instruction.h

IntrinsicInst.h

Type.h

User.h

Value.h

InlineAsm.h

InlinePriorityMode::Size
@ Size
Definition InlineOrder.cpp:25

getPromotedType
static Type * getPromotedType(Type *Ty)
Return the specified type promoted as it would be to pass through a va_arg area.
Definition InstCombineCalls.cpp:96

createOverflowTuple
static Instruction * createOverflowTuple(IntrinsicInst *II, Value *Result, Constant *Overflow)
Creates a result tuple for an overflow intrinsic II with a given Result and a constant Overflow value...
Definition InstCombineCalls.cpp:850

findInitTrampolineFromAlloca
static IntrinsicInst * findInitTrampolineFromAlloca(Value *TrampMem)
Definition InstCombineCalls.cpp:4119

removeTriviallyEmptyRange
static bool removeTriviallyEmptyRange(IntrinsicInst &EndI, InstCombinerImpl &IC, std::function< bool(const IntrinsicInst &)> IsStart)
Definition InstCombineCalls.cpp:799

inputDenormalIsDAZ
static bool inputDenormalIsDAZ(const Function &F, const Type *Ty)
Definition InstCombineCalls.cpp:903

reassociateMinMaxWithConstantInOperand
static Instruction * reassociateMinMaxWithConstantInOperand(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
If this min/max has a matching min/max operand with a constant, try to push the constant operand into...
Definition InstCombineCalls.cpp:1322

isIdempotentBinaryIntrinsic
static bool isIdempotentBinaryIntrinsic(Intrinsic::ID IID)
Helper to match idempotent binary intrinsics, namely, intrinsics where f(f(x, y), y) == f(x,...
Definition InstCombineCalls.cpp:1543

signBitMustBeTheSame
static bool signBitMustBeTheSame(Value *Op0, Value *Op1, const SimplifyQuery &SQ)
Return true if two values Op0 and Op1 are known to have the same sign.
Definition InstCombineCalls.cpp:1136

moveAddAfterMinMax
static Instruction * moveAddAfterMinMax(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
Try to canonicalize min/max(X + C0, C1) as min/max(X, C1 - C0) + C0.
Definition InstCombineCalls.cpp:1149

simplifyInvariantGroupIntrinsic
static Instruction * simplifyInvariantGroupIntrinsic(IntrinsicInst &II, InstCombinerImpl &IC)
This function transforms launder.invariant.group and strip.invariant.group like: launder(launder(x)) ...
Definition InstCombineCalls.cpp:445

haveSameOperands
static bool haveSameOperands(const IntrinsicInst &I, const IntrinsicInst &E, unsigned NumOperands)
Definition InstCombineCalls.cpp:779

getKnownSign
static std::optional< bool > getKnownSign(Value *Op, const SimplifyQuery &SQ)
Definition InstCombineCalls.cpp:1109

GuardWideningWindow
static cl::opt< unsigned > GuardWideningWindow("instcombine-guard-widening-window", cl::init(3), cl::desc("How wide an instruction window to bypass looking for " "another guard"))

hasUndefSource
static bool hasUndefSource(AnyMemTransferInst *MI)
Recognize a memcpy/memmove from a trivially otherwise unused alloca.
Definition InstCombineCalls.cpp:107

factorizeMinMaxTree
static Instruction * factorizeMinMaxTree(IntrinsicInst *II)
Reduce a sequence of min/max intrinsics with a common operand.
Definition InstCombineCalls.cpp:1350

simplifyNeonTbl1
static Value * simplifyNeonTbl1(const IntrinsicInst &II, InstCombiner::BuilderTy &Builder)
Convert a table lookup to shufflevector if the mask is constant.
Definition InstCombineCalls.cpp:743

foldClampRangeOfTwo
static Instruction * foldClampRangeOfTwo(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
If we have a clamp pattern like max (min X, 42), 41 – where the output can only be one of two possibl...
Definition InstCombineCalls.cpp:1248

simplifyReductionOperand
static Value * simplifyReductionOperand(Value *Arg, bool CanReorderLanes)
Definition InstCombineCalls.cpp:1586

findInitTrampolineFromBB
static IntrinsicInst * findInitTrampolineFromBB(IntrinsicInst *AdjustTramp, Value *TrampMem)
Definition InstCombineCalls.cpp:4158

foldIntrinsicUsingDistributiveLaws
static Value * foldIntrinsicUsingDistributiveLaws(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
Definition InstCombineCalls.cpp:1674

getKnownSignOrZero
static std::optional< bool > getKnownSignOrZero(Value *Op, const SimplifyQuery &SQ)
Definition InstCombineCalls.cpp:1123

foldMinimumOverTrailingOrLeadingZeroCount
static Value * foldMinimumOverTrailingOrLeadingZeroCount(Value *I0, Value *I1, const DataLayout &DL, InstCombiner::BuilderTy &Builder)
Fold an unsigned minimum of trailing or leading zero bits counts: umin(cttz(CtOp, ZeroUndef),...
Definition InstCombineCalls.cpp:1619

foldIdempotentBinaryIntrinsicRecurrence
static Value * foldIdempotentBinaryIntrinsicRecurrence(InstCombinerImpl &IC, IntrinsicInst *II)
Attempt to simplify value-accumulating recurrences of kind: umax.acc = phi i8 [ umax,...
Definition InstCombineCalls.cpp:1566

foldCtpop
static Instruction * foldCtpop(IntrinsicInst &II, InstCombinerImpl &IC)
Definition InstCombineCalls.cpp:651

foldCttzCtlz
static Instruction * foldCttzCtlz(IntrinsicInst &II, InstCombinerImpl &IC)
Definition InstCombineCalls.cpp:475

findInitTrampoline
static IntrinsicInst * findInitTrampoline(Value *Callee)
Definition InstCombineCalls.cpp:4179

fpclassTestIsFCmp0
static FCmpInst::Predicate fpclassTestIsFCmp0(FPClassTest Mask, const Function &F, Type *Ty)
Definition InstCombineCalls.cpp:911

leftDistributesOverRight
static bool leftDistributesOverRight(Instruction::BinaryOps LOp, bool HasNUW, bool HasNSW, Intrinsic::ID ROp)
Return whether "X LOp (Y ROp Z)" is always equal to "(X LOp Y) ROp (X LOp Z)".
Definition InstCombineCalls.cpp:1652

reassociateMinMaxWithConstants
static Value * reassociateMinMaxWithConstants(IntrinsicInst *II, IRBuilderBase &Builder, const SimplifyQuery &SQ)
If this min/max has a constant operand and an operand that is a matching min/max with a constant oper...
Definition InstCombineCalls.cpp:1288

canonicalizeConstantArg0ToArg1
static CallInst * canonicalizeConstantArg0ToArg1(CallInst &Call)
Definition InstCombineCalls.cpp:837

InstCombineInternal.h
This file provides internal interfaces used to implement the InstCombine.

InstCombiner.h
This file provides the interface for the instcombine pass implementation.

InstrTypes.h

hasNoSignedWrap
static bool hasNoSignedWrap(BinaryOperator &I)
Definition InstructionCombining.cpp:390

InstructionSimplify.h

InstructionWorklist.h

Instructions.h

Intrinsics.h

TemplateParamKind::Type
@ Type
Definition ItaniumDemangle.h:1243

KnownBits.h

inputDenormalIsIEEE
static bool inputDenormalIsIEEE(DenormalMode Mode)
Return true if it's possible to assume IEEE treatment of input denormals in F for Val.
Definition KnownFPClass.cpp:21

KnownFPClass.h

LLVMContext.h

Loads.h

F
#define F(x, y, z)
Definition MD5.cpp:55

I
#define I(x, y, z)
Definition MD5.cpp:58

MathExtras.h

getCalledFunction
static const Function * getCalledFunction(const Value *V)
Definition MemoryBuiltins.cpp:159

MemoryBuiltins.h

Metadata.h
This file contains the declarations for metadata subclasses.

Range
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))

II
uint64_t IntrinsicInst * II
Definition NVVMIntrRange.cpp:46

Mod
if(auto Err=PB.parsePassPipeline(MPM, Passes)) return wrap(std MPM run * Mod
Definition PassBuilderBindings.cpp:95

PatternMatch.h

Cond
const SmallVectorImpl< MachineOperand > & Cond
Definition RISCVRedundantCopyElimination.cpp:71

STLFunctionalExtras.h

SimplifyLibCalls.h

SmallBitVector.h
This file implements the SmallBitVector class.

SmallVector.h
This file defines the SmallVector class.

Statepoint.h

Statistic.h
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...

STATISTIC
#define STATISTIC(VARNAME, DESC)
Definition Statistic.h:171

Debug.h

LLVM_DEBUG
#define LLVM_DEBUG(...)
Definition Debug.h:114

DEBUG_WITH_TYPE
#define DEBUG_WITH_TYPE(TYPE,...)
DEBUG_WITH_TYPE macro - This macro should be used by passes to emit debug information.
Definition Debug.h:72

Y
static TableGen::Emitter::Opt Y("gen-skeleton-entry", EmitSkeleton, "Generate example skeleton entry")

X
static TableGen::Emitter::OptClass< SkeletonEmitter > X("gen-skeleton-class", "Generate example skeleton class")

Ptr
@ Ptr
Definition TargetLibraryInfo.cpp:77

Struct
@ Struct
Definition TargetLibraryInfo.cpp:78

Local.h

TypeSize.h

getOpcode
static std::optional< unsigned > getOpcode(ArrayRef< VPValue * > Values)
Returns the opcode of Values or ~0 if they do not all agree.
Definition VPlanSLP.cpp:247

ValueHandle.h

ValueTracking.h

VectorUtils.h

RHS
Value * RHS
Definition X86PartialReduction.cpp:81

LHS
Value * LHS
Definition X86PartialReduction.cpp:80

llvm::APFloat
Definition APFloat.h:940

llvm::APFloat::isNegative
bool isNegative() const
Definition APFloat.h:1431

llvm::APFloat::clearSign
void clearSign()
Definition APFloat.h:1280

llvm::APInt
Class for arbitrary precision integers.
Definition APInt.h:78

llvm::APInt::getAllOnes
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
Definition APInt.h:235

llvm::APInt::getSignMask
static APInt getSignMask(unsigned BitWidth)
Get the SignMask for a specific bit width.
Definition APInt.h:230

llvm::APInt::sgt
bool sgt(const APInt &RHS) const
Signed greater than comparison.
Definition APInt.h:1202

llvm::APInt::usub_ov
LLVM_ABI APInt usub_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1948

llvm::APInt::ugt
bool ugt(const APInt &RHS) const
Unsigned greater than comparison.
Definition APInt.h:1183

llvm::APInt::isZero
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
Definition APInt.h:381

llvm::APInt::urem
LLVM_ABI APInt urem(const APInt &RHS) const
Unsigned remainder operation.
Definition APInt.cpp:1666

llvm::APInt::getBitWidth
unsigned getBitWidth() const
Return the number of bits in the APInt.
Definition APInt.h:1489

llvm::APInt::ult
bool ult(const APInt &RHS) const
Unsigned less than comparison.
Definition APInt.h:1112

llvm::APInt::sadd_ov
LLVM_ABI APInt sadd_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1928

llvm::APInt::uadd_ov
LLVM_ABI APInt uadd_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1935

llvm::APInt::getSplat
static LLVM_ABI APInt getSplat(unsigned NewLen, const APInt &V)
Return a value containing V broadcasted over NewLen bits.
Definition APInt.cpp:651

llvm::APInt::getSignedMinValue
static APInt getSignedMinValue(unsigned numBits)
Gets minimum signed value of APInt for a specific bit width.
Definition APInt.h:220

llvm::APInt::uadd_sat
LLVM_ABI APInt uadd_sat(const APInt &RHS) const
Definition APInt.cpp:2036

llvm::APInt::isNonNegative
bool isNonNegative() const
Determine if this APInt Value is non-negative (>= 0)
Definition APInt.h:335

llvm::APInt::getLowBitsSet
static APInt getLowBitsSet(unsigned numBits, unsigned loBitsSet)
Constructs an APInt value that has the bottom loBitsSet bits set.
Definition APInt.h:307

llvm::APInt::getZero
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
Definition APInt.h:201

llvm::APInt::ssub_ov
LLVM_ABI APInt ssub_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1941

llvm::APSInt::getMinValue
static APSInt getMinValue(uint32_t numBits, bool Unsigned)
Return the APSInt representing the minimum integer value with the given bit width and signedness.
Definition APSInt.h:312

llvm::APSInt::getMaxValue
static APSInt getMaxValue(uint32_t numBits, bool Unsigned)
Return the APSInt representing the maximum integer value with the given bit width and signedness.
Definition APSInt.h:304

llvm::AnyMemSetInst
This class represents any memset intrinsic.
Definition IntrinsicInst.h:1316

llvm::AnyMemTransferInst
Definition IntrinsicInst.h:1336

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:41

llvm::AttributeSet::hasAttribute
LLVM_ABI bool hasAttribute(Attribute::AttrKind Kind) const
Return true if the attribute exists in this set.
Definition Attributes.cpp:1131

llvm::AttributeSet::get
static LLVM_ABI AttributeSet get(LLVMContext &C, const AttrBuilder &B)
Definition Attributes.cpp:921

llvm::Attribute::get
static LLVM_ABI Attribute get(LLVMContext &Context, AttrKind Kind, uint64_t Val=0)
Return a uniquified Attribute object.
Definition Attributes.cpp:95

llvm::Attribute::getWithDereferenceableBytes
static LLVM_ABI Attribute getWithDereferenceableBytes(LLVMContext &Context, uint64_t Bytes)
Definition Attributes.cpp:244

llvm::Attribute::getWithDereferenceableOrNullBytes
static LLVM_ABI Attribute getWithDereferenceableOrNullBytes(LLVMContext &Context, uint64_t Bytes)
Definition Attributes.cpp:250

llvm::Attribute::getWithAlignment
static LLVM_ABI Attribute getWithAlignment(LLVMContext &Context, Align Alignment)
Return a uniquified Attribute object that has the specific alignment set.
Definition Attributes.cpp:234

llvm::BasicBlock::reverse_iterator
InstListType::reverse_iterator reverse_iterator
Definition BasicBlock.h:172

llvm::BasicBlock::iterator
InstListType::iterator iterator
Instruction iterators...
Definition BasicBlock.h:170

llvm::BinaryOpIntrinsic::getRHS
Value * getRHS() const
Definition IntrinsicInst.h:937

llvm::BinaryOpIntrinsic::isSigned
LLVM_ABI bool isSigned() const
Whether the intrinsic is signed or unsigned.
Definition IntrinsicInst.cpp:827

llvm::BinaryOpIntrinsic::getBinaryOp
LLVM_ABI Instruction::BinaryOps getBinaryOp() const
Returns the binary operation underlying the intrinsic.
Definition IntrinsicInst.cpp:807

llvm::BinaryOpIntrinsic::getLHS
Value * getLHS() const
Definition IntrinsicInst.h:936

llvm::BinaryOperator
Definition InstrTypes.h:171

llvm::BinaryOperator::CreateFAddFMF
static BinaryOperator * CreateFAddFMF(Value *V1, Value *V2, FastMathFlags FMF, const Twine &Name="")
Definition InstrTypes.h:236

llvm::BinaryOperator::CreateNeg
static LLVM_ABI BinaryOperator * CreateNeg(Value *Op, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Helper functions to construct and inspect unary operations (NEG and NOT) via binary operators SUB and...
Definition Instructions.cpp:2715

llvm::BinaryOperator::CreateNSW
static BinaryOperator * CreateNSW(BinaryOps Opc, Value *V1, Value *V2, const Twine &Name="")
Definition InstrTypes.h:279

llvm::BinaryOperator::CreateNot
static LLVM_ABI BinaryOperator * CreateNot(Value *Op, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Definition Instructions.cpp:2728

llvm::BinaryOperator::Create
static LLVM_ABI BinaryOperator * Create(BinaryOps Op, Value *S1, Value *S2, const Twine &Name=Twine(), InsertPosition InsertBefore=nullptr)
Construct a binary instruction, given the opcode and the two operands.
Definition Instructions.cpp:2707

llvm::BinaryOperator::CreateNUW
static BinaryOperator * CreateNUW(BinaryOps Opc, Value *V1, Value *V2, const Twine &Name="")
Definition InstrTypes.h:294

llvm::BinaryOperator::CreateFMulFMF
static BinaryOperator * CreateFMulFMF(Value *V1, Value *V2, FastMathFlags FMF, const Twine &Name="")
Definition InstrTypes.h:244

llvm::BinaryOperator::CreateFDivFMF
static BinaryOperator * CreateFDivFMF(Value *V1, Value *V2, FastMathFlags FMF, const Twine &Name="")
Definition InstrTypes.h:248

llvm::BinaryOperator::CreateFSubFMF
static BinaryOperator * CreateFSubFMF(Value *V1, Value *V2, FastMathFlags FMF, const Twine &Name="")
Definition InstrTypes.h:240

llvm::BinaryOperator::CreateNSWNeg
static LLVM_ABI BinaryOperator * CreateNSWNeg(Value *Op, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Definition Instructions.cpp:2722

llvm::CallBase
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
Definition InstrTypes.h:1114

llvm::CallBase::setCallingConv
void setCallingConv(CallingConv::ID CC)
Definition InstrTypes.h:1408

llvm::CallBase::setDoesNotThrow
void setDoesNotThrow()
Definition InstrTypes.h:1954

llvm::CallBase::getRetAlign
MaybeAlign getRetAlign() const
Extract the alignment of the return value.
Definition InstrTypes.h:1767

llvm::CallBase::getOperandBundlesAsDefs
LLVM_ABI void getOperandBundlesAsDefs(SmallVectorImpl< OperandBundleDef > &Defs) const
Return the list of operand bundles attached to this instruction as a vector of OperandBundleDefs.
Definition Instructions.cpp:509

llvm::CallBase::getOperandBundleAt
OperandBundleUse getOperandBundleAt(unsigned Index) const
Return the operand bundle at a specific index.
Definition InstrTypes.h:2050

llvm::CallBase::getOperandBundle
std::optional< OperandBundleUse > getOperandBundle(StringRef Name) const
Return an operand bundle by name, if present.
Definition InstrTypes.h:2081

llvm::CallBase::getCalledFunction
Function * getCalledFunction() const
Returns the function called, or null if this is an indirect function invocation or the function signa...
Definition InstrTypes.h:1346

llvm::CallBase::isInAllocaArgument
bool isInAllocaArgument(unsigned ArgNo) const
Determine whether this argument is passed in an alloca.
Definition InstrTypes.h:1712

llvm::CallBase::hasRetAttr
bool hasRetAttr(Attribute::AttrKind Kind) const
Determine whether the return value has the given attribute.
Definition InstrTypes.h:1589

llvm::CallBase::getNumOperandBundles
unsigned getNumOperandBundles() const
Return the number of operand bundles associated with this User.
Definition InstrTypes.h:1994

llvm::CallBase::getParamDereferenceableBytes
uint64_t getParamDereferenceableBytes(unsigned i) const
Extract the number of dereferenceable bytes for a call or parameter (0=unknown).
Definition InstrTypes.h:1847

llvm::CallBase::getCallingConv
CallingConv::ID getCallingConv() const
Definition InstrTypes.h:1404

llvm::CallBase::paramHasAttr
LLVM_ABI bool paramHasAttr(unsigned ArgNo, Attribute::AttrKind Kind) const
Determine whether the argument or parameter has the given attribute.
Definition Instructions.cpp:418

llvm::CallBase::arg_begin
User::op_iterator arg_begin()
Return the iterator pointing to the beginning of the argument list.
Definition InstrTypes.h:1265

llvm::CallBase::isIndirectCall
LLVM_ABI bool isIndirectCall() const
Return true if the callsite is an indirect call.
Definition Instructions.cpp:335

llvm::CallBase::setNotConvergent
void setNotConvergent()
Definition InstrTypes.h:1967

llvm::CallBase::getCalledOperand
Value * getCalledOperand() const
Definition InstrTypes.h:1338

llvm::CallBase::setAttributes
void setAttributes(AttributeList A)
Set the attributes for this call.
Definition InstrTypes.h:1425

llvm::CallBase::doesNotThrow
bool doesNotThrow() const
Determine if the call cannot unwind.
Definition InstrTypes.h:1953

llvm::CallBase::addRetAttr
void addRetAttr(Attribute::AttrKind Kind)
Adds the attribute to the return value.
Definition InstrTypes.h:1489

llvm::CallBase::getArgOperand
Value * getArgOperand(unsigned i) const
Definition InstrTypes.h:1290

llvm::CallBase::arg_end
User::op_iterator arg_end()
Return the iterator pointing to the end of the argument list.
Definition InstrTypes.h:1271

llvm::CallBase::isConvergent
bool isConvergent() const
Determine if the invoke is convergent.
Definition InstrTypes.h:1965

llvm::CallBase::getFunctionType
FunctionType * getFunctionType() const
Definition InstrTypes.h:1203

llvm::CallBase::getIntrinsicID
LLVM_ABI Intrinsic::ID getIntrinsicID() const
Returns the intrinsic ID of the intrinsic called or Intrinsic::not_intrinsic if the called function i...
Definition Instructions.cpp:357

llvm::CallBase::getReturnedArgOperand
Value * getReturnedArgOperand() const
If one of the arguments has the 'returned' attribute, returns its operand value.
Definition InstrTypes.h:1893

llvm::CallBase::Create
static LLVM_ABI CallBase * Create(CallBase *CB, ArrayRef< OperandBundleDef > Bundles, InsertPosition InsertPt=nullptr)
Create a clone of CB with a different set of operand bundles and insert it before InsertPt.
Definition Instructions.cpp:302

llvm::CallBase::args
iterator_range< User::op_iterator > args()
Iteration adapter for range-for loops.
Definition InstrTypes.h:1281

llvm::CallBase::setCalledOperand
void setCalledOperand(Value *V)
Definition InstrTypes.h:1382

llvm::CallBase::removeOperandBundle
static LLVM_ABI CallBase * removeOperandBundle(CallBase *CB, uint32_t ID, InsertPosition InsertPt=nullptr)
Create a clone of CB with operand bundle ID removed.
Definition Instructions.cpp:600

llvm::CallBase::arg_size
unsigned arg_size() const
Definition InstrTypes.h:1288

llvm::CallBase::getAttributes
AttributeList getAttributes() const
Return the attributes for this call.
Definition InstrTypes.h:1422

llvm::CallBase::setCalledFunction
void setCalledFunction(Function *Fn)
Sets the function called, including updating the function type.
Definition InstrTypes.h:1385

llvm::CallBase::getCaller
LLVM_ABI Function * getCaller()
Helper to get the caller (the parent function).
Definition Instructions.cpp:328

llvm::CallBrInst
CallBr instruction, tracking function calls that may not return control but instead transfer it to a ...
Definition Instructions.h:3877

llvm::CallBrInst::Create
static CallBrInst * Create(FunctionType *Ty, Value *Func, BasicBlock *DefaultDest, ArrayRef< BasicBlock * > IndirectDests, ArrayRef< Value * > Args, const Twine &NameStr, InsertPosition InsertBefore=nullptr)
Definition Instructions.h:3912

llvm::CallInst
This class represents a function call, abstracting a target machine's calling convention.
Definition Instructions.h:1511

llvm::CallInst::isNoTailCall
bool isNoTailCall() const
Definition Instructions.h:1629

llvm::CallInst::Create
static CallInst * Create(FunctionType *Ty, Value *F, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Definition Instructions.h:1546

llvm::CallInst::isMustTailCall
bool isMustTailCall() const
Definition Instructions.h:1627

llvm::CastInst::getCastOpcode
static LLVM_ABI Instruction::CastOps getCastOpcode(const Value *Val, bool SrcIsSigned, Type *Ty, bool DstIsSigned)
Returns the opcode necessary to cast Val into Ty using usual casting rules.
Definition Instructions.cpp:3217

llvm::CastInst::CreateIntegerCast
static LLVM_ABI CastInst * CreateIntegerCast(Value *S, Type *Ty, bool isSigned, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Create a ZExt, BitCast, or Trunc for int -> int casts.
Definition Instructions.cpp:3131

llvm::CastInst::isBitOrNoopPointerCastable
static LLVM_ABI bool isBitOrNoopPointerCastable(Type *SrcTy, Type *DestTy, const DataLayout &DL)
Check whether a bitcast, inttoptr, or ptrtoint cast between these types is valid and a no-op.
Definition Instructions.cpp:3195

llvm::CastInst::CreateBitOrPointerCast
static LLVM_ABI CastInst * CreateBitOrPointerCast(Value *S, Type *Ty, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Create a BitCast, a PtrToInt, or an IntToPtr cast instruction.
Definition Instructions.cpp:3120

llvm::CastInst::Create
static LLVM_ABI CastInst * Create(Instruction::CastOps, Value *S, Type *Ty, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Provides a way to construct any of the CastInst subclasses using an opcode instead of the subclass's ...
Definition Instructions.cpp:3044

llvm::CmpInst::Predicate
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:676

llvm::CmpInst::FCMP_OEQ
@ FCMP_OEQ
0 0 0 1 True if ordered and equal
Definition InstrTypes.h:679

llvm::CmpInst::BAD_ICMP_PREDICATE
@ BAD_ICMP_PREDICATE
Definition InstrTypes.h:709

llvm::CmpInst::ICMP_SLT
@ ICMP_SLT
signed less than
Definition InstrTypes.h:705

llvm::CmpInst::ICMP_SLE
@ ICMP_SLE
signed less or equal
Definition InstrTypes.h:706

llvm::CmpInst::FCMP_OLT
@ FCMP_OLT
0 1 0 0 True if ordered and less than
Definition InstrTypes.h:682

llvm::CmpInst::FCMP_OGT
@ FCMP_OGT
0 0 1 0 True if ordered and greater than
Definition InstrTypes.h:680

llvm::CmpInst::FCMP_OGE
@ FCMP_OGE
0 0 1 1 True if ordered and greater than or equal
Definition InstrTypes.h:681

llvm::CmpInst::ICMP_UGT
@ ICMP_UGT
unsigned greater than
Definition InstrTypes.h:699

llvm::CmpInst::ICMP_SGT
@ ICMP_SGT
signed greater than
Definition InstrTypes.h:703

llvm::CmpInst::FCMP_ONE
@ FCMP_ONE
0 1 1 0 True if ordered and operands are unequal
Definition InstrTypes.h:684

llvm::CmpInst::FCMP_UEQ
@ FCMP_UEQ
1 0 0 1 True if unordered or equal
Definition InstrTypes.h:687

llvm::CmpInst::ICMP_ULT
@ ICMP_ULT
unsigned less than
Definition InstrTypes.h:701

llvm::CmpInst::FCMP_OLE
@ FCMP_OLE
0 1 0 1 True if ordered and less than or equal
Definition InstrTypes.h:683

llvm::CmpInst::ICMP_EQ
@ ICMP_EQ
equal
Definition InstrTypes.h:697

llvm::CmpInst::ICMP_NE
@ ICMP_NE
not equal
Definition InstrTypes.h:698

llvm::CmpInst::FCMP_UNE
@ FCMP_UNE
1 1 1 0 True if unordered or not equal
Definition InstrTypes.h:692

llvm::CmpInst::BAD_FCMP_PREDICATE
@ BAD_FCMP_PREDICATE
Definition InstrTypes.h:696

llvm::CmpInst::getSwappedPredicate
Predicate getSwappedPredicate() const
For example, EQ->EQ, SLE->SGE, ULT->UGT, OEQ->OEQ, ULE->UGE, OLT->OGT, etc.
Definition InstrTypes.h:827

llvm::CmpInst::getNonStrictPredicate
Predicate getNonStrictPredicate() const
For example, SGT -> SGE, SLT -> SLE, ULT -> ULE, UGT -> UGE.
Definition InstrTypes.h:871

llvm::CmpInst::getUnorderedPredicate
Predicate getUnorderedPredicate() const
Definition InstrTypes.h:811

llvm::ConstantAggregateZero::get
static LLVM_ABI ConstantAggregateZero * get(Type *Ty)
Definition Constants.cpp:1680

llvm::ConstantExpr::getPointerCast
static LLVM_ABI Constant * getPointerCast(Constant *C, Type *Ty)
Create a BitCast, AddrSpaceCast, or a PtrToInt cast constant expression.
Definition Constants.cpp:2249

llvm::ConstantExpr::getSub
static LLVM_ABI Constant * getSub(Constant *C1, Constant *C2, bool HasNUW=false, bool HasNSW=false)
Definition Constants.cpp:2657

llvm::ConstantExpr::getNeg
static LLVM_ABI Constant * getNeg(Constant *C, bool HasNSW=false)
Definition Constants.cpp:2638

llvm::ConstantFP::getInfinity
static LLVM_ABI Constant * getInfinity(Type *Ty, bool Negative=false)
Definition Constants.cpp:1108

llvm::ConstantFP::getZero
static LLVM_ABI Constant * getZero(Type *Ty, bool Negative=false)
Definition Constants.cpp:1062

llvm::ConstantInt
This is the shared class of boolean and integer constants.
Definition Constants.h:87

llvm::ConstantInt::getLimitedValue
uint64_t getLimitedValue(uint64_t Limit=~0ULL) const
getLimitedValue - If the value is smaller than the specified limit, return it, otherwise return the l...
Definition Constants.h:264

llvm::ConstantInt::getTrue
static LLVM_ABI ConstantInt * getTrue(LLVMContext &Context)
Definition Constants.cpp:871

llvm::ConstantInt::getFalse
static LLVM_ABI ConstantInt * getFalse(LLVMContext &Context)
Definition Constants.cpp:878

llvm::ConstantInt::getZExtValue
uint64_t getZExtValue() const
Return the constant as a 64-bit unsigned integer value after it has been zero extended as appropriate...
Definition Constants.h:163

llvm::ConstantInt::getValue
const APInt & getValue() const
Return the constant as an APInt value reference.
Definition Constants.h:154

llvm::ConstantInt::getBool
static LLVM_ABI ConstantInt * getBool(LLVMContext &Context, bool V)
Definition Constants.cpp:885

llvm::ConstantPointerNull::get
static LLVM_ABI ConstantPointerNull * get(PointerType *T)
Static factory methods - Return objects of the specified value.
Definition Constants.cpp:1836

llvm::ConstantPtrAuth::get
static LLVM_ABI ConstantPtrAuth * get(Constant *Ptr, ConstantInt *Key, ConstantInt *Disc, Constant *AddrDisc)
Return a pointer signed with the specified parameters.
Definition Constants.cpp:2066

llvm::ConstantRange
This class represents a range of values.
Definition ConstantRange.h:47

llvm::ConstantRange::Unsigned
@ Unsigned
Definition ConstantRange.h:333

llvm::ConstantRange::isFullSet
LLVM_ABI bool isFullSet() const
Return true if this set contains all of the elements possible for this data-type.
Definition ConstantRange.cpp:424

llvm::ConstantRange::icmp
LLVM_ABI bool icmp(CmpInst::Predicate Pred, const ConstantRange &Other) const
Does the predicate Pred hold between ranges this and Other?
Definition ConstantRange.cpp:253

llvm::ConstantRange::contains
LLVM_ABI bool contains(const APInt &Val) const
Return true if the specified value is in the set.
Definition ConstantRange.cpp:517

llvm::ConstantStruct::get
static LLVM_ABI Constant * get(StructType *T, ArrayRef< Constant * > V)
Definition Constants.cpp:1383

llvm::Constant
This is an important base class in LLVM.
Definition Constant.h:43

llvm::Constant::getIntegerValue
static LLVM_ABI Constant * getIntegerValue(Type *Ty, const APInt &V)
Return the value for an integer or pointer constant, or a vector thereof, with the given scalar value...
Definition Constants.cpp:403

llvm::Constant::getAllOnesValue
static LLVM_ABI Constant * getAllOnesValue(Type *Ty)
Definition Constants.cpp:420

llvm::Constant::getNullValue
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
Definition Constants.cpp:373

llvm::DataLayout
A parsed version of the target data layout string, and methods for querying it.
Definition DataLayout.h:63

llvm::DbgVariableRecord
Record of a variable value-assignment, aka a non-instruction representation of the dbg....
Definition DebugProgramInstruction.h:277

llvm::DenseMapBase::try_emplace
std::pair< iterator, bool > try_emplace(KeyT &&Key, Ts &&...Args)
Definition DenseMap.h:248

llvm::DenseMapBase::count
size_type count(const_arg_type_t< KeyT > Val) const
Return 1 if the specified key is in the map, 0 otherwise.
Definition DenseMap.h:174

llvm::DominatorTree::dominates
LLVM_ABI bool dominates(const BasicBlock *BB, const Use &U) const
Return true if the (end of the) basic block BB dominates the use U.
Definition Dominators.cpp:135

llvm::ElementCount
Definition TypeSize.h:299

llvm::FMFSource::intersect
static FMFSource intersect(Value *A, Value *B)
Intersect the FMF from two instructions.
Definition IRBuilder.h:107

llvm::FPExtInst
This class represents an extension of floating point types.
Definition Instructions.h:4721

llvm::FastMathFlags
Convenience struct for specifying and reasoning about fast-math flags.
Definition FMF.h:22

llvm::FastMathFlags::setNoSignedZeros
void setNoSignedZeros(bool B=true)
Definition FMF.h:84

llvm::FastMathFlags::allowReassoc
bool allowReassoc() const
Flag queries.
Definition FMF.h:64

llvm::FenceInst
An instruction for ordering other memory operations.
Definition Instructions.h:430

llvm::FenceInst::getSyncScopeID
SyncScope::ID getSyncScopeID() const
Returns the synchronization scope ID of this fence instruction.
Definition Instructions.h:466

llvm::FenceInst::getOrdering
AtomicOrdering getOrdering() const
Returns the ordering constraint of this fence instruction.
Definition Instructions.h:455

llvm::FunctionType
Class to represent function types.
Definition DerivedTypes.h:105

llvm::FunctionType::param_iterator
Type::subtype_iterator param_iterator
Definition DerivedTypes.h:128

llvm::FunctionType::get
static LLVM_ABI FunctionType * get(Type *Result, ArrayRef< Type * > Params, bool isVarArg)
This static method is the primary way of constructing a FunctionType.

llvm::Function
Definition Function.h:64

llvm::Function::isConvergent
bool isConvergent() const
Determine if the call is convergent.
Definition Function.h:610

llvm::Function::getFunctionType
FunctionType * getFunctionType() const
Returns the FunctionType for me.
Definition Function.h:209

llvm::Function::getCallingConv
CallingConv::ID getCallingConv() const
getCallingConv()/setCallingConv(CC) - These methods get and set the calling convention of this functio...
Definition Function.h:270

llvm::Function::getAttributes
AttributeList getAttributes() const
Return the attribute list for this Function.
Definition Function.h:352

llvm::Function::doesNotThrow
bool doesNotThrow() const
Determine if the function cannot unwind.
Definition Function.h:594

llvm::Function::isIntrinsic
bool isIntrinsic() const
isIntrinsic - Returns true if the function's name starts with "llvm.".
Definition Function.h:249

llvm::GCRelocateInst::getBasePtr
LLVM_ABI Value * getBasePtr() const
Definition IntrinsicInst.cpp:872

llvm::GCRelocateInst::getBasePtrIndex
unsigned getBasePtrIndex() const
The index into the associated statepoint's argument list which contains the base pointer of the pointe...
Definition IntrinsicInst.h:1724

llvm::GCRelocateInst::getDerivedPtr
LLVM_ABI Value * getDerivedPtr() const
Definition IntrinsicInst.cpp:883

llvm::GCRelocateInst::getDerivedPtrIndex
unsigned getDerivedPtrIndex() const
The index into the associated statepoint's argument list which contains the pointer whose relocation t...
Definition IntrinsicInst.h:1730

llvm::GCStatepointInst::getGCRelocates
std::vector< const GCRelocateInst * > getGCRelocates() const
Get list of all gc relocates linked to this statepoint. May contain several relocations for the same b...
Definition Statepoint.h:206

llvm::GlobalObject::getMetadata
MDNode * getMetadata(unsigned KindID) const
Get the current metadata attachments for the given kind, if any.
Definition Value.h:576

llvm::GlobalValue::isDeclaration
LLVM_ABI bool isDeclaration() const
Return true if the primary definition of this global value is outside of the current translation unit...
Definition Globals.cpp:328

llvm::GlobalValue::getType
PointerType * getType() const
Global values are always pointers.
Definition GlobalValue.h:296

llvm::GlobalVariable
Definition GlobalVariable.h:40

llvm::IRBuilderBase
Common base class shared among various IRBuilders.
Definition IRBuilder.h:114

llvm::IRBuilderBase::CreateLaunderInvariantGroup
LLVM_ABI Value * CreateLaunderInvariantGroup(Value *Ptr)
Create a launder.invariant.group intrinsic call.
Definition IRBuilder.cpp:1061

llvm::IRBuilderBase::getTrue
ConstantInt * getTrue()
Get the constant value for i1 true.
Definition IRBuilder.h:502

llvm::IRBuilderBase::CreateBinaryIntrinsic
LLVM_ABI Value * CreateBinaryIntrinsic(Intrinsic::ID ID, Value *LHS, Value *RHS, FMFSource FMFSource={}, const Twine &Name="")
Create a call to intrinsic ID with 2 operands which is mangled on the first type.
Definition IRBuilder.cpp:834

llvm::IRBuilderBase::CreateIntrinsic
LLVM_ABI CallInst * CreateIntrinsic(Intrinsic::ID ID, ArrayRef< Type * > Types, ArrayRef< Value * > Args, FMFSource FMFSource={}, const Twine &Name="")
Create a call to intrinsic ID with Args, mangled using Types.
Definition IRBuilder.cpp:845

llvm::IRBuilderBase::CreateSub
Value * CreateSub(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition IRBuilder.h:1420

llvm::IRBuilderBase::CreateUnaryIntrinsic
LLVM_ABI CallInst * CreateUnaryIntrinsic(Intrinsic::ID ID, Value *V, FMFSource FMFSource={}, const Twine &Name="")
Create a call to intrinsic ID with 1 operand which is mangled on its type.
Definition IRBuilder.cpp:826

llvm::IRBuilderBase::CreateZExt
Value * CreateZExt(Value *V, Type *DestTy, const Twine &Name="", bool IsNonNeg=false)
Definition IRBuilder.h:2085

llvm::IRBuilderBase::getFalse
ConstantInt * getFalse()
Get the constant value for i1 false.
Definition IRBuilder.h:507

llvm::IRBuilderBase::CreateICmp
Value * CreateICmp(CmpInst::Predicate P, Value *LHS, Value *RHS, const Twine &Name="")
Definition IRBuilder.h:2442

llvm::IRBuilderBase::CreateAddrSpaceCast
Value * CreateAddrSpaceCast(Value *V, Type *DestTy, const Twine &Name="")
Definition IRBuilder.h:2212

llvm::IRBuilderBase::CreateStripInvariantGroup
LLVM_ABI Value * CreateStripInvariantGroup(Value *Ptr)
Create a strip.invariant.group intrinsic call.
Definition IRBuilder.cpp:1077

llvm::Init
Definition Record.h:286

llvm::InsertValueInst::Create
static InsertValueInst * Create(Value *Agg, Value *Val, ArrayRef< unsigned > Idxs, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Definition Instructions.h:2558

llvm::InstCombinerImpl
Definition InstCombineInternal.h:63

llvm::InstCombinerImpl::computeKnownFPClass
KnownFPClass computeKnownFPClass(Value *Val, FastMathFlags FMF, FPClassTest Interested=fcAllFlags, const Instruction *CtxI=nullptr, unsigned Depth=0) const
Definition InstCombineInternal.h:205

llvm::InstCombinerImpl::foldOpIntoPhi
Instruction * foldOpIntoPhi(Instruction &I, PHINode *PN, bool AllowMultipleUses=false)
Given a binary operator, cast instruction, or select which has a PHI node as operand #0,...
Definition InstructionCombining.cpp:1876

llvm::InstCombinerImpl::SimplifyDemandedVectorElts
Value * SimplifyDemandedVectorElts(Value *V, APInt DemandedElts, APInt &PoisonElts, unsigned Depth=0, bool AllowMultipleUsers=false) override
The specified value produces a vector with any number of elements.
Definition InstCombineSimplifyDemanded.cpp:1457

llvm::InstCombinerImpl::SimplifyDemandedBits
bool SimplifyDemandedBits(Instruction *I, unsigned Op, const APInt &DemandedMask, KnownBits &Known, const SimplifyQuery &Q, unsigned Depth=0) override
This form of SimplifyDemandedBits simplifies the specified instruction operand if possible,...
Definition InstCombineSimplifyDemanded.cpp:153

llvm::InstCombinerImpl::FoldOpIntoSelect
Instruction * FoldOpIntoSelect(Instruction &Op, SelectInst *SI, bool FoldWithMultiUse=false, bool SimplifyBothArms=false)
Given an instruction with a select as one operand and a constant as the other operand,...
Definition InstructionCombining.cpp:1779

llvm::InstCombinerImpl::SimplifyAnyMemSet
Instruction * SimplifyAnyMemSet(AnyMemSetInst *MI)
Definition InstCombineCalls.cpp:219

llvm::InstCombinerImpl::visitFree
Instruction * visitFree(CallInst &FI, Value *FreedOp)
Definition InstructionCombining.cpp:3960

llvm::InstCombinerImpl::visitCallBrInst
Instruction * visitCallBrInst(CallBrInst &CBI)
Definition InstCombineCalls.cpp:4090

llvm::InstCombinerImpl::eraseInstFromFunction
Instruction * eraseInstFromFunction(Instruction &I) override
Combiner aware instruction erasure.
Definition InstCombineInternal.h:502

llvm::InstCombinerImpl::foldReversedIntrinsicOperands
Value * foldReversedIntrinsicOperands(IntrinsicInst *II)
If all arguments of the intrinsic are reverses, try to pull the reverse after the intrinsic.
Definition InstCombineCalls.cpp:1467

llvm::InstCombinerImpl::tryGetLog2
Value * tryGetLog2(Value *Op, bool AssumeNonZero)
Definition InstCombineInternal.h:847

llvm::InstCombinerImpl::visitFenceInst
Instruction * visitFenceInst(FenceInst &FI)
Definition InstCombineCalls.cpp:4057

llvm::InstCombinerImpl::foldShuffledIntrinsicOperands
Instruction * foldShuffledIntrinsicOperands(IntrinsicInst *II)
If all arguments of the intrinsic are unary shuffles with the same mask, try to shuffle after the int...
Definition InstCombineCalls.cpp:1410

llvm::InstCombinerImpl::visitInvokeInst
Instruction * visitInvokeInst(InvokeInst &II)
Definition InstCombineCalls.cpp:4085

llvm::InstCombinerImpl::SimplifyDemandedInstructionBits
bool SimplifyDemandedInstructionBits(Instruction &Inst)
Tries to simplify operands to an integer instruction based on its demanded bits.
Definition InstCombineSimplifyDemanded.cpp:145

llvm::InstCombinerImpl::CreateNonTerminatorUnreachable
void CreateNonTerminatorUnreachable(Instruction *InsertAt)
Create and insert the idiom we use to indicate a block is unreachable without having to rewrite the C...
Definition InstCombineInternal.h:489

llvm::InstCombinerImpl::visitVAEndInst
Instruction * visitVAEndInst(VAEndInst &I)
Definition InstCombineCalls.cpp:826

llvm::InstCombinerImpl::matchBSwapOrBitReverse
Instruction * matchBSwapOrBitReverse(Instruction &I, bool MatchBSwaps, bool MatchBitReversals)
Given an initial instruction, check to see if it is the root of a bswap/bitreverse idiom.
Definition InstCombineAndOrXor.cpp:2907

llvm::InstCombinerImpl::unshuffleConstant
Constant * unshuffleConstant(ArrayRef< int > ShMask, Constant *C, VectorType *NewCTy)
Find a constant NewC that has property: shuffle(NewC, ShMask) = C. Returns nullptr if such a constant ...
Definition InstructionCombining.cpp:2293

llvm::InstCombinerImpl::visitAllocSite
Instruction * visitAllocSite(Instruction &FI)
Definition InstructionCombining.cpp:3710

llvm::InstCombinerImpl::SimplifyAnyMemTransfer
Instruction * SimplifyAnyMemTransfer(AnyMemTransferInst *MI)
Definition InstCombineCalls.cpp:117

llvm::InstCombinerImpl::computeOverflow
OverflowResult computeOverflow(Instruction::BinaryOps BinaryOp, bool IsSigned, Value *LHS, Value *RHS, Instruction *CxtI) const
Definition InstCombineCompares.cpp:6489

llvm::InstCombinerImpl::visitCallInst
Instruction * visitCallInst(CallInst &CI)
CallInst simplification.
Definition InstCombineCalls.cpp:1735

llvm::InstCombiner::SQ
SimplifyQuery SQ
Definition InstCombiner.h:79

llvm::InstCombiner::ComputeMaxSignificantBits
unsigned ComputeMaxSignificantBits(const Value *Op, const Instruction *CxtI=nullptr, unsigned Depth=0) const
Definition InstCombiner.h:464

llvm::InstCombiner::BuilderTy
IRBuilder< TargetFolder, IRBuilderCallbackInserter > BuilderTy
An IRBuilder that automatically inserts new instructions into the worklist.
Definition InstCombiner.h:60

llvm::InstCombiner::isFreeToInvert
bool isFreeToInvert(Value *V, bool WillInvertAllUses, bool &DoesConsume)
Return true if the specified value is free to invert (apply ~ to).
Definition InstCombiner.h:230

llvm::InstCombiner::getDominatorTree
DominatorTree & getDominatorTree() const
Definition InstCombiner.h:338

llvm::InstCombiner::BFI
BlockFrequencyInfo * BFI
Definition InstCombiner.h:81

llvm::InstCombiner::TLI
TargetLibraryInfo & TLI
Definition InstCombiner.h:76

llvm::InstCombiner::InsertNewInstBefore
Instruction * InsertNewInstBefore(Instruction *New, BasicBlock::iterator Old)
Inserts an instruction New before instruction Old.
Definition InstCombiner.h:370

llvm::InstCombiner::AA
AAResults * AA
Definition InstCombiner.h:72

llvm::InstCombiner::replaceInstUsesWith
Instruction * replaceInstUsesWith(Instruction &I, Value *V)
A combiner-aware RAUW-like routine.
Definition InstCombiner.h:390

llvm::InstCombiner::replaceUse
void replaceUse(Use &U, Value *NewValue)
Replace use and add the previously used value to the worklist.
Definition InstCombiner.h:422

llvm::InstCombiner::Worklist
InstructionWorklist & Worklist
A worklist of the instructions that need to be simplified.
Definition InstCombiner.h:65

llvm::InstCombiner::DL
const DataLayout & DL
Definition InstCombiner.h:78

llvm::InstCombiner::DC
DomConditionCache DC
Definition InstCombiner.h:84

llvm::InstCombiner::computeKnownBits
void computeKnownBits(const Value *V, KnownBits &Known, const Instruction *CxtI, unsigned Depth=0) const
Definition InstCombiner.h:435

llvm::InstCombiner::targetInstCombineIntrinsic
std::optional< Instruction * > targetInstCombineIntrinsic(IntrinsicInst &II)
Definition InstructionCombining.cpp:162

llvm::InstCombiner::AC
AssumptionCache & AC
Definition InstCombiner.h:75

llvm::InstCombiner::replaceOperand
Instruction * replaceOperand(Instruction &I, unsigned OpNum, Value *V)
Replace operand of instruction and add old operand to the worklist.
Definition InstCombiner.h:414

llvm::InstCombiner::MaskedValueIsZero
bool MaskedValueIsZero(const Value *V, const APInt &Mask, const Instruction *CxtI=nullptr, unsigned Depth=0) const
Definition InstCombiner.h:452

llvm::InstCombiner::DT
DominatorTree & DT
Definition InstCombiner.h:77

llvm::InstCombiner::PSI
ProfileSummaryInfo * PSI
Definition InstCombiner.h:83

llvm::InstCombiner::Builder
BuilderTy & Builder
Definition InstCombiner.h:61

llvm::InstCombiner::getAssumptionCache
AssumptionCache & getAssumptionCache() const
Definition InstCombiner.h:336

llvm::InstCombiner::ORE
OptimizationRemarkEmitter & ORE
Definition InstCombiner.h:80

llvm::InstCombiner::getFreelyInverted
Value * getFreelyInverted(Value *V, bool WillInvertAllUses, BuilderTy *Builder, bool &DoesConsume)
Definition InstCombiner.h:211

llvm::InstCombiner::getSimplifyQuery
const SimplifyQuery & getSimplifyQuery() const
Definition InstCombiner.h:340

llvm::InstCombiner::isKnownToBeAPowerOfTwo
bool isKnownToBeAPowerOfTwo(const Value *V, bool OrZero=false, const Instruction *CxtI=nullptr, unsigned Depth=0)
Definition InstCombiner.h:445

llvm::Instruction
Definition Instruction.h:69

llvm::Instruction::setHasNoUnsignedWrap
LLVM_ABI void setHasNoUnsignedWrap(bool b=true)
Set or clear the nuw flag on this instruction, which must be an operator which supports this flag.
Definition Instruction.cpp:391

llvm::Instruction::mayWriteToMemory
LLVM_ABI bool mayWriteToMemory() const LLVM_READONLY
Return true if this instruction may modify memory.
Definition Instruction.cpp:1047

llvm::Instruction::copyIRFlags
LLVM_ABI void copyIRFlags(const Value *V, bool IncludeWrapFlags=true)
Convenience method to copy supported exact, fast-math, and (optionally) wrapping flags from V to this...
Definition Instruction.cpp:692

llvm::Instruction::setHasNoSignedWrap
LLVM_ABI void setHasNoSignedWrap(bool b=true)
Set or clear the nsw flag on this instruction, which must be an operator which supports this flag.
Definition Instruction.cpp:398

llvm::Instruction::getDebugLoc
const DebugLoc & getDebugLoc() const
Return the debug location for this node as a DebugLoc.
Definition Instruction.h:513

llvm::Instruction::getModule
LLVM_ABI const Module * getModule() const
Return the module owning the function this instruction belongs to or nullptr if the function does not...
Definition Instruction.cpp:82

llvm::Instruction::setAAMetadata
LLVM_ABI void setAAMetadata(const AAMDNodes &N)
Sets the AA metadata on this instruction from the AAMDNodes structure.
Definition Metadata.cpp:1832

llvm::Instruction::moveBefore
LLVM_ABI void moveBefore(InstListType::iterator InsertPos)
Unlink this instruction from its current basic block and insert it into the basic block that InsertPos ...
Definition Instruction.cpp:188

llvm::Instruction::getFunction
LLVM_ABI const Function * getFunction() const
Return the function this instruction belongs to.
Definition Instruction.cpp:86

llvm::Instruction::getMetadata
MDNode * getMetadata(unsigned KindID) const
Get the metadata of given kind attached to this Instruction.
Definition Instruction.h:428

llvm::Instruction::isTerminator
bool isTerminator() const
Definition Instruction.h:315

llvm::Instruction::setMetadata
LLVM_ABI void setMetadata(unsigned KindID, MDNode *Node)
Set the metadata of the specified kind to the specified node.
Definition Metadata.cpp:1746

llvm::Instruction::BinaryOps
BinaryOps
Definition Instruction.h:998

llvm::Instruction::getInsertionPointAfterDef
LLVM_ABI std::optional< InstListType::iterator > getInsertionPointAfterDef()
Get the first insertion point at which the result of this instruction is defined.
Definition Instruction.cpp:356

llvm::Instruction::isIdenticalTo
LLVM_ABI bool isIdenticalTo(const Instruction *I) const LLVM_READONLY
Return true if the specified instruction is exactly identical to the current one.
Definition Instruction.cpp:951

llvm::Instruction::setDebugLoc
void setDebugLoc(DebugLoc Loc)
Set the debug location information for this instruction.
Definition Instruction.h:510

llvm::Instruction::copyMetadata
LLVM_ABI void copyMetadata(const Instruction &SrcInst, ArrayRef< unsigned > WL=ArrayRef< unsigned >())
Copy metadata from SrcInst to this instruction.
Definition Instruction.cpp:1359

llvm::Instruction::CastOps
CastOps
Definition Instruction.h:1012

llvm::IntegerType
Class to represent integer types.
Definition DerivedTypes.h:42

llvm::IntegerType::get
static LLVM_ABI IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition Type.cpp:319

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition IntrinsicInst.h:49

llvm::IntrinsicInst::getIntrinsicID
Intrinsic::ID getIntrinsicID() const
Return the intrinsic ID of this intrinsic.
Definition IntrinsicInst.h:56

llvm::InvokeInst
Invoke instruction.
Definition Instructions.h:3716

llvm::InvokeInst::Create
static InvokeInst * Create(FunctionType *Ty, Value *Func, BasicBlock *IfNormal, BasicBlock *IfException, ArrayRef< Value * > Args, const Twine &NameStr, InsertPosition InsertBefore=nullptr)
Definition Instructions.h:3756

llvm::LLVMContext::OB_kcfi
@ OB_kcfi
Definition LLVMContext.h:98

llvm::LLVMContext::OB_ptrauth
@ OB_ptrauth
Definition LLVMContext.h:97

llvm::LLVMContext::OB_gc_live
@ OB_gc_live
Definition LLVMContext.h:95

llvm::LoadInst
An instruction for reading from memory.
Definition Instructions.h:181

llvm::MDNode
Metadata node.
Definition Metadata.h:1078

llvm::MDNode::get
static MDTuple * get(LLVMContext &Context, ArrayRef< Metadata * > MDs)
Definition Metadata.h:1569

llvm::MinMaxIntrinsic::getPredicate
static ICmpInst::Predicate getPredicate(Intrinsic::ID ID)
Returns the comparison predicate underlying the intrinsic.
Definition IntrinsicInst.h:785

llvm::MinMaxIntrinsic::getPredicate
ICmpInst::Predicate getPredicate() const
Returns the comparison predicate underlying the intrinsic.
Definition IntrinsicInst.h:801

llvm::MinMaxIntrinsic::isSigned
bool isSigned() const
Whether the intrinsic is signed or unsigned.
Definition IntrinsicInst.h:811

llvm::Module
A Module instance is used to store all the information related to an LLVM module.
Definition Module.h:67

llvm::Module::getName
StringRef getName() const
Get a short "name" for the module.
Definition Module.h:269

llvm::Operator::getOpcode
unsigned getOpcode() const
Return the opcode for this Instruction or ConstantExpr.
Definition Operator.h:43

llvm::OverflowingBinaryOperator
Utility class for integer operators which may exhibit overflow - Add, Sub, Mul, and Shl.
Definition Operator.h:78

llvm::OverflowingBinaryOperator::hasNoSignedWrap
bool hasNoSignedWrap() const
Test whether this operation is known to never undergo signed overflow, aka the nsw property.
Definition Operator.h:111

llvm::OverflowingBinaryOperator::hasNoUnsignedWrap
bool hasNoUnsignedWrap() const
Test whether this operation is known to never undergo unsigned overflow, aka the nuw property.
Definition Operator.h:105

llvm::OverflowingBinaryOperator::isCommutative
bool isCommutative() const
Return true if the instruction is commutative.
Definition Operator.h:128

llvm::PHINode
Definition Instructions.h:2639

llvm::PoisonValue::get
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return a 'poison' object of the specified type.
Definition Constants.cpp:1888

llvm::SaturatingInst
Represents a saturating add/sub intrinsic.
Definition IntrinsicInst.h:971

llvm::SelectInst
This class represents the LLVM 'select' instruction.
Definition Instructions.h:1690

llvm::SelectInst::Create
static SelectInst * Create(Value *C, Value *S1, Value *S2, const Twine &NameStr="", InsertPosition InsertBefore=nullptr, const Instruction *MDFrom=nullptr)
Definition Instructions.h:1715

llvm::ShuffleVectorInst
This instruction constructs a fixed permutation of two input vectors.
Definition Instructions.h:1935

llvm::SmallBitVector
This is a 'bitvector' (really, a variable-sized bit array), optimized for the case when the array is ...
Definition SmallBitVector.h:35

llvm::SmallBitVector::set
SmallBitVector & set()
Definition SmallBitVector.h:366

llvm::SmallBitVector::test
bool test(unsigned Idx) const
Definition SmallBitVector.h:474

llvm::SmallBitVector::all
bool all() const
Returns true if all bits are set.
Definition SmallBitVector.h:216

llvm::SmallPtrSetImplBase::size
size_type size() const
Definition SmallPtrSet.h:99

llvm::SmallPtrSetImpl::count
size_type count(ConstPtrType Ptr) const
count - Return 1 if the specified pointer is in the set, 0 otherwise.
Definition SmallPtrSet.h:455

llvm::SmallPtrSetImpl::insert
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
Definition SmallPtrSet.h:389

llvm::SmallVectorImpl::emplace_back
reference emplace_back(ArgTypes &&... Args)
Definition SmallVector.h:944

llvm::SmallVectorImpl::reserve
void reserve(size_type N)
Definition SmallVector.h:664

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition SmallVector.h:417

llvm::SmallVectorTemplateCommon::size
size_t size() const
Definition SmallVector.h:80

llvm::SmallVectorTemplateCommon::empty
bool empty() const
Definition SmallVector.h:83

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition SmallVector.h:1203

llvm::StoreInst
An instruction for storing to memory.
Definition Instructions.h:297

llvm::StoreInst::setVolatile
void setVolatile(bool V)
Specify whether this is a volatile store or not.
Definition Instructions.h:334

llvm::StoreInst::setAlignment
void setAlignment(Align Align)
Definition Instructions.h:343

llvm::StoreInst::setOrdering
void setOrdering(AtomicOrdering Ordering)
Sets the ordering constraint of this store instruction.
Definition Instructions.h:354

llvm::StructType
Class to represent struct types.
Definition DerivedTypes.h:218

llvm::TargetLibraryInfoImpl::isCallingConvCCompatible
static LLVM_ABI bool isCallingConvCCompatible(CallBase *CI)
Returns true if call site / callee has cdecl-compatible calling conventions.
Definition TargetLibraryInfo.cpp:152

llvm::TargetLibraryInfo
Provides information about what library functions are available for the current target.
Definition TargetLibraryInfo.h:285

llvm::TruncInst
This class represents a truncation of integer types.
Definition Instructions.h:4559

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45

llvm::Type::getInt64Ty
static LLVM_ABI IntegerType * getInt64Ty(LLVMContext &C)
Definition Type.cpp:298

llvm::Type::getIntegerBitWidth
LLVM_ABI unsigned getIntegerBitWidth() const
Definition DerivedTypes.h:99

llvm::Type::getInt32Ty
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
Definition Type.cpp:297

llvm::Type::isPointerTy
bool isPointerTy() const
True if this is an instance of PointerType.
Definition Type.h:267

llvm::Type::canLosslesslyBitCastTo
LLVM_ABI bool canLosslesslyBitCastTo(Type *Ty) const
Return true if this type could be converted with a lossless BitCast to type 'Ty'.
Definition Type.cpp:154

llvm::Type::getScalarType
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
Definition Type.h:352

llvm::Type::isStructTy
bool isStructTy() const
True if this is an instance of StructType.
Definition Type.h:261

llvm::Type::getWithNewBitWidth
LLVM_ABI Type * getWithNewBitWidth(unsigned NewBitWidth) const
Given an integer or vector type, change the lane bitwidth to NewBitWidth, whilst keeping the old numb...
Definition DerivedTypes.h:766

llvm::Type::getScalarSizeInBits
LLVM_ABI unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.
Definition Type.cpp:231

llvm::Type::isIntegerTy
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition Type.h:240

llvm::Type::isVoidTy
bool isVoidTy() const
Return true if this is 'void'.
Definition Type.h:139

llvm::UnaryOperator::CreateWithCopiedFlags
static UnaryOperator * CreateWithCopiedFlags(UnaryOps Opc, Value *V, Instruction *CopyO, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Definition InstrTypes.h:139

llvm::UnaryOperator::CreateFNegFMF
static UnaryOperator * CreateFNegFMF(Value *Op, Instruction *FMFSource, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Definition InstrTypes.h:147

llvm::UndefValue::get
static LLVM_ABI UndefValue * get(Type *T)
Static factory methods - Return an 'undef' object of the specified type.
Definition Constants.cpp:1869

llvm::Use
A Use represents the edge between a Value definition and its users.
Definition Use.h:35

llvm::Use::getOperandNo
LLVM_ABI unsigned getOperandNo() const
Return the operand # of this use in its User.
Definition Use.cpp:35

llvm::User
Definition User.h:44

llvm::User::setOperand
void setOperand(unsigned i, Value *Val)
Definition User.h:237

llvm::User::getOperand
Value * getOperand(unsigned i) const
Definition User.h:232

llvm::VAEndInst
This represents the llvm.va_end intrinsic.
Definition IntrinsicInst.h:1408

llvm::ValueHandleBase::ValueIsDeleted
static LLVM_ABI void ValueIsDeleted(Value *V)
Definition Value.cpp:1226

llvm::ValueHandleBase::ValueIsRAUWd
static LLVM_ABI void ValueIsRAUWd(Value *Old, Value *New)
Definition Value.cpp:1279

llvm::Value
LLVM Value Representation.
Definition Value.h:75

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:256

llvm::Value::MaximumAlignment
static constexpr uint64_t MaximumAlignment
Definition Value.h:830

llvm::Value::hasOneUse
bool hasOneUse() const
Return true if there is exactly one use of this value.
Definition Value.h:439

llvm::Value::users
iterator_range< user_iterator > users()
Definition Value.h:426

llvm::Value::dropDroppableUse
static LLVM_ABI void dropDroppableUse(Use &U)
Remove the droppable use U.
Definition Value.cpp:226

llvm::Value::stripPointerCasts
LLVM_ABI const Value * stripPointerCasts() const
Strip off pointer casts, all-zero GEPs and address space casts.
Definition Value.cpp:701

llvm::Value::use_empty
bool use_empty() const
Definition Value.h:346

llvm::Value::getContext
LLVM_ABI LLVMContext & getContext() const
All values hold a context through their type.
Definition Value.cpp:1099

llvm::Value::MaxAlignmentExponent
static constexpr unsigned MaxAlignmentExponent
The maximum alignment for instructions.
Definition Value.h:829

llvm::Value::getName
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
Definition Value.cpp:322

llvm::Value::takeName
LLVM_ABI void takeName(Value *V)
Transfer the name from V to this value.
Definition Value.cpp:396

llvm::VectorType
Base class of all SIMD vector types.
Definition DerivedTypes.h:430

llvm::VectorType::getElementCount
ElementCount getElementCount() const
Return an ElementCount instance to represent the (possibly scalable) number of elements in the vector...
Definition DerivedTypes.h:697

llvm::VectorType::get
static LLVM_ABI VectorType * get(Type *ElementType, ElementCount EC)
This static method is the primary way to construct a VectorType.

llvm::cl::opt
Definition CommandLine.h:1455

llvm::details::FixedOrScalableQuantity::getFixedValue
constexpr ScalarTy getFixedValue() const
Definition TypeSize.h:201

llvm::details::FixedOrScalableQuantity< ElementCount, unsigned >::isKnownLT
static constexpr bool isKnownLT(const FixedOrScalableQuantity &LHS, const FixedOrScalableQuantity &RHS)
Definition TypeSize.h:217

llvm::details::FixedOrScalableQuantity::isFixed
constexpr bool isFixed() const
Returns true if the quantity is not scaled by vscale.
Definition TypeSize.h:172

llvm::details::FixedOrScalableQuantity< ElementCount, unsigned >::isKnownGT
static constexpr bool isKnownGT(const FixedOrScalableQuantity &LHS, const FixedOrScalableQuantity &RHS)
Definition TypeSize.h:224

llvm::ilist_detail::node_parent_access::getParent
const ParentTy * getParent() const
Definition ilist_node.h:34

llvm::ilist_node_impl::getIterator
self_iterator getIterator()
Definition ilist_node.h:123

llvm::ilist_node_with_parent::getPrevNode
NodeTy * getPrevNode()
Definition ilist_node.h:334

llvm::ilist_node_with_parent::getNextNode
NodeTy * getNextNode()
Get the next node, or nullptr for the list tail.
Definition ilist_node.h:348

uint32_t

uint64_t

unsigned

Call
CallInst * Call
Definition ObjCARCOpts.cpp:2359

Changed
Changed
Definition ObjCARCOpts.cpp:2369

DebugInfo.h

ErrorHandling.h

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition ErrorHandling.h:164

llvm::AArch64PACKey::IA
@ IA
Definition AArch64BaseInfo.h:953

llvm::AMDGPU::HSAMD::Kernel::Arg::Key::Align
constexpr char Align[]
Key for Kernel::Arg::Metadata::mAlign.
Definition AMDGPUMetadata.h:183

llvm::AMDGPU::HSAMD::Kernel::Key::Args
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
Definition AMDGPUMetadata.h:396

llvm::AMDGPU::HSAMD::Kernel::Key::Attrs
constexpr char Attrs[]
Key for Kernel::Metadata::mAttrs.
Definition AMDGPUMetadata.h:394

llvm::BitmaskEnumDetail::Mask
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
Definition BitmaskEnum.h:127

llvm::CallingConv::ID
unsigned ID
LLVM IR allows arbitrary numbers to be used as calling convention identifiers.
Definition CallingConv.h:24

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34

llvm::ISD::BasicBlock
@ BasicBlock
Various leaf nodes.
Definition ISDOpcodes.h:81

llvm::ISD::Constant
@ Constant
Definition ISDOpcodes.h:86

llvm::Intrinsic::getOrInsertDeclaration
LLVM_ABI Function * getOrInsertDeclaration(Module *M, ID id, ArrayRef< Type * > Tys={})
Look up the Function declaration of the intrinsic id in the Module M.
Definition Intrinsics.cpp:723

llvm::Intrinsic::ID
unsigned ID
Definition GenericSSAContext.h:28

llvm::M68k::MemAddrModeKind::U
@ U
Definition M68kBaseInfo.h:61

llvm::M68k::MemAddrModeKind::V
@ V
Definition M68kBaseInfo.h:63

llvm::M68k::MemAddrModeKind::L
@ L
Definition M68kBaseInfo.h:70

llvm::MIPatternMatch::m_ZeroInt
SpecificConstantMatch m_ZeroInt()
Convenience matchers for specific integer values.
Definition MIPatternMatch.h:278

llvm::MIPatternMatch::m_Neg
BinaryOp_match< SpecificConstantMatch, SrcTy, TargetOpcode::G_SUB > m_Neg(const SrcTy &&Src)
Matches a register negated by a G_SUB.
Definition MIPatternMatch.h:929

llvm::MIPatternMatch::m_Not
BinaryOp_match< SrcTy, SpecificConstantMatch, TargetOpcode::G_XOR, true > m_Not(const SrcTy &&Src)
Matches a register not-ed by a G_XOR.
Definition MIPatternMatch.h:937

llvm::MIPatternMatch::m_OneUse
OneUse_match< SubPat > m_OneUse(const SubPat &SP)
Definition MIPatternMatch.h:56

llvm::PatternMatch
Definition PatternMatch.h:47

llvm::PatternMatch::m_AllOnes
cst_pred_ty< is_all_ones > m_AllOnes()
Match an integer or vector with all bits set.
Definition PatternMatch.h:536

llvm::PatternMatch::m_Poison
class_match< PoisonValue > m_Poison()
Match an arbitrary poison constant.
Definition PatternMatch.h:173

llvm::PatternMatch::m_And
BinaryOp_match< LHS, RHS, Instruction::And > m_And(const LHS &L, const RHS &R)
Definition PatternMatch.h:1308

llvm::PatternMatch::m_Add
BinaryOp_match< LHS, RHS, Instruction::Add > m_Add(const LHS &L, const RHS &R)
Definition PatternMatch.h:1194

llvm::PatternMatch::m_BinOp
class_match< BinaryOperator > m_BinOp()
Match an arbitrary binary operation and ignore it.
Definition PatternMatch.h:113

llvm::PatternMatch::m_PtrToIntOrAddr
auto m_PtrToIntOrAddr(const OpTy &Op)
Matches PtrToInt or PtrToAddr.
Definition PatternMatch.h:2215

llvm::PatternMatch::m_BitReverse
m_Intrinsic_Ty< Opnd0 >::Ty m_BitReverse(const Opnd0 &Op0)
Definition PatternMatch.h:2865

llvm::PatternMatch::m_Constant
class_match< Constant > m_Constant()
Match an arbitrary Constant and ignore it.
Definition PatternMatch.h:178

llvm::PatternMatch::m_APInt
ap_match< APInt > m_APInt(const APInt *&Res)
Match a ConstantInt or splatted ConstantVector, binding the specified pointer to the contained APInt.
Definition PatternMatch.h:311

llvm::PatternMatch::m_c_And
BinaryOp_match< LHS, RHS, Instruction::And, true > m_c_And(const LHS &L, const RHS &R)
Matches an And with LHS and RHS in either order.
Definition PatternMatch.h:3001

llvm::PatternMatch::m_Trunc
CastInst_match< OpTy, TruncInst > m_Trunc(const OpTy &Op)
Matches Trunc.
Definition PatternMatch.h:2235

llvm::PatternMatch::m_Xor
BinaryOp_match< LHS, RHS, Instruction::Xor > m_Xor(const LHS &L, const RHS &R)
Definition PatternMatch.h:1320

llvm::PatternMatch::m_APIntAllowPoison
ap_match< APInt > m_APIntAllowPoison(const APInt *&Res)
Match APInt while allowing poison in splat vector constants.
Definition PatternMatch.h:317

llvm::PatternMatch::m_NSWSub
OverflowingBinaryOp_match< LHS, RHS, Instruction::Sub, OverflowingBinaryOperator::NoSignedWrap > m_NSWSub(const LHS &L, const RHS &R)
Definition PatternMatch.h:1428

llvm::PatternMatch::m_SpecificInt
specific_intval< false > m_SpecificInt(const APInt &V)
Match a specific integer value or vector with all elements equal to the value.
Definition PatternMatch.h:1072

llvm::PatternMatch::match
bool match(Val *V, const Pattern &P)
Definition PatternMatch.h:49

llvm::PatternMatch::m_Instruction
bind_ty< Instruction > m_Instruction(Instruction *&I)
Match an instruction, capturing it if we match.
Definition PatternMatch.h:874

llvm::PatternMatch::m_Specific
specificval_ty m_Specific(const Value *V)
Match if we have a specific specified value.
Definition PatternMatch.h:974

llvm::PatternMatch::m_APFloat
ap_match< APFloat > m_APFloat(const APFloat *&Res)
Match a ConstantFP or splatted ConstantVector, binding the specified pointer to the contained APFloat...
Definition PatternMatch.h:328

llvm::PatternMatch::m_NSWNeg
OverflowingBinaryOp_match< cst_pred_ty< is_zero_int >, ValTy, Instruction::Sub, OverflowingBinaryOperator::NoSignedWrap > m_NSWNeg(const ValTy &V)
Matches a 'Neg' as 'sub nsw 0, V'.
Definition PatternMatch.h:3032

llvm::PatternMatch::m_ConstantInt
class_match< ConstantInt > m_ConstantInt()
Match an arbitrary ConstantInt and ignore it.
Definition PatternMatch.h:181

llvm::PatternMatch::m_One
cst_pred_ty< is_one > m_One()
Match an integer 1 or a vector with all elements equal to 1.
Definition PatternMatch.h:604

llvm::PatternMatch::m_Intrinsic
IntrinsicID_match m_Intrinsic()
Match intrinsic calls like this: m_Intrinsic<Intrinsic::fabs>(m_Value(X))
Definition PatternMatch.h:2796

llvm::PatternMatch::m_Select
ThreeOps_match< Cond, LHS, RHS, Instruction::Select > m_Select(const Cond &C, const LHS &L, const RHS &R)
Matches SelectInst.
Definition PatternMatch.h:1940

llvm::PatternMatch::m_NegZeroFP
cstfp_pred_ty< is_neg_zero_fp > m_NegZeroFP()
Match a floating-point negative zero.
Definition PatternMatch.h:796

llvm::PatternMatch::m_SpecificFP
specific_fpval m_SpecificFP(double V)
Match a specific floating point value or vector with all elements equal to the value.
Definition PatternMatch.h:1017

llvm::PatternMatch::m_ExtractValue
ExtractValue_match< Ind, Val_t > m_ExtractValue(const Val_t &V)
Match a single index ExtractValue instruction.
Definition PatternMatch.h:3153

llvm::PatternMatch::m_LogicalShift
BinOpPred_match< LHS, RHS, is_logical_shift_op > m_LogicalShift(const LHS &L, const RHS &R)
Matches logical shift operations.
Definition PatternMatch.h:1672

llvm::PatternMatch::m_CombineAnd
match_combine_and< LTy, RTy > m_CombineAnd(const LTy &L, const RTy &R)
Combine two pattern matchers matching L && R.
Definition PatternMatch.h:278

llvm::PatternMatch::m_SMin
MaxMin_match< ICmpInst, LHS, RHS, smin_pred_ty > m_SMin(const LHS &L, const RHS &R)
Definition PatternMatch.h:2516

llvm::PatternMatch::m_c_Xor
BinaryOp_match< LHS, RHS, Instruction::Xor, true > m_c_Xor(const LHS &L, const RHS &R)
Matches an Xor with LHS and RHS in either order.
Definition PatternMatch.h:3015

llvm::PatternMatch::m_Deferred
deferredval_ty< Value > m_Deferred(Value *const &V)
Like m_Specific(), but works if the specific value to match is determined as part of the same match()...
Definition PatternMatch.h:992

llvm::PatternMatch::m_ZExtOrSExtOrSelf
match_combine_or< match_combine_or< CastInst_match< OpTy, ZExtInst >, CastInst_match< OpTy, SExtInst > >, OpTy > m_ZExtOrSExtOrSelf(const OpTy &Op)
Definition PatternMatch.h:2306

llvm::PatternMatch::m_LogicalOr
auto m_LogicalOr()
Matches L || R where L and R are arbitrary values.
Definition PatternMatch.h:3275

llvm::PatternMatch::m_Shuffle
TwoOps_match< V1_t, V2_t, Instruction::ShuffleVector > m_Shuffle(const V1_t &v1, const V2_t &v2)
Matches ShuffleVectorInst independently of mask value.
Definition PatternMatch.h:2052

llvm::PatternMatch::m_StrictlyPositive
cst_pred_ty< is_strictlypositive > m_StrictlyPositive()
Match an integer or vector of strictly positive values.
Definition PatternMatch.h:582

llvm::PatternMatch::m_c_Select
ThreeOps_match< decltype(m_Value()), LHS, RHS, Instruction::Select, true > m_c_Select(const LHS &L, const RHS &R)
Match Select(C, LHS, RHS) or Select(C, RHS, LHS)
Definition PatternMatch.h:1956

llvm::PatternMatch::m_FPExt
CastInst_match< OpTy, FPExtInst > m_FPExt(const OpTy &Op)
Definition PatternMatch.h:2344

llvm::PatternMatch::m_SpecificICmp
SpecificCmpClass_match< LHS, RHS, ICmpInst > m_SpecificICmp(CmpPredicate MatchPred, const LHS &L, const RHS &R)
Definition PatternMatch.h:1829

llvm::PatternMatch::m_ZExt
CastInst_match< OpTy, ZExtInst > m_ZExt(const OpTy &Op)
Matches ZExt.
Definition PatternMatch.h:2267

llvm::PatternMatch::m_NUWShl
OverflowingBinaryOp_match< LHS, RHS, Instruction::Shl, OverflowingBinaryOperator::NoUnsignedWrap > m_NUWShl(const LHS &L, const RHS &R)
Definition PatternMatch.h:1487

llvm::PatternMatch::m_NUWMul
OverflowingBinaryOp_match< LHS, RHS, Instruction::Mul, OverflowingBinaryOperator::NoUnsignedWrap > m_NUWMul(const LHS &L, const RHS &R)
Definition PatternMatch.h:1479

llvm::PatternMatch::m_UMax
MaxMin_match< ICmpInst, LHS, RHS, umax_pred_ty > m_UMax(const LHS &L, const RHS &R)
Definition PatternMatch.h:2522

llvm::PatternMatch::m_NegatedPower2
cst_pred_ty< is_negated_power2 > m_NegatedPower2()
Match an integer or vector negated power-of-2.
Definition PatternMatch.h:639

llvm::PatternMatch::m_ImmConstant
match_immconstant_ty m_ImmConstant()
Match an arbitrary immediate Constant and ignore it.
Definition PatternMatch.h:943

llvm::PatternMatch::m_CheckedInt
cst_pred_ty< custom_checkfn< APInt > > m_CheckedInt(function_ref< bool(const APInt &)> CheckFn)
Match an integer or vector where CheckFn(ele) for each element is true.
Definition PatternMatch.h:493

llvm::PatternMatch::m_FShl
m_Intrinsic_Ty< Opnd0, Opnd1, Opnd2 >::Ty m_FShl(const Opnd0 &Op0, const Opnd1 &Op1, const Opnd2 &Op2)
Definition PatternMatch.h:2922

llvm::PatternMatch::m_c_MaxOrMin
match_combine_or< match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, smax_pred_ty, true >, MaxMin_match< ICmpInst, LHS, RHS, smin_pred_ty, true > >, match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, umax_pred_ty, true >, MaxMin_match< ICmpInst, LHS, RHS, umin_pred_ty, true > > > m_c_MaxOrMin(const LHS &L, const RHS &R)
Definition PatternMatch.h:3067

llvm::PatternMatch::m_UnOp
class_match< UnaryOperator > m_UnOp()
Match an arbitrary unary operation and ignore it.
Definition PatternMatch.h:108

llvm::PatternMatch::m_NUWSub
OverflowingBinaryOp_match< LHS, RHS, Instruction::Sub, OverflowingBinaryOperator::NoUnsignedWrap > m_NUWSub(const LHS &L, const RHS &R)
Definition PatternMatch.h:1471

llvm::PatternMatch::m_SMax
MaxMin_match< ICmpInst, LHS, RHS, smax_pred_ty > m_SMax(const LHS &L, const RHS &R)
Definition PatternMatch.h:2510

llvm::PatternMatch::m_NSWAddLike
match_combine_or< OverflowingBinaryOp_match< LHS, RHS, Instruction::Add, OverflowingBinaryOperator::NoSignedWrap >, DisjointOr_match< LHS, RHS > > m_NSWAddLike(const LHS &L, const RHS &R)
Match either "add nsw" or "or disjoint".
Definition PatternMatch.h:1558

llvm::PatternMatch::m_Value
class_match< Value > m_Value()
Match an arbitrary value and ignore it.
Definition PatternMatch.h:105

llvm::PatternMatch::m_LShr
BinaryOp_match< LHS, RHS, Instruction::LShr > m_LShr(const LHS &L, const RHS &R)
Definition PatternMatch.h:1332

llvm::PatternMatch::m_Exact
Exact_match< T > m_Exact(const T &SubPattern)
Definition PatternMatch.h:1719

llvm::PatternMatch::m_FNeg
FNeg_match< OpTy > m_FNeg(const OpTy &X)
Match 'fneg X' as 'fsub -0.0, X'.
Definition PatternMatch.h:1248

llvm::PatternMatch::m_Shift
BinOpPred_match< LHS, RHS, is_shift_op > m_Shift(const LHS &L, const RHS &R)
Matches shift operations.
Definition PatternMatch.h:1657

llvm::PatternMatch::m_PosZeroFP
cstfp_pred_ty< is_pos_zero_fp > m_PosZeroFP()
Match a floating-point positive zero.
Definition PatternMatch.h:787

llvm::PatternMatch::m_Shl
BinaryOp_match< LHS, RHS, Instruction::Shl > m_Shl(const LHS &L, const RHS &R)
Definition PatternMatch.h:1326

llvm::PatternMatch::m_VecReverse
m_Intrinsic_Ty< Opnd0 >::Ty m_VecReverse(const Opnd0 &Op0)
Definition PatternMatch.h:2944

llvm::PatternMatch::m_LogicalAnd
auto m_LogicalAnd()
Matches L && R where L and R are arbitrary values.
Definition PatternMatch.h:3257

llvm::PatternMatch::m_MaxOrMin
match_combine_or< match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, smax_pred_ty >, MaxMin_match< ICmpInst, LHS, RHS, smin_pred_ty > >, match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, umax_pred_ty >, MaxMin_match< ICmpInst, LHS, RHS, umin_pred_ty > > > m_MaxOrMin(const LHS &L, const RHS &R)
Definition PatternMatch.h:2539

llvm::PatternMatch::m_FShr
m_Intrinsic_Ty< Opnd0, Opnd1, Opnd2 >::Ty m_FShr(const Opnd0 &Op0, const Opnd1 &Op1, const Opnd2 &Op2)
Definition PatternMatch.h:2928

llvm::PatternMatch::m_SRem
BinaryOp_match< LHS, RHS, Instruction::SRem > m_SRem(const LHS &L, const RHS &R)
Definition PatternMatch.h:1296

llvm::PatternMatch::m_Undef
auto m_Undef()
Match an arbitrary undef constant.
Definition PatternMatch.h:165

llvm::PatternMatch::m_BSwap
m_Intrinsic_Ty< Opnd0 >::Ty m_BSwap(const Opnd0 &Op0)
Definition PatternMatch.h:2870

llvm::PatternMatch::m_SExt
CastInst_match< OpTy, SExtInst > m_SExt(const OpTy &Op)
Matches SExt.
Definition PatternMatch.h:2261

llvm::PatternMatch::m_Zero
is_zero m_Zero()
Match any null constant or a vector with all elements equal to 0.
Definition PatternMatch.h:624

llvm::PatternMatch::m_c_Or
BinaryOp_match< LHS, RHS, Instruction::Or, true > m_c_Or(const LHS &L, const RHS &R)
Matches an Or with LHS and RHS in either order.
Definition PatternMatch.h:3008

llvm::PatternMatch::m_NUWAddLike
match_combine_or< OverflowingBinaryOp_match< LHS, RHS, Instruction::Add, OverflowingBinaryOperator::NoUnsignedWrap >, DisjointOr_match< LHS, RHS > > m_NUWAddLike(const LHS &L, const RHS &R)
Match either "add nuw" or "or disjoint".
Definition PatternMatch.h:1568

llvm::PatternMatch::m_BitwiseLogic
BinOpPred_match< LHS, RHS, is_bitwiselogic_op > m_BitwiseLogic(const LHS &L, const RHS &R)
Matches bitwise logic operations.
Definition PatternMatch.h:1679

llvm::PatternMatch::m_FAbs
m_Intrinsic_Ty< Opnd0 >::Ty m_FAbs(const Opnd0 &Op0)
Definition PatternMatch.h:2875

llvm::PatternMatch::m_c_Mul
BinaryOp_match< LHS, RHS, Instruction::Mul, true > m_c_Mul(const LHS &L, const RHS &R)
Matches a Mul with LHS and RHS in either order.
Definition PatternMatch.h:2994

llvm::PatternMatch::m_CopySign
m_Intrinsic_Ty< Opnd0, Opnd1 >::Ty m_CopySign(const Opnd0 &Op0, const Opnd1 &Op1)
Definition PatternMatch.h:2938

llvm::PatternMatch::match_fn
MatchFunctor< Val, Pattern > match_fn(const Pattern &P)
A match functor that can be used as a UnaryPredicate in functional algorithms like all_of.
Definition PatternMatch.h:62

llvm::PatternMatch::m_UMin
MaxMin_match< ICmpInst, LHS, RHS, umin_pred_ty > m_UMin(const LHS &L, const RHS &R)
Definition PatternMatch.h:2528

llvm::PatternMatch::m_CombineOr
match_combine_or< LTy, RTy > m_CombineOr(const LTy &L, const RTy &R)
Combine two pattern matchers matching L || R.
Definition PatternMatch.h:272

llvm::SI
Definition SIInstrInfo.h:1805

llvm::SyncScope::SingleThread
@ SingleThread
Synchronized with respect to signal handlers executing in the same thread.
Definition LLVMContext.h:55

llvm::SyncScope::System
@ System
Synchronized with respect to all concurrently executing threads.
Definition LLVMContext.h:58

llvm::X86::FirstMacroFusionInstKind::AddSub
@ AddSub
Definition X86BaseInfo.h:111

llvm::at::getDVRAssignmentMarkers
SmallVector< DbgVariableRecord * > getDVRAssignmentMarkers(const Instruction *Inst)
Return a range of dbg_assign records for which Inst performs the assignment they encode.
Definition DebugInfo.h:193

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition CommandLine.h:445

llvm::codeview::EncodedFramePtrReg::BasePtr
@ BasePtr
Definition CodeView.h:528

llvm::codeview::PublicSymFlags::Function
@ Function
Definition CodeView.h:409

llvm::logicalview::LVAttributeKind::Inserted
@ Inserted
Definition LVOptions.h:109

llvm::logicalview::LVAttributeKind::Discriminator
@ Discriminator
Definition LVOptions.h:100

llvm::logicalview::LVAttributeKind::Zero
@ Zero
Definition LVOptions.h:130

llvm::mdconst::extract
std::enable_if_t< detail::IsValidPointer< X, Y >::value, X * > extract(Y &&MD)
Extract a Value from Metadata.
Definition Metadata.h:667

llvm::ms_demangle::QualifierMangleMode::Result
@ Result
Definition MicrosoftDemangle.h:132

llvm::numbers::e
constexpr double e
Definition STLForwardCompat.h:61

llvm::ore::NV
DiagnosticInfoOptimizationBase::Argument NV
Definition OptimizationRemarkEmitter.h:139

llvm::pdb::PDB_SymType::Caller
@ Caller
Definition PDBTypes.h:281

llvm::pdb::PDB_SymType::VectorType
@ VectorType
Definition PDBTypes.h:278

llvm::pdb::PDB_SymType::Callee
@ Callee
Definition PDBTypes.h:282

llvm::sandboxir::Instruction
friend class Instruction
Iterator for Instructions in a `BasicBlock`.
Definition BasicBlock.h:73

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition AddressRanges.h:18

llvm::EnableKnowledgeRetention
LLVM_ABI cl::opt< bool > EnableKnowledgeRetention

llvm::getInverseMinMaxIntrinsic
LLVM_ABI Intrinsic::ID getInverseMinMaxIntrinsic(Intrinsic::ID MinMaxID)
Definition ValueTracking.cpp:9027

llvm::Log2_32_Ceil
unsigned Log2_32_Ceil(uint32_t Value)
Return the ceil log base 2 of the specified value, 32 if the value is zero.
Definition MathExtras.h:344

llvm::Offset
@ Offset
Definition DWP.cpp:477

llvm::Value
FunctionAddr VTableAddr Value
Definition InstrProf.h:137

llvm::OverflowResult
OverflowResult
Definition ValueTracking.h:622

llvm::OverflowResult::NeverOverflows
@ NeverOverflows
Never overflows.
Definition ValueTracking.h:630

llvm::OverflowResult::AlwaysOverflowsHigh
@ AlwaysOverflowsHigh
Always overflows in the direction of signed/unsigned max value.
Definition ValueTracking.h:626

llvm::OverflowResult::AlwaysOverflowsLow
@ AlwaysOverflowsLow
Always overflows in the direction of signed/unsigned min value.
Definition ValueTracking.h:624

llvm::OverflowResult::MayOverflow
@ MayOverflow
May or may not overflow.
Definition ValueTracking.h:628

llvm::simplifyFMulInst
LLVM_ABI Value * simplifyFMulInst(Value *LHS, Value *RHS, FastMathFlags FMF, const SimplifyQuery &Q, fp::ExceptionBehavior ExBehavior=fp::ebIgnore, RoundingMode Rounding=RoundingMode::NearestTiesToEven)
Given operands for an FMul, fold the result or return null.
Definition InstructionSimplify.cpp:6043

llvm::isValidAssumeForContext
LLVM_ABI bool isValidAssumeForContext(const Instruction *I, const Instruction *CxtI, const DominatorTree *DT=nullptr, bool AllowEphemerals=false)
Return true if it is valid to use the assumptions provided by an assume intrinsic,...
Definition ValueTracking.cpp:518

llvm::TailFoldingOpts::Reverse
@ Reverse
Definition AArch64BaseInfo.h:619

llvm::possiblyDemandedEltsInMask
LLVM_ABI APInt possiblyDemandedEltsInMask(Value *Mask)
Given a mask vector of the form <Y x i1>, return an APInt (of bitwidth Y) for each lane which may be ...
Definition VectorUtils.cpp:1335

llvm::simplifyRetainedKnowledge
LLVM_ABI RetainedKnowledge simplifyRetainedKnowledge(AssumeInst *Assume, RetainedKnowledge RK, AssumptionCache *AC, DominatorTree *DT)
Canonicalize the RetainedKnowledge RK.
Definition AssumeBundleBuilder.cpp:318

llvm::dyn_cast
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643

llvm::isRemovableAlloc
LLVM_ABI bool isRemovableAlloc(const CallBase *V, const TargetLibraryInfo *TLI)
Return true if this is a call to an allocation function that does not have side effects that we are r...
Definition MemoryBuiltins.cpp:330

llvm::lowerObjectSizeCall
LLVM_ABI Value * lowerObjectSizeCall(IntrinsicInst *ObjectSize, const DataLayout &DL, const TargetLibraryInfo *TLI, bool MustSucceed)
Try to turn a call to @llvm.objectsize into an integer value of the given Type.
Definition MemoryBuiltins.cpp:645

llvm::getAllocAlignment
LLVM_ABI Value * getAllocAlignment(const CallBase *V, const TargetLibraryInfo *TLI)
Gets the alignment argument for an aligned_alloc-like function, using either built-in knowledge based...
Definition MemoryBuiltins.cpp:341

llvm::getKnowledgeFromOperandInAssume
LLVM_ABI RetainedKnowledge getKnowledgeFromOperandInAssume(AssumeInst &Assume, unsigned Idx)
Retrieve the information held by Assume on the operand at index Idx.
Definition AssumeBundleQueries.cpp:126

llvm::maximum
LLVM_READONLY APFloat maximum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 maximum semantics.
Definition APFloat.h:1625

llvm::simplifyCall
LLVM_ABI Value * simplifyCall(CallBase *Call, Value *Callee, ArrayRef< Value * > Args, const SimplifyQuery &Q)
Given a callsite, callee, and arguments, fold the result or return null.
Definition InstructionSimplify.cpp:7278

llvm::ConstantFoldCompareInstOperands
LLVM_ABI Constant * ConstantFoldCompareInstOperands(unsigned Predicate, Constant *LHS, Constant *RHS, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, const Instruction *I=nullptr)
Attempt to constant fold a compare instruction (icmp/fcmp) with the specified operands.
Definition ConstantFolding.cpp:1199

llvm::alignDown
constexpr T alignDown(U Value, V Align, W Skew=0)
Returns the largest unsigned integer less than or equal to Value and is Skew mod Align.
Definition MathExtras.h:546

llvm::isPowerOf2_64
constexpr bool isPowerOf2_64(uint64_t Value)
Return true if the argument is a power of two > 0 (64 bit edition.)
Definition MathExtras.h:284

llvm::isAssumeWithEmptyBundle
LLVM_ABI bool isAssumeWithEmptyBundle(const AssumeInst &Assume)
Return true iff the operand bundles of the provided llvm.assume don't contain any valuable informat...
Definition AssumeBundleQueries.cpp:132

llvm::isSafeToSpeculativelyExecute
LLVM_ABI bool isSafeToSpeculativelyExecute(const Instruction *I, const Instruction *CtxI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr, const TargetLibraryInfo *TLI=nullptr, bool UseVariableInfo=true, bool IgnoreUBImplyingAttrs=true)
Return true if the instruction does not have any effects besides calculating the result and does not ...
Definition ValueTracking.cpp:6958

llvm::getSplatValue
LLVM_ABI Value * getSplatValue(const Value *V)
Get splat value if the input is a splat vector or return nullptr.
Definition VectorUtils.cpp:391

llvm::MinAlign
constexpr T MinAlign(U A, V B)
A and B are either alignments or offsets.
Definition MathExtras.h:357

llvm::getKnowledgeFromBundle
LLVM_ABI RetainedKnowledge getKnowledgeFromBundle(AssumeInst &Assume, const CallBase::BundleOpInfo &BOI)
This extracts the Knowledge from an element of an operand bundle.
Definition AssumeBundleQueries.cpp:100

llvm::dyn_cast_or_null
auto dyn_cast_or_null(const Y &Val)
Definition Casting.h:753

llvm::getKnownAlignment
Align getKnownAlignment(Value *V, const DataLayout &DL, const Instruction *CxtI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr)
Try to infer an alignment for the specified pointer.
Definition Local.h:252

llvm::isSplatValue
LLVM_ABI bool isSplatValue(const Value *V, int Index=-1, unsigned Depth=0)
Return true if each element of the vector value V is poisoned or equal to every other non-poisoned el...
Definition VectorUtils.cpp:406

llvm::maxnum
LLVM_READONLY APFloat maxnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2008 maxNum semantics.
Definition APFloat.h:1580

llvm::HexPrintStyle::Upper
@ Upper
Definition NativeFormatting.h:23

llvm::HexPrintStyle::Lower
@ Lower
Definition NativeFormatting.h:23

llvm::fneg
LLVM_ABI FPClassTest fneg(FPClassTest Mask)
Return the test mask which returns true if the value's sign bit is flipped.
Definition FloatingPointMode.cpp:14

llvm::SelectPatternFlavor
SelectPatternFlavor
Specific patterns of select instructions we can match.
Definition ValueTracking.h:834

llvm::SPF_ABS
@ SPF_ABS
Absolute value.
Definition ValueTracking.h:842

llvm::SPF_NABS
@ SPF_NABS
Negated absolute value.
Definition ValueTracking.h:843

llvm::getLosslessUnsignedTrunc
LLVM_ABI Constant * getLosslessUnsignedTrunc(Constant *C, Type *DestTy, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
Definition ConstantFolding.cpp:4706

llvm::isPowerOf2_32
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition MathExtras.h:279

llvm::isModSet
bool isModSet(const ModRefInfo MRI)
Definition ModRef.h:49

llvm::ComplexDeinterleavingOperation::Splat
@ Splat
Definition ComplexDeinterleavingPass.h:42

llvm::FPClassTest
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
Definition FloatingPointMode.h:240

llvm::fcInf
@ fcInf
Definition FloatingPointMode.h:255

llvm::fcNegSubnormal
@ fcNegSubnormal
Definition FloatingPointMode.h:247

llvm::fcPosNormal
@ fcPosNormal
Definition FloatingPointMode.h:251

llvm::fcNegZero
@ fcNegZero
Definition FloatingPointMode.h:248

llvm::fcNegInf
@ fcNegInf
Definition FloatingPointMode.h:245

llvm::fcSubnormal
@ fcSubnormal
Definition FloatingPointMode.h:257

llvm::fcNone
@ fcNone
Definition FloatingPointMode.h:241

llvm::fcPositive
@ fcPositive
Definition FloatingPointMode.h:262

llvm::fcPosZero
@ fcPosZero
Definition FloatingPointMode.h:249

llvm::fcNegNormal
@ fcNegNormal
Definition FloatingPointMode.h:246

llvm::fcZero
@ fcZero
Definition FloatingPointMode.h:258

llvm::fcNegative
@ fcNegative
Definition FloatingPointMode.h:263

llvm::fcAllFlags
@ fcAllFlags
Definition FloatingPointMode.h:265

llvm::fcPosSubnormal
@ fcPosSubnormal
Definition FloatingPointMode.h:250

llvm::fcPosInf
@ fcPosInf
Definition FloatingPointMode.h:252

llvm::fcNan
@ fcNan
Definition FloatingPointMode.h:254

llvm::computeKnownBits
LLVM_ABI void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOn...
Definition ValueTracking.cpp:152

llvm::None
@ None
Definition CodeGenData.h:107

llvm::matchSelectPattern
LLVM_ABI SelectPatternResult matchSelectPattern(Value *V, Value *&LHS, Value *&RHS, Instruction::CastOps *CastOp=nullptr, unsigned Depth=0)
Pattern match integer [SU]MIN, [SU]MAX and ABS idioms, returning the kind and providing the out param...
Definition ValueTracking.cpp:8933

llvm::matchSimpleBinaryIntrinsicRecurrence
LLVM_ABI bool matchSimpleBinaryIntrinsicRecurrence(const IntrinsicInst *I, PHINode *&P, Value *&Init, Value *&OtherOp)
Attempt to match a simple value-accumulating recurrence of the form: llvm.intrinsic....
Definition ValueTracking.cpp:9145

llvm::NullPointerIsDefined
LLVM_ABI bool NullPointerIsDefined(const Function *F, unsigned AS=0)
Check whether null pointer dereferencing is considered undefined behavior for a given function or an ...
Definition Function.cpp:1172

llvm::find_if_not
auto find_if_not(R &&Range, UnaryPredicate P)
Definition STLExtras.h:1763

llvm::dbgs
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:207

llvm::none_of
bool none_of(R &&Range, UnaryPredicate P)
Provide wrappers to std::none_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1739

llvm::isAtLeastOrStrongerThan
bool isAtLeastOrStrongerThan(AtomicOrdering AO, AtomicOrdering Other)
Definition AtomicOrdering.h:106

llvm::getLosslessSignedTrunc
LLVM_ABI Constant * getLosslessSignedTrunc(Constant *C, Type *DestTy, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
Definition ConstantFolding.cpp:4712

llvm::buildAssumeFromKnowledge
LLVM_ABI AssumeInst * buildAssumeFromKnowledge(ArrayRef< RetainedKnowledge > Knowledge, Instruction *CtxI, AssumptionCache *AC=nullptr, DominatorTree *DT=nullptr)
Build and return a new assume created from the provided knowledge if the knowledge in the assume is f...
Definition AssumeBundleBuilder.cpp:309

llvm::inverse_fabs
LLVM_ABI FPClassTest inverse_fabs(FPClassTest Mask)
Return the test mask which returns true after fabs is applied to the value.
Definition FloatingPointMode.cpp:35

llvm::SmallVector
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
Definition SmallVector.h:1129

llvm::isa
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547

llvm::isNotCrossLaneOperation
LLVM_ABI bool isNotCrossLaneOperation(const Instruction *I)
Return true if the instruction doesn't potentially cross vector lanes.
Definition ValueTracking.cpp:6950

llvm::maskIsAllOneOrUndef
LLVM_ABI bool maskIsAllOneOrUndef(Value *Mask)
Given a mask vector of i1, return true if all of the elements of this predicate mask are known to be ...
Definition VectorUtils.cpp:1282

llvm::Key
LLVM_ATTRIBUTE_VISIBILITY_DEFAULT AnalysisKey InnerAnalysisManagerProxy< AnalysisManagerT, IRUnitT, ExtraArgTs... >::Key
Definition PassManager.h:668

llvm::ConstantFoldBinaryOpOperands
LLVM_ABI Constant * ConstantFoldBinaryOpOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL)
Attempt to constant fold a binary operation with the specified operands.
Definition ConstantFolding.cpp:1318

llvm::isKnownNonZero
LLVM_ABI bool isKnownNonZero(const Value *V, const SimplifyQuery &Q, unsigned Depth=0)
Return true if the given value is known to be non-zero when defined.
Definition ValueTracking.cpp:3583

llvm::PoisonMaskElem
constexpr int PoisonMaskElem
Definition Instructions.h:1923

llvm::AtomicOrdering::Unordered
@ Unordered
Definition AtomicOrdering.h:58

llvm::ModRefInfo::Mod
@ Mod
The access may modify the value stored in memory.
Definition ModRef.h:34

llvm::simplifyFMAFMul
LLVM_ABI Value * simplifyFMAFMul(Value *LHS, Value *RHS, FastMathFlags FMF, const SimplifyQuery &Q, fp::ExceptionBehavior ExBehavior=fp::ebIgnore, RoundingMode Rounding=RoundingMode::NearestTiesToEven)
Given operands for the multiplication of a FMA, fold the result or return null.
Definition InstructionSimplify.cpp:6051

llvm::IRMemLocation::Other
@ Other
Any other memory.
Definition ModRef.h:68

llvm::Data
FunctionAddr VTableAddr uintptr_t uintptr_t Data
Definition InstrProf.h:189

llvm::simplifyConstrainedFPCall
LLVM_ABI Value * simplifyConstrainedFPCall(CallBase *Call, const SimplifyQuery &Q)
Given a constrained FP intrinsic call, tries to compute its simplified version.
Definition InstructionSimplify.cpp:7304

llvm::minnum
LLVM_READONLY APFloat minnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2008 minNum semantics.
Definition APFloat.h:1561

llvm::OperandBundleDef
OperandBundleDefT< Value * > OperandBundleDef
Definition AutoUpgrade.h:34

llvm::RecurKind::Add
@ Add
Sum of integers.
Definition IVDescriptors.h:37

llvm::isVectorIntrinsicWithScalarOpAtArg
LLVM_ABI bool isVectorIntrinsicWithScalarOpAtArg(Intrinsic::ID ID, unsigned ScalarOpdIdx, const TargetTransformInfo *TTI)
Identifies if the vector form of the intrinsic has a scalar operand.
Definition VectorUtils.cpp:148

llvm::computeConstantRangeIncludingKnownBits
LLVM_ABI ConstantRange computeConstantRangeIncludingKnownBits(const WithCache< const Value * > &V, bool ForSigned, const SimplifyQuery &SQ)
Combine constant ranges from computeConstantRange() and computeKnownBits().
Definition ValueTracking.cpp:7107

llvm::Next
FunctionAddr VTableAddr Next
Definition InstrProf.h:141

llvm::Op
DWARFExpression::Operation Op
Definition DWARFExpressionPrinter.cpp:22

llvm::isSafeToSpeculativelyExecuteWithVariableReplaced
bool isSafeToSpeculativelyExecuteWithVariableReplaced(const Instruction *I, bool IgnoreUBImplyingAttrs=true)
Don't use information from its non-constant operands.
Definition ValueTracking.h:560

llvm::ArrayRef
ArrayRef(const T &OneElt) -> ArrayRef< T >

llvm::getFreedOperand
LLVM_ABI Value * getFreedOperand(const CallBase *CB, const TargetLibraryInfo *TLI)
If this is a call to a free function, return the freed operand.
Definition MemoryBuiltins.cpp:548

llvm::BitWidth
constexpr unsigned BitWidth
Definition BitmaskEnum.h:220

llvm::isDereferenceablePointer
LLVM_ABI bool isDereferenceablePointer(const Value *V, Type *Ty, const DataLayout &DL, const Instruction *CtxI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr, const TargetLibraryInfo *TLI=nullptr)
Return true if this is always a dereferenceable pointer.
Definition Loads.cpp:249

llvm::maskIsAllZeroOrUndef
LLVM_ABI bool maskIsAllZeroOrUndef(Value *Mask)
Given a mask vector of i1, return true if all of the elements of this predicate mask are known to be ...
Definition VectorUtils.cpp:1256

llvm::cast
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559

llvm::is_contained
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
Definition STLExtras.h:1897

llvm::getAllocSize
LLVM_ABI std::optional< APInt > getAllocSize(const CallBase *CB, const TargetLibraryInfo *TLI, function_ref< const Value *(const Value *)> Mapper=[](const Value *V) { return V;})
Return the size of the requested allocation.
Definition MemoryBuiltins.cpp:367

llvm::Log2
unsigned Log2(Align A)
Returns the log2 of the alignment.
Definition Alignment.h:197

llvm::maskContainsAllOneOrUndef
LLVM_ABI bool maskContainsAllOneOrUndef(Value *Mask)
Given a mask vector of i1, return true if any of the elements of this predicate mask are known to be ...
Definition VectorUtils.cpp:1308

llvm::isImpliedByDomCondition
LLVM_ABI std::optional< bool > isImpliedByDomCondition(const Value *Cond, const Instruction *ContextI, const DataLayout &DL)
Return the boolean condition value in the context of the given instruction if it is known based on do...
Definition ValueTracking.cpp:9673

llvm::minimum
LLVM_READONLY APFloat minimum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 minimum semantics.
Definition APFloat.h:1598

llvm::isKnownNegation
LLVM_ABI bool isKnownNegation(const Value *X, const Value *Y, bool NeedNSW=false, bool AllowPoison=true)
Return true if the two given values are negations of each other.
Definition ValueTracking.cpp:8457

llvm::getUnderlyingObject
LLVM_ABI const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=MaxLookupSearchDepth)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
Definition ValueTracking.cpp:6683

llvm::isKnownNonNegative
LLVM_ABI bool isKnownNonNegative(const Value *V, const SimplifyQuery &SQ, unsigned Depth=0)
Returns true if the given value is known to be non-negative.
Definition ValueTracking.cpp:281

llvm::isTriviallyVectorizable
LLVM_ABI bool isTriviallyVectorizable(Intrinsic::ID ID)
Identify if the intrinsic is trivially vectorizable.
Definition VectorUtils.cpp:46

llvm::computeKnownFPSignBit
LLVM_ABI std::optional< bool > computeKnownFPSignBit(const Value *V, const SimplifyQuery &SQ, unsigned Depth=0)
Return false if we can prove that the specified FP value's sign bit is 0.
Definition ValueTracking.cpp:6010

std::swap
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition BitVector.h:869

raw_ostream.h

NC
#define NC
Definition regutils.h:42

llvm::AAMDNodes
A collection of metadata nodes that might be associated with a memory access used by the alias-analys...
Definition Metadata.h:761

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39

llvm::DenormalMode::IEEE
@ IEEE
IEEE-754 denormal numbers preserved.
Definition FloatingPointMode.h:78

llvm::KnownBits
Definition KnownBits.h:24

llvm::KnownBits::isNonNegative
bool isNonNegative() const
Returns true if this value is known to be non-negative.
Definition KnownBits.h:108

llvm::KnownBits::countMinTrailingZeros
unsigned countMinTrailingZeros() const
Returns the minimum number of trailing zero bits.
Definition KnownBits.h:242

llvm::KnownBits::countMaxTrailingZeros
unsigned countMaxTrailingZeros() const
Returns the maximum number of trailing zero bits possible.
Definition KnownBits.h:274

llvm::KnownBits::countMaxPopulation
unsigned countMaxPopulation() const
Returns the maximum number of bits that could be one.
Definition KnownBits.h:289

llvm::KnownBits::getBitWidth
unsigned getBitWidth() const
Get the bit width of this value.
Definition KnownBits.h:44

llvm::KnownBits::isNonZero
bool isNonZero() const
Returns true if this value is known to be non-zero.
Definition KnownBits.h:111

llvm::KnownBits::countMinLeadingZeros
unsigned countMinLeadingZeros() const
Returns the minimum number of leading zero bits.
Definition KnownBits.h:248

llvm::KnownBits::isNegative
bool isNegative() const
Returns true if this value is known to be negative.
Definition KnownBits.h:105

llvm::KnownBits::countMaxLeadingZeros
unsigned countMaxLeadingZeros() const
Returns the maximum number of leading zero bits possible.
Definition KnownBits.h:280

llvm::KnownBits::One
APInt One
Definition KnownBits.h:26

llvm::KnownBits::Zero
APInt Zero
Definition KnownBits.h:25

llvm::KnownBits::countMinPopulation
unsigned countMinPopulation() const
Returns the number of bits known to be one.
Definition KnownBits.h:286

llvm::KnownBits::isAllOnes
bool isAllOnes() const
Returns true if value is all one bits.
Definition KnownBits.h:83

llvm::KnownFPClass::KnownFPClasses
FPClassTest KnownFPClasses
Floating-point classes the value could be one of.
Definition KnownFPClass.h:25

llvm::MIPatternMatch::And
Matching combinators.
Definition MIPatternMatch.h:314

llvm::MaybeAlign
This struct is a compact representation of a valid (power of two) or undefined (0) alignment.
Definition Alignment.h:106

llvm::MaybeAlign::valueOrOne
Align valueOrOne() const
For convenience, returns a valid alignment or 1 if undefined.
Definition Alignment.h:130

llvm::MinMax
Definition AssumeBundleQueries.h:72

llvm::OperandBundleUse
A lightweight accessor for an operand bundle meant to be passed around by value.
Definition InstrTypes.h:1009

llvm::OperandBundleUse::getTagName
StringRef getTagName() const
Return the tag of this operand bundle as a string.
Definition InstrTypes.h:1028

llvm::OperandBundleUse::getTagID
uint32_t getTagID() const
Return the tag of this operand bundle as an integer.
Definition InstrTypes.h:1037

llvm::OperandBundleUse::Inputs
ArrayRef< Use > Inputs
Definition InstrTypes.h:1010

llvm::PatternMatch::m_Mask
Definition PatternMatch.h:2000

llvm::PatternMatch::m_SpecificMask
Definition PatternMatch.h:2015

llvm::RetainedKnowledge
Represent one information held inside an operand bundle of an llvm.assume.
Definition AssumeBundleQueries.h:102

llvm::RetainedKnowledge::AttrKind
Attribute::AttrKind AttrKind
Definition AssumeBundleQueries.h:103

llvm::RetainedKnowledge::ArgValue
uint64_t ArgValue
Definition AssumeBundleQueries.h:104

llvm::RetainedKnowledge::WasOn
Value * WasOn
Definition AssumeBundleQueries.h:106

llvm::RetainedKnowledge::IRArgValue
Value * IRArgValue
Definition AssumeBundleQueries.h:105

llvm::SelectPatternResult::Flavor
SelectPatternFlavor Flavor
Definition ValueTracking.h:858

llvm::SimplifyQuery
Definition SimplifyQuery.h:71

llvm::SimplifyQuery::DL
const DataLayout & DL
Definition SimplifyQuery.h:72

llvm::SimplifyQuery::CxtI
const Instruction * CxtI
Definition SimplifyQuery.h:76

llvm::SimplifyQuery::getWithInstruction
SimplifyQuery getWithInstruction(const Instruction *I) const
Definition SimplifyQuery.h:108

llvm::UnderlyingObject
Definition ScheduleDAGInstrs.h:105

llvm::cl::desc
Definition CommandLine.h:411