doxygen/InstCombineCalls_8cpp_source.html

//===- InstCombineCalls.cpp -----------------------------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file implements the visitCall, visitInvoke, and visitCallBr functions.

//

//===----------------------------------------------------------------------===//


#include "InstCombineInternal.h"

#include "llvm/ADT/APFloat.h"

#include "llvm/ADT/APInt.h"

#include "llvm/ADT/APSInt.h"

#include "llvm/ADT/ArrayRef.h"

#include "llvm/ADT/STLFunctionalExtras.h"

#include "llvm/ADT/SmallBitVector.h"

#include "llvm/ADT/SmallVector.h"

#include "llvm/ADT/Statistic.h"

#include "llvm/Analysis/AliasAnalysis.h"

#include "llvm/Analysis/AssumeBundleQueries.h"

#include "llvm/Analysis/AssumptionCache.h"

#include "llvm/Analysis/InstructionSimplify.h"

#include "llvm/Analysis/Loads.h"

#include "llvm/Analysis/MemoryBuiltins.h"

#include "llvm/Analysis/ValueTracking.h"

#include "llvm/Analysis/VectorUtils.h"

#include "llvm/IR/AttributeMask.h"

#include "llvm/IR/Attributes.h"

#include "llvm/IR/BasicBlock.h"

#include "llvm/IR/Constant.h"

#include "llvm/IR/Constants.h"

#include "llvm/IR/DataLayout.h"

#include "llvm/IR/DebugInfo.h"

#include "llvm/IR/DerivedTypes.h"

#include "llvm/IR/Function.h"

#include "llvm/IR/GlobalVariable.h"

#include "llvm/IR/InlineAsm.h"

#include "llvm/IR/InstrTypes.h"

#include "llvm/IR/Instruction.h"

#include "llvm/IR/Instructions.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/Intrinsics.h"

#include "llvm/IR/IntrinsicsAArch64.h"

#include "llvm/IR/IntrinsicsAMDGPU.h"

#include "llvm/IR/IntrinsicsARM.h"

#include "llvm/IR/IntrinsicsHexagon.h"

#include "llvm/IR/LLVMContext.h"

#include "llvm/IR/Metadata.h"

#include "llvm/IR/PatternMatch.h"

#include "llvm/IR/Statepoint.h"

#include "llvm/IR/Type.h"

#include "llvm/IR/User.h"

#include "llvm/IR/Value.h"

#include "llvm/IR/ValueHandle.h"

#include "llvm/Support/AtomicOrdering.h"

#include "llvm/Support/Casting.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Support/Compiler.h"

#include "llvm/Support/Debug.h"

#include "llvm/Support/ErrorHandling.h"

#include "llvm/Support/KnownBits.h"

#include "llvm/Support/MathExtras.h"

#include "llvm/Support/raw_ostream.h"

#include "llvm/Transforms/InstCombine/InstCombiner.h"

#include "llvm/Transforms/Utils/AssumeBundleBuilder.h"

#include "llvm/Transforms/Utils/Local.h"

#include "llvm/Transforms/Utils/SimplifyLibCalls.h"

#include <algorithm>

#include <cassert>

#include <cstdint>

#include <optional>

#include <utility>

#include <vector>


#define DEBUG_TYPE "instcombine"

#include "llvm/Transforms/Utils/InstructionWorklist.h"


using namespace llvm;

using namespace PatternMatch;


STATISTIC(NumSimplified, "Number of library calls simplified");


// Command-line option "instcombine-guard-widening-window", an unsigned value
// that defaults to 3. Per its description it bounds how wide an instruction
// window is bypassed while looking for another guard; the code that reads it
// is not part of this section of the file.
static cl::opt<unsigned> GuardWideningWindow(

    "instcombine-guard-widening-window",

    cl::init(3),

    cl::desc("How wide an instruction window to bypass looking for "

             "another guard"));


/// Compute the type \p Ty is promoted to when it is passed through a va_arg
/// area: an integer type narrower than 32 bits becomes i32, and any other
/// type is handed back unchanged.
static Type *getPromotedType(Type *Ty) {
  auto *IntTy = dyn_cast<IntegerType>(Ty);
  if (IntTy && IntTy->getBitWidth() < 32)
    return Type::getInt32Ty(Ty->getContext());
  return Ty;
}


/// Detect a memcpy/memmove whose source is an alloca with no other use.
///
/// The raw source is traced back through GEP and bitcast instructions; every
/// link of that chain, and the alloca it ends at, must have exactly one use.
/// TODO: This should probably be integrated with visitAllocSites, but that
/// requires a deeper change to allow either unread or unwritten objects.
static bool hasUndefSource(AnyMemTransferInst *MI) {
  Value *Cur = MI->getRawSource();
  for (;;) {
    // Stop walking once we leave the GEP/bitcast chain.
    if (!isa<GetElementPtrInst>(Cur) && !isa<BitCastInst>(Cur))
      break;
    // A second user of any link might observe the memory.
    if (!Cur->hasOneUse())
      return false;
    Cur = cast<Instruction>(Cur)->getOperand(0);
  }

  if (!isa<AllocaInst>(Cur))
    return false;
  return Cur->hasOneUse();
}


/// Simplify the memory-transfer intrinsic \p MI in place, one step per call.
///
/// In order, this (1) raises the recorded destination and then source
/// alignment to the alignment computed by getKnownAlignment, (2) sets the
/// length to zero when the destination cannot be modified, or when the source
/// satisfies hasUndefSource and the transfer is not volatile, and (3) replaces
/// a constant-length transfer of 1, 2, 4 or 8 bytes with an integer load/store
/// pair and then sets the length to zero.
///
/// \returns \p MI when it was changed, or nullptr when nothing applies.
Instruction *InstCombinerImpl::SimplifyAnyMemTransfer(AnyMemTransferInst *MI) {

  Align DstAlign = getKnownAlignment(MI->getRawDest(), DL, MI, &AC, &DT);

  MaybeAlign CopyDstAlign = MI->getDestAlign();

  if (!CopyDstAlign || *CopyDstAlign < DstAlign) {

    MI->setDestAlignment(DstAlign);

    return MI;

  }


  Align SrcAlign = getKnownAlignment(MI->getRawSource(), DL, MI, &AC, &DT);

  MaybeAlign CopySrcAlign = MI->getSourceAlign();

  if (!CopySrcAlign || *CopySrcAlign < SrcAlign) {

    MI->setSourceAlignment(SrcAlign);

    return MI;

  }


  // If we have a store to a location which is known constant, we can conclude

  // that the store must be storing the constant value (else the memory

  // wouldn't be constant), and this must be a noop.

  if (!isModSet(AA->getModRefInfoMask(MI->getDest()))) {

    // Set the size of the copy to 0, it will be deleted on the next iteration.

    MI->setLength(Constant::getNullValue(MI->getLength()->getType()));

    return MI;

  }


  // If the source is provably undef, the memcpy/memmove doesn't do anything

  // (unless the transfer is volatile).

  if (hasUndefSource(MI) && !MI->isVolatile()) {

    // Set the size of the copy to 0, it will be deleted on the next iteration.

    MI->setLength(Constant::getNullValue(MI->getLength()->getType()));

    return MI;

  }


  // If MemCpyInst length is 1/2/4/8 bytes then replace memcpy with

  // load/store.

  ConstantInt *MemOpLength = dyn_cast<ConstantInt>(MI->getLength());

  if (!MemOpLength) return nullptr;


  // Source and destination pointer types are always "i8*" for intrinsic.  See

  // if the size is something we can handle with a single primitive load/store.

  // A single load+store correctly handles overlapping memory in the memmove

  // case.

  uint64_t Size = MemOpLength->getLimitedValue();

  assert(Size && "0-sized memory transferring should be removed already.");


  // Size & (Size - 1) is non-zero exactly when Size is not a power of two.
  if (Size > 8 || (Size&(Size-1)))

    return nullptr;  // If not 1/2/4/8 bytes, exit.


  // If it is an atomic and alignment is less than the size then we will

  // introduce the unaligned memory access which will be later transformed

  // into libcall in CodeGen. This is not evident performance gain so disable

  // it now.

  // Both alignments hold a value here: the early returns at the top of this
  // function fire whenever either one is unset.
  if (isa<AtomicMemTransferInst>(MI))

    if (*CopyDstAlign < Size || *CopySrcAlign < Size)

      return nullptr;


  // Use an integer load+store unless we can find something better.

  // Size << 3 converts the byte count into a bit width.
  IntegerType* IntType = IntegerType::get(MI->getContext(), Size<<3);


  // If the memcpy has metadata describing the members, see if we can get the

  // TBAA tag describing our copy.

  AAMDNodes AACopyMD = MI->getAAMetadata().adjustForAccess(Size);


  Value *Src = MI->getArgOperand(1);

  Value *Dest = MI->getArgOperand(0);

  LoadInst *L = Builder.CreateLoad(IntType, Src);

  // Alignment from the mem intrinsic will be better, so use it.

  L->setAlignment(*CopySrcAlign);

  L->setAAMetadata(AACopyMD);

  // Carry the intrinsic's parallel-loop and access-group metadata over to the
  // new load (and to the store below) when present.
  MDNode *LoopMemParallelMD =

    MI->getMetadata(LLVMContext::MD_mem_parallel_loop_access);

  if (LoopMemParallelMD)

    L->setMetadata(LLVMContext::MD_mem_parallel_loop_access, LoopMemParallelMD);

  MDNode *AccessGroupMD = MI->getMetadata(LLVMContext::MD_access_group);

  if (AccessGroupMD)

    L->setMetadata(LLVMContext::MD_access_group, AccessGroupMD);


  StoreInst *S = Builder.CreateStore(L, Dest);

  // Alignment from the mem intrinsic will be better, so use it.

  S->setAlignment(*CopyDstAlign);

  S->setAAMetadata(AACopyMD);

  if (LoopMemParallelMD)

    S->setMetadata(LLVMContext::MD_mem_parallel_loop_access, LoopMemParallelMD);

  if (AccessGroupMD)

    S->setMetadata(LLVMContext::MD_access_group, AccessGroupMD);

  // Only the store receives the intrinsic's DIAssignID metadata.
  S->copyMetadata(*MI, LLVMContext::MD_DIAssignID);


  if (auto *MT = dyn_cast<MemTransferInst>(MI)) {

    // non-atomics can be volatile

    L->setVolatile(MT->isVolatile());

    S->setVolatile(MT->isVolatile());

  }

  if (isa<AtomicMemTransferInst>(MI)) {

    // atomics have to be unordered

    L->setOrdering(AtomicOrdering::Unordered);

    S->setOrdering(AtomicOrdering::Unordered);

  }


  // Set the size of the copy to 0, it will be deleted on the next iteration.

  MI->setLength(Constant::getNullValue(MemOpLength->getType()));

  return MI;

}


/// Simplify the memset-like intrinsic \p MI in place, one step per call.
///
/// The destination alignment is raised to the provable alignment first. The
/// length is then set to zero when the destination cannot be modified or the
/// fill value is undef. Finally, a constant i8 fill of constant length 1, 2,
/// 4 or 8 bytes is replaced by a single integer store.
///
/// \returns \p MI when it was changed, or nullptr when nothing applies.
Instruction *InstCombinerImpl::SimplifyAnyMemSet(AnyMemSetInst *MI) {
  const Align ProvenAlign = getKnownAlignment(MI->getDest(), DL, MI, &AC, &DT);
  const MaybeAlign RecordedAlign = MI->getDestAlign();
  if (!RecordedAlign || *RecordedAlign < ProvenAlign) {
    MI->setDestAlignment(ProvenAlign);
    return MI;
  }

  // Sets the length to zero; the intrinsic is then deleted on the next
  // iteration.
  auto ZeroOutLength = [MI]() -> Instruction * {
    MI->setLength(Constant::getNullValue(MI->getLength()->getType()));
    return MI;
  };

  // A store to a location known to be constant must be storing the value
  // that is already there (otherwise the memory would not be constant), so
  // the memset is a no-op.
  if (!isModSet(AA->getModRefInfoMask(MI->getDest())))
    return ZeroOutLength();

  // A memset of an undef value can be dropped.
  // FIXME: This is technically incorrect because it might overwrite a poison
  // value. Change to PoisonValue once #52930 is resolved.
  if (isa<UndefValue>(MI->getValue()))
    return ZeroOutLength();

  // Everything below needs a constant length and a constant i8 fill value.
  auto *LenC = dyn_cast<ConstantInt>(MI->getLength());
  auto *FillC = dyn_cast<ConstantInt>(MI->getValue());
  if (!LenC || !FillC || !FillC->getType()->isIntegerTy(8))
    return nullptr;

  const uint64_t NumBytes = LenC->getLimitedValue();
  assert(NumBytes && "0-sized memory setting should be removed already.");
  const Align StoreAlign = MI->getDestAlign().valueOrOne();

  // For an atomic memset, an alignment below the size would introduce an
  // unaligned access that CodeGen later turns into a libcall. That is no
  // evident performance gain, so leave such intrinsics alone.
  const bool IsAtomic = isa<AtomicMemSetInst>(MI);
  if (IsAtomic && StoreAlign < NumBytes)
    return nullptr;

  // memset(s,c,n) -> store s, c (for n=1,2,4,8)
  if (NumBytes > 8 || !isPowerOf2_32(static_cast<uint32_t>(NumBytes)))
    return nullptr;

  Type *StoreTy = IntegerType::get(MI->getContext(), NumBytes * 8);
  Value *Dest = MI->getDest();

  // Replicate the fill byte into every byte of a 64-bit pattern.
  const uint64_t Pattern = FillC->getZExtValue() * 0x0101010101010101ULL;
  Constant *FillVal = ConstantInt::get(StoreTy, Pattern);
  StoreInst *S = Builder.CreateStore(FillVal, Dest, MI->isVolatile());
  S->copyMetadata(*MI, LLVMContext::MD_DIAssignID);

  // Assignment markers that refer to the i8 fill constant are pointed at the
  // widened store value instead.
  auto RetargetMarker = [FillC, FillVal](auto *DbgAssign) {
    if (llvm::is_contained(DbgAssign->location_ops(), FillC))
      DbgAssign->replaceVariableLocationOp(FillC, FillVal);
  };
  for_each(at::getAssignmentMarkers(S), RetargetMarker);
  for_each(at::getDVRAssignmentMarkers(S), RetargetMarker);

  S->setAlignment(StoreAlign);
  if (IsAtomic)
    S->setOrdering(AtomicOrdering::Unordered);

  // Set the size of the memset to 0, it will be deleted on the next iteration.
  MI->setLength(Constant::getNullValue(LenC->getType()));
  return MI;
}


// TODO, obvious missing transforms:
// * Narrow width by halves excluding zero/undef lanes

/// Try to replace the masked load \p II with an ordinary load.
///
/// An all-ones-or-undef mask yields a plain aligned load. Otherwise, if the
/// pointer can be loaded from unconditionally, the result is a plain load
/// followed by a select between the loaded value and operand 3, controlled
/// by the mask.
///
/// \returns the replacement value, or nullptr if neither rewrite applies.
Value *InstCombinerImpl::simplifyMaskedLoad(IntrinsicInst &II) {
  Value *Ptr = II.getArgOperand(0);
  Value *Mask = II.getArgOperand(2);
  const Align LoadAlign =
      cast<ConstantInt>(II.getArgOperand(1))->getAlignValue();

  // Emits the full-width load that both rewrites are built on.
  auto EmitPlainLoad = [&]() -> LoadInst * {
    LoadInst *Load =
        Builder.CreateAlignedLoad(II.getType(), Ptr, LoadAlign, "unmaskedload");
    Load->copyMetadata(II);
    return Load;
  };

  // Every lane is enabled (or undef): this is just a vector load.
  if (maskIsAllOneOrUndef(Mask))
    return EmitPlainLoad();

  // TODO: use DT for context sensitive query
  if (!isDereferenceablePointer(Ptr, II.getType(), II.getDataLayout(), &II,
                                &AC))
    return nullptr;

  // The address is safe to load from unconditionally: use a load/select idiom.
  LoadInst *Load = EmitPlainLoad();
  return Builder.CreateSelect(Mask, Load, II.getArgOperand(3));
}


// TODO, obvious missing transforms:
// * Single constant active lane -> store
// * Narrow width by halves excluding zero/undef lanes

/// Try to simplify the masked store \p II when its mask is a constant.
///
/// An all-zero mask erases the intrinsic, an all-ones mask turns it into a
/// plain store, and for other fixed-width masks the stored value is
/// simplified using only the lanes that may be written.
///
/// \returns the resulting instruction, or nullptr if nothing changed.
Instruction *InstCombinerImpl::simplifyMaskedStore(IntrinsicInst &II) {
  auto *MaskC = dyn_cast<Constant>(II.getArgOperand(3));
  if (!MaskC)
    return nullptr;

  // No lane is written, so the store does nothing.
  if (MaskC->isNullValue())
    return eraseInstFromFunction(II);

  // Every lane is written: a plain vector store of the first argument.
  if (MaskC->isAllOnesValue()) {
    const Align StoreAlign =
        cast<ConstantInt>(II.getArgOperand(2))->getAlignValue();
    auto *Store = new StoreInst(II.getArgOperand(0), II.getArgOperand(1),
                                false, StoreAlign);
    Store->copyMetadata(II);
    return Store;
  }

  if (isa<ScalableVectorType>(MaskC->getType()))
    return nullptr;

  // Masked-off lanes let SimplifyDemandedVectorElts simplify the operand.
  APInt LiveLanes = possiblyDemandedEltsInMask(MaskC);
  APInt PoisonLanes(LiveLanes.getBitWidth(), 0);
  Value *Simplified =
      SimplifyDemandedVectorElts(II.getOperand(0), LiveLanes, PoisonLanes);
  if (!Simplified)
    return nullptr;
  return replaceOperand(II, 0, Simplified);
}


// TODO, obvious missing transforms:
// * Single constant active lane load -> load
// * Dereferenceable address & few lanes -> scalarize speculative load/selects
// * Adjacent vector addresses -> masked.load
// * Narrow width by halves excluding zero/undef lanes
// * Vector incrementing address -> vector masked load

/// Try to simplify the masked gather \p II.
///
/// With a constant all-ones mask and a splat pointer operand, every lane
/// reloads the same address, so the gather becomes one scalar load that is
/// broadcast to the result vector.
///
/// \returns the result of replacing \p II's uses, or nullptr if the pattern
/// does not match.
Instruction *InstCombinerImpl::simplifyMaskedGather(IntrinsicInst &II) {
  auto *MaskC = dyn_cast<Constant>(II.getArgOperand(2));
  if (!MaskC || !MaskC->isAllOnesValue())
    return nullptr;

  Value *ScalarPtr = getSplatValue(II.getArgOperand(0));
  if (!ScalarPtr)
    return nullptr;

  auto *ResultTy = cast<VectorType>(II.getType());
  const Align LoadAlign =
      cast<ConstantInt>(II.getArgOperand(1))->getAlignValue();
  LoadInst *Scalar = Builder.CreateAlignedLoad(
      ResultTy->getElementType(), ScalarPtr, LoadAlign, "load.scalar");
  Value *Broadcast = Builder.CreateVectorSplat(ResultTy->getElementCount(),
                                               Scalar, "broadcast");
  return replaceInstUsesWith(II, cast<Instruction>(Broadcast));
}


// TODO, obvious missing transforms:
// * Single constant active lane -> store
// * Adjacent vector addresses -> masked.store
// * Narrow store width by halves excluding zero/undef lanes
// * Vector incrementing address -> vector masked store

/// Try to simplify the masked scatter \p II when its mask is a constant.
///
/// An all-zero mask erases the intrinsic. A splat pointer operand allows the
/// scatter to become a scalar store in two cases (see below). Otherwise, for
/// fixed-width masks, the value and pointer operands are simplified using
/// only the lanes that may be written.
///
/// \returns the resulting instruction, or nullptr if nothing changed.
Instruction *InstCombinerImpl::simplifyMaskedScatter(IntrinsicInst &II) {
  auto *MaskC = dyn_cast<Constant>(II.getArgOperand(3));
  if (!MaskC)
    return nullptr;

  // No lane is written, so the scatter does nothing.
  if (MaskC->isNullValue())
    return eraseInstFromFunction(II);

  // Vector splat address -> scalar store
  if (Value *ScalarPtr = getSplatValue(II.getArgOperand(1))) {
    // Builds the non-volatile scalar store that replaces the scatter.
    auto MakeStore = [&](Value *Stored) -> StoreInst * {
      Align StoreAlign =
          cast<ConstantInt>(II.getArgOperand(2))->getAlignValue();
      auto *Store =
          new StoreInst(Stored, ScalarPtr, /*IsVolatile=*/false, StoreAlign);
      Store->copyMetadata(II);
      return Store;
    };

    // scatter(splat(value), splat(ptr), non-zero-mask) -> store value, ptr
    Value *ScalarVal = getSplatValue(II.getArgOperand(0));
    if (ScalarVal && maskContainsAllOneOrUndef(MaskC))
      return MakeStore(ScalarVal);

    // scatter(vector, splat(ptr), splat(true)) -> store extract(vector,
    // lastlane), ptr
    if (MaskC->isAllOnesValue()) {
      auto *PtrVecTy = cast<VectorType>(II.getArgOperand(1)->getType());
      ElementCount VF = PtrVecTy->getElementCount();
      Value *RunTimeVF = Builder.CreateElementCount(Builder.getInt32Ty(), VF);
      Value *LastLane = Builder.CreateSub(RunTimeVF, Builder.getInt32(1));
      Value *LastElt =
          Builder.CreateExtractElement(II.getArgOperand(0), LastLane);
      return MakeStore(LastElt);
    }
  }

  if (isa<ScalableVectorType>(MaskC->getType()))
    return nullptr;

  // Masked-off lanes let SimplifyDemandedVectorElts simplify the value
  // operand (0) first and then the pointer operand (1).
  APInt LiveLanes = possiblyDemandedEltsInMask(MaskC);
  APInt PoisonLanes(LiveLanes.getBitWidth(), 0);
  for (unsigned OpIdx : {0u, 1u})
    if (Value *Simplified = SimplifyDemandedVectorElts(
            II.getOperand(OpIdx), LiveLanes, PoisonLanes))
      return replaceOperand(II, OpIdx, Simplified);

  return nullptr;
}


/// Collapse chains of launder.invariant.group / strip.invariant.group:
///   launder(launder(%x)) -> launder(%x)     (the result is not the argument)
///   launder(strip(%x))   -> launder(%x)
///   strip(strip(%x))     -> strip(%x)       (the result is not the argument)
///   strip(launder(%x))   -> strip(%x)
/// This is legal because it preserves the most recent information about
/// the presence or absence of invariant.group.
///
/// \returns the newly built intrinsic (address-space cast to \p II's type if
/// the address spaces differ), or nullptr when there is no nested
/// launder/strip to remove.
static Instruction *simplifyInvariantGroupIntrinsic(IntrinsicInst &II,
                                                    InstCombinerImpl &IC) {
  Value *DirectArg = II.getArgOperand(0)->stripPointerCasts();

  // Peel every launder/strip (and the pointer casts between them) off the
  // argument.
  Value *Root = DirectArg;
  while (true) {
    auto *Inner = dyn_cast<IntrinsicInst>(Root);
    if (!Inner)
      break;
    const Intrinsic::ID InnerID = Inner->getIntrinsicID();
    if (InnerID != Intrinsic::launder_invariant_group &&
        InnerID != Intrinsic::strip_invariant_group)
      break;
    Root = Inner->getArgOperand(0)->stripPointerCasts();
  }

  // No launders/strips to remove.
  if (Root == DirectArg)
    return nullptr;

  Value *Replacement = nullptr;
  switch (II.getIntrinsicID()) {
  case Intrinsic::launder_invariant_group:
    Replacement = IC.Builder.CreateLaunderInvariantGroup(Root);
    break;
  case Intrinsic::strip_invariant_group:
    Replacement = IC.Builder.CreateStripInvariantGroup(Root);
    break;
  default:
    llvm_unreachable(
        "simplifyInvariantGroupIntrinsic only handles launder and strip");
  }

  const unsigned NewAS = Replacement->getType()->getPointerAddressSpace();
  const unsigned OldAS = II.getType()->getPointerAddressSpace();
  if (NewAS != OldAS)
    Replacement = IC.Builder.CreateAddrSpaceCast(Replacement, II.getType());

  return cast<Instruction>(Replacement);
}


/// Fold a call to the cttz or ctlz intrinsic (\p II).
///
/// Operand 0 is the value whose zeros are counted; operand 1 is the flag the
/// comments below call 'ZeroIsPoison'. The folds are tried in the order
/// written and the first one that applies returns.
///
/// \returns a new instruction, the result of replacing \p II's uses or one of
/// its operands, \p II itself after a range attribute was added, or nullptr
/// if no fold applies.
static Instruction *foldCttzCtlz(IntrinsicInst &II, InstCombinerImpl &IC) {

  assert((II.getIntrinsicID() == Intrinsic::cttz ||

          II.getIntrinsicID() == Intrinsic::ctlz) &&

         "Expected cttz or ctlz intrinsic");

  bool IsTZ = II.getIntrinsicID() == Intrinsic::cttz;

  Value *Op0 = II.getArgOperand(0);

  Value *Op1 = II.getArgOperand(1);

  Value *X;

  // ctlz(bitreverse(x)) -> cttz(x)

  // cttz(bitreverse(x)) -> ctlz(x)

  if (match(Op0, m_BitReverse(m_Value(X)))) {

    Intrinsic::ID ID = IsTZ ? Intrinsic::ctlz : Intrinsic::cttz;

    Function *F = Intrinsic::getDeclaration(II.getModule(), ID, II.getType());

    return CallInst::Create(F, {X, II.getArgOperand(1)});

  }


  if (II.getType()->isIntOrIntVectorTy(1)) {

    // ctlz/cttz i1 Op0 --> not Op0

    if (match(Op1, m_Zero()))

      return BinaryOperator::CreateNot(Op0);

    // If zero is poison, then the input can be assumed to be "true", so the

    // instruction simplifies to "false".

    assert(match(Op1, m_One()) && "Expected ctlz/cttz operand to be 0 or 1");

    return IC.replaceInstUsesWith(II, ConstantInt::getNullValue(II.getType()));

  }


  // If ctlz/cttz is only used as a shift amount, set is_zero_poison to true.

  if (II.hasOneUse() && match(Op1, m_Zero()) &&

      match(II.user_back(), m_Shift(m_Value(), m_Specific(&II))))

    return IC.replaceOperand(II, 1, IC.Builder.getTrue());


  // Bound by the m_ImmConstant matchers in the shift folds below.
  Constant *C;


  if (IsTZ) {

    // cttz(-x) -> cttz(x)

    if (match(Op0, m_Neg(m_Value(X))))

      return IC.replaceOperand(II, 0, X);


    // cttz(-x & x) -> cttz(x)

    if (match(Op0, m_c_And(m_Neg(m_Value(X)), m_Deferred(X))))

      return IC.replaceOperand(II, 0, X);


    // cttz(sext(x)) -> cttz(zext(x))

    if (match(Op0, m_OneUse(m_SExt(m_Value(X))))) {

      auto *Zext = IC.Builder.CreateZExt(X, II.getType());

      auto *CttzZext =

          IC.Builder.CreateBinaryIntrinsic(Intrinsic::cttz, Zext, Op1);

      return IC.replaceInstUsesWith(II, CttzZext);

    }


    // Zext doesn't change the number of trailing zeros, so narrow:

    // cttz(zext(x)) -> zext(cttz(x)) if the 'ZeroIsPoison' parameter is 'true'.

    if (match(Op0, m_OneUse(m_ZExt(m_Value(X)))) && match(Op1, m_One())) {

      auto *Cttz = IC.Builder.CreateBinaryIntrinsic(Intrinsic::cttz, X,

                                                    IC.Builder.getTrue());

      auto *ZextCttz = IC.Builder.CreateZExt(Cttz, II.getType());

      return IC.replaceInstUsesWith(II, ZextCttz);

    }


    // cttz(abs(x)) -> cttz(x)

    // cttz(nabs(x)) -> cttz(x)

    // Y is only an output slot for matchSelectPattern; it is not read here.
    Value *Y;

    SelectPatternFlavor SPF = matchSelectPattern(Op0, X, Y).Flavor;

    if (SPF == SPF_ABS || SPF == SPF_NABS)

      return IC.replaceOperand(II, 0, X);


    // Same fold for the abs intrinsic form.
    if (match(Op0, m_Intrinsic<Intrinsic::abs>(m_Value(X))))

      return IC.replaceOperand(II, 0, X);


    // cttz(shl(%const, %val), 1) --> add(cttz(%const, 1), %val)

    if (match(Op0, m_Shl(m_ImmConstant(C), m_Value(X))) &&

        match(Op1, m_One())) {

      Value *ConstCttz =

          IC.Builder.CreateBinaryIntrinsic(Intrinsic::cttz, C, Op1);

      return BinaryOperator::CreateAdd(ConstCttz, X);

    }


    // cttz(lshr exact (%const, %val), 1) --> sub(cttz(%const, 1), %val)

    if (match(Op0, m_Exact(m_LShr(m_ImmConstant(C), m_Value(X)))) &&

        match(Op1, m_One())) {

      Value *ConstCttz =

          IC.Builder.CreateBinaryIntrinsic(Intrinsic::cttz, C, Op1);

      return BinaryOperator::CreateSub(ConstCttz, X);

    }


    // cttz(add(lshr(UINT_MAX, %val), 1)) --> sub(width, %val)

    if (match(Op0, m_Add(m_LShr(m_AllOnes(), m_Value(X)), m_One()))) {

      Value *Width =

          ConstantInt::get(II.getType(), II.getType()->getScalarSizeInBits());

      return BinaryOperator::CreateSub(Width, X);

    }

  } else {

    // ctlz(lshr(%const, %val), 1) --> add(ctlz(%const, 1), %val)

    if (match(Op0, m_LShr(m_ImmConstant(C), m_Value(X))) &&

        match(Op1, m_One())) {

      Value *ConstCtlz =

          IC.Builder.CreateBinaryIntrinsic(Intrinsic::ctlz, C, Op1);

      return BinaryOperator::CreateAdd(ConstCtlz, X);

    }


    // ctlz(shl nuw (%const, %val), 1) --> sub(ctlz(%const, 1), %val)

    if (match(Op0, m_NUWShl(m_ImmConstant(C), m_Value(X))) &&

        match(Op1, m_One())) {

      Value *ConstCtlz =

          IC.Builder.CreateBinaryIntrinsic(Intrinsic::ctlz, C, Op1);

      return BinaryOperator::CreateSub(ConstCtlz, X);

    }

  }


  KnownBits Known = IC.computeKnownBits(Op0, 0, &II);


  // Create a mask for bits above (ctlz) or below (cttz) the first known one.

  unsigned PossibleZeros = IsTZ ? Known.countMaxTrailingZeros()

                                : Known.countMaxLeadingZeros();

  unsigned DefiniteZeros = IsTZ ? Known.countMinTrailingZeros()

                                : Known.countMinLeadingZeros();


  // If all bits above (ctlz) or below (cttz) the first known one are known

  // zero, this value is constant.

  // FIXME: This should be in InstSimplify because we're replacing an

  // instruction with a constant.

  if (PossibleZeros == DefiniteZeros) {

    // Note: this local C shadows the Constant *C declared above.
    auto *C = ConstantInt::get(Op0->getType(), DefiniteZeros);

    return IC.replaceInstUsesWith(II, C);

  }


  // If the input to cttz/ctlz is known to be non-zero,

  // then change the 'ZeroIsPoison' parameter to 'true'

  // because we know the zero behavior can't affect the result.

  if (!Known.One.isZero() ||

      isKnownNonZero(Op0, IC.getSimplifyQuery().getWithInstruction(&II))) {

    if (!match(II.getArgOperand(1), m_One()))

      return IC.replaceOperand(II, 1, IC.Builder.getTrue());

  }


  // Add range attribute since known bits can't completely reflect what we know.

  unsigned BitWidth = Op0->getType()->getScalarSizeInBits();

  // Skipped for 1-bit types and when a range attribute or range metadata is
  // already attached.
  if (BitWidth != 1 && !II.hasRetAttr(Attribute::Range) &&

      !II.getMetadata(LLVMContext::MD_range)) {

    // The result is at least DefiniteZeros and at most PossibleZeros; the
    // "+ 1" presumably makes the upper bound exclusive (confirm against
    // ConstantRange).
    ConstantRange Range(APInt(BitWidth, DefiniteZeros),

                        APInt(BitWidth, PossibleZeros + 1));

    II.addRangeRetAttr(Range);

    return &II;

  }


  return nullptr;

}


/// Fold a call to the ctpop intrinsic (\p II).
///
/// The folds are tried in the order written and the first one that applies
/// returns.
///
/// \returns a new instruction, the result of replacing \p II's uses or its
/// operand, \p II itself after a range attribute was added, or nullptr if no
/// fold applies.
static Instruction *foldCtpop(IntrinsicInst &II, InstCombinerImpl &IC) {

  assert(II.getIntrinsicID() == Intrinsic::ctpop &&

         "Expected ctpop intrinsic");

  Type *Ty = II.getType();

  unsigned BitWidth = Ty->getScalarSizeInBits();

  Value *Op0 = II.getArgOperand(0);

  Value *X, *Y;


  // ctpop(bitreverse(x)) -> ctpop(x)

  // ctpop(bswap(x)) -> ctpop(x)

  if (match(Op0, m_BitReverse(m_Value(X))) || match(Op0, m_BSwap(m_Value(X))))

    return IC.replaceOperand(II, 0, X);


  // ctpop(rot(x)) -> ctpop(x)

  // A funnel shift whose first two operands are the same value is a rotate.
  if ((match(Op0, m_FShl(m_Value(X), m_Value(Y), m_Value())) ||

       match(Op0, m_FShr(m_Value(X), m_Value(Y), m_Value()))) &&

      X == Y)

    return IC.replaceOperand(II, 0, X);


  // ctpop(x | -x) -> bitwidth - cttz(x, false)

  if (Op0->hasOneUse() &&

      match(Op0, m_c_Or(m_Value(X), m_Neg(m_Deferred(X))))) {

    Function *F =

        Intrinsic::getDeclaration(II.getModule(), Intrinsic::cttz, Ty);

    auto *Cttz = IC.Builder.CreateCall(F, {X, IC.Builder.getFalse()});

    auto *Bw = ConstantInt::get(Ty, APInt(BitWidth, BitWidth));

    return IC.replaceInstUsesWith(II, IC.Builder.CreateSub(Bw, Cttz));

  }


  // ctpop(~x & (x - 1)) -> cttz(x, false)

  // (x - 1) is matched in the form add(x, -1).
  if (match(Op0,

            m_c_And(m_Not(m_Value(X)), m_Add(m_Deferred(X), m_AllOnes())))) {

    Function *F =

        Intrinsic::getDeclaration(II.getModule(), Intrinsic::cttz, Ty);

    return CallInst::Create(F, {X, IC.Builder.getFalse()});

  }


  // Zext doesn't change the number of set bits, so narrow:

  // ctpop (zext X) --> zext (ctpop X)

  if (match(Op0, m_OneUse(m_ZExt(m_Value(X))))) {

    Value *NarrowPop = IC.Builder.CreateUnaryIntrinsic(Intrinsic::ctpop, X);

    return CastInst::Create(Instruction::ZExt, NarrowPop, Ty);

  }


  KnownBits Known(BitWidth);

  IC.computeKnownBits(Op0, Known, 0, &II);


  // If all bits are zero except for exactly one fixed bit, then the result

  // must be 0 or 1, and we can get that answer by shifting to LSB:

  // ctpop (X & 32) --> (X & 32) >> 5

  // TODO: Investigate removing this as it's likely unnecessary given the below

  // `isKnownToBeAPowerOfTwo` check.

  if ((~Known.Zero).isPowerOf2())

    return BinaryOperator::CreateLShr(

        Op0, ConstantInt::get(Ty, (~Known.Zero).exactLogBase2()));


  // More generally we can also handle non-constant power of 2 patterns such as

  // shl/shr(Pow2, X), (X & -X), etc... by transforming:

  // ctpop(Pow2OrZero) --> icmp ne X, 0

  // The i1 compare result is zero-extended back to the intrinsic's type.
  if (IC.isKnownToBeAPowerOfTwo(Op0, /* OrZero */ true))

    return CastInst::Create(Instruction::ZExt,

                            IC.Builder.CreateICmp(ICmpInst::ICMP_NE, Op0,

                                                  Constant::getNullValue(Ty)),

                            Ty);


  // Add range attribute since known bits can't completely reflect what we know.

  // Skipped for 1-bit types and when a range attribute or range metadata is
  // already attached.
  if (BitWidth != 1 && !II.hasRetAttr(Attribute::Range) &&

      !II.getMetadata(LLVMContext::MD_range)) {

    // Bounds come from the minimum and maximum population implied by the
    // known bits; the "+ 1" presumably makes the upper bound exclusive
    // (confirm against ConstantRange).
    ConstantRange Range(APInt(BitWidth, Known.countMinPopulation()),

                        APInt(BitWidth, Known.countMaxPopulation() + 1));

    II.addRangeRetAttr(Range);

    return &II;

  }


  return nullptr;

}


/// Turn a table lookup with a constant mask into a shufflevector.
///
/// This could benefit tbl1 if the mask is { 7,6,5,4,3,2,1,0 }, in which case
/// the shufflevector can be lowered with rev64 instructions as it is actually
/// a byte reverse. Only <8 x i8> results whose mask lanes are all integer
/// constants below 8 are handled.
///
/// \returns the shuffle, or nullptr if the intrinsic does not qualify.
static Value *simplifyNeonTbl1(const IntrinsicInst &II,
                               InstCombiner::BuilderTy &Builder) {
  // The mask must be a constant.
  auto *MaskC = dyn_cast<Constant>(II.getArgOperand(1));
  if (!MaskC)
    return nullptr;

  // Restrict the transform to <8 x i8>.
  auto *ResTy = cast<FixedVectorType>(II.getType());
  const unsigned LaneCount = ResTy->getNumElements();
  if (LaneCount != 8 || !ResTy->getElementType()->isIntegerTy(8))
    return nullptr;

  int ShuffleMask[8];
  for (unsigned Lane = 0; Lane != LaneCount; ++Lane) {
    auto *IdxC =
        dyn_cast_or_null<ConstantInt>(MaskC->getAggregateElement(Lane));
    if (!IdxC)
      return nullptr;

    ShuffleMask[Lane] = IdxC->getLimitedValue();

    // Reject mask indices that are out of range.
    if ((unsigned)ShuffleMask[Lane] >= LaneCount)
      return nullptr;
  }

  auto *Table = II.getArgOperand(0);
  auto *Zeros = Constant::getNullValue(Table->getType());
  return Builder.CreateShuffleVector(Table, Zeros, ArrayRef(ShuffleMask));
}


// Compares the first NumOperands call arguments of the two intrinsics and
// returns true iff each pair is the same value. Both intrinsics must have at
// least NumOperands arguments.
static bool haveSameOperands(const IntrinsicInst &I, const IntrinsicInst &E,
                             unsigned NumOperands) {
  assert(I.arg_size() >= NumOperands && "Not enough operands");
  assert(E.arg_size() >= NumOperands && "Not enough operands");

  // Advance past the matching prefix; a full-length prefix means all match.
  unsigned Idx = 0;
  while (Idx != NumOperands && I.getArgOperand(Idx) == E.getArgOperand(Idx))
    ++Idx;
  return Idx == NumOperands;
}


// Erase a trivially empty start/end intrinsic range: a start immediately
// followed by its end, where debug/pseudo instructions and other start/end
// intrinsics in between are ignored. Since only the most trivial cases are
// handled, the nesting level does not need to be tracked:
//
//   call @llvm.foo.start(i1 0)
//   call @llvm.foo.start(i1 0) ; This one won't be skipped: it will be removed
//   call @llvm.foo.end(i1 0)
//   call @llvm.foo.end(i1 0) ; &I
//
// IsStart identifies start intrinsics. Returns true iff a start/end pair was
// erased.
static bool
removeTriviallyEmptyRange(IntrinsicInst &EndI, InstCombinerImpl &IC,
                          std::function<bool(const IntrinsicInst &)> IsStart) {
  // Scan backwards from the end intrinsic, so that InstCombine has already
  // processed (and potentially removed) everything in front of it.
  const auto ScanEnd = EndI.getParent()->rend();
  for (BasicBlock::reverse_iterator It(EndI); It != ScanEnd; ++It) {
    auto *Candidate = dyn_cast<IntrinsicInst>(&*It);
    // Any non-intrinsic instruction ends the scan.
    if (!Candidate)
      return false;

    // Step over debug/pseudo instructions and other end intrinsics of the
    // same kind.
    if (Candidate->isDebugOrPseudoInst() ||
        Candidate->getIntrinsicID() == EndI.getIntrinsicID())
      continue;

    // An unrelated intrinsic ends the scan as well.
    if (!IsStart(*Candidate))
      return false;

    // Skip start intrinsics that don't pair with this end intrinsic.
    if (!haveSameOperands(EndI, *Candidate, EndI.arg_size()))
      continue;

    IC.eraseInstFromFunction(*Candidate);
    IC.eraseInstFromFunction(EndI);
    return true;
  }

  return false;
}


/// Visit a va_end: erase it together with a directly preceding matching
/// va_start or va_copy when the range between them is trivially empty.
/// Always returns nullptr; the erasure itself is done by
/// removeTriviallyEmptyRange.
Instruction *InstCombinerImpl::visitVAEndInst(VAEndInst &I) {
  auto OpensVARange = [](const IntrinsicInst &Candidate) {
    const Intrinsic::ID ID = Candidate.getIntrinsicID();
    return ID == Intrinsic::vastart || ID == Intrinsic::vacopy;
  };
  removeTriviallyEmptyRange(I, *this, OpensVARange);
  return nullptr;
}


/// If the first argument of \p Call is a constant and the second one is not,
/// swap the two in place so that the constant ends up in position 1.
/// \returns \p Call when the operands were swapped, nullptr otherwise.
static CallInst *canonicalizeConstantArg0ToArg1(CallInst &Call) {
  assert(Call.arg_size() > 1 && "Need at least 2 args to swap");
  Value *First = Call.getArgOperand(0);
  Value *Second = Call.getArgOperand(1);

  const bool ShouldSwap = isa<Constant>(First) && !isa<Constant>(Second);
  if (!ShouldSwap)
    return nullptr;

  Call.setArgOperand(0, Second);
  Call.setArgOperand(1, First);
  return &Call;
}


/// Build the result aggregate of the overflow intrinsic \p II from the value
/// \p Result and the constant \p Overflow flag.
///
/// A constant struct of \p II's type is formed first, with poison in slot 0
/// and \p Overflow in slot 1; \p Result is then placed into slot 0 by the
/// returned insertvalue instruction.
static Instruction *createOverflowTuple(IntrinsicInst *II, Value *Result,
                                        Constant *Overflow) {
  auto *TupleTy = cast<StructType>(II->getType());
  Constant *Fields[] = {PoisonValue::get(Result->getType()), Overflow};
  Constant *Skeleton = ConstantStruct::get(TupleTy, Fields);
  return InsertValueInst::Create(Skeleton, Result, 0);
}


/// Shared fold for with-overflow intrinsics: when OptimizeOverflowCheck
/// succeeds, it supplies the arithmetic result and a constant overflow flag,
/// and the call is replaced by the corresponding result tuple.
/// \returns the replacement instruction, or nullptr if nothing was folded.
Instruction *
InstCombinerImpl::foldIntrinsicWithOverflowCommon(IntrinsicInst *II) {
  auto *WO = cast<WithOverflowInst>(II);
  Value *Arith = nullptr;
  Constant *OverflowBit = nullptr;
  const bool Folded =
      OptimizeOverflowCheck(WO->getBinaryOp(), WO->isSigned(), WO->getLHS(),
                            WO->getRHS(), *WO, Arith, OverflowBit);
  if (!Folded)
    return nullptr;
  return createOverflowTuple(WO, Arith, OverflowBit);
}


/// \returns true if the denormal mode of \p F for the scalar floating-point
/// type underlying \p Ty has DenormalMode::IEEE as its input mode.
static bool inputDenormalIsIEEE(const Function &F, const Type *Ty) {
  const auto &Semantics = Ty->getScalarType()->getFltSemantics();
  return F.getDenormalMode(Semantics).Input == DenormalMode::IEEE;
}


/// \returns true if the denormal mode of \p F for the scalar floating-point
/// type underlying \p Ty reports that inputs are treated as zero
/// (DenormalMode::inputsAreZero()).
static bool inputDenormalIsDAZ(const Function &F, const Type *Ty) {
  const auto &Semantics = Ty->getScalarType()->getFltSemantics();
  return F.getDenormalMode(Semantics).inputsAreZero();
}


/// Map an llvm.is.fpclass test onto an ordered compare against zero.
///
/// \returns the ordered predicate P for which is.fpclass(x, \p Mask) is
/// equivalent to `fcmp P x, 0.0` under the input denormal mode that \p F uses
/// for type \p Ty, or FCmpInst::BAD_FCMP_PREDICATE when \p Mask is not one of
/// the recognised patterns or the denormal mode does not fit the pattern.
static FCmpInst::Predicate fpclassTestIsFCmp0(FPClassTest Mask,
                                              const Function &F, Type *Ty) {
  // Every recognised mask is valid under exactly one input denormal mode:
  // masks that keep subnormals apart from zero need IEEE inputs, masks that
  // group subnormals together with zero need denormal inputs treated as zero.
  FCmpInst::Predicate Pred = FCmpInst::BAD_FCMP_PREDICATE;
  bool NeedsDAZ = false;

  switch (static_cast<unsigned>(Mask)) {
  // x == 0
  case fcZero:
    Pred = FCmpInst::FCMP_OEQ;
    break;
  case fcZero | fcSubnormal:
    Pred = FCmpInst::FCMP_OEQ;
    NeedsDAZ = true;
    break;

  // x >= 0
  case fcPositive | fcNegZero:
    Pred = FCmpInst::FCMP_OGE;
    break;
  case fcPositive | fcNegZero | fcNegSubnormal:
    Pred = FCmpInst::FCMP_OGE;
    NeedsDAZ = true;
    break;

  // x > 0
  case fcPosSubnormal | fcPosNormal | fcPosInf:
    Pred = FCmpInst::FCMP_OGT;
    break;
  case fcPosNormal | fcPosInf:
    Pred = FCmpInst::FCMP_OGT;
    NeedsDAZ = true;
    break;

  // x <= 0
  case fcNegative | fcPosZero:
    Pred = FCmpInst::FCMP_OLE;
    break;
  case fcNegative | fcPosZero | fcPosSubnormal:
    Pred = FCmpInst::FCMP_OLE;
    NeedsDAZ = true;
    break;

  // x < 0
  case fcNegSubnormal | fcNegNormal | fcNegInf:
    Pred = FCmpInst::FCMP_OLT;
    break;
  case fcNegNormal | fcNegInf:
    Pred = FCmpInst::FCMP_OLT;
    NeedsDAZ = true;
    break;

  // x != 0 (ordered)
  case ~fcZero & ~fcNan:
    Pred = FCmpInst::FCMP_ONE;
    break;
  case ~(fcZero | fcSubnormal) & ~fcNan:
    Pred = FCmpInst::FCMP_ONE;
    NeedsDAZ = true;
    break;

  default:
    // Unrecognised mask: bail out without querying the denormal mode.
    return FCmpInst::BAD_FCMP_PREDICATE;
  }

  const bool ModeFits =
      NeedsDAZ ? inputDenormalIsDAZ(F, Ty) : inputDenormalIsIEEE(F, Ty);
  return ModeFits ? Pred : FCmpInst::BAD_FCMP_PREDICATE;
}


/// Try to simplify a call to llvm.is.fpclass(x, mask).
///
/// The folds are attempted in this order:
///   1. Look through fneg/fabs of the tested value by rewriting the mask.
///   2. Outside of strictfp functions, rewrite tests for infinities, NaN and
///      comparisons against zero as a plain fcmp.
///   3. Use computeKnownFPClass to drop mask bits that cannot be set, or fold
///      the whole test to true when the mask equals the set of possible
///      classes.
///
/// \returns the updated or replacement instruction, or nullptr when nothing
/// changed.
Instruction *InstCombinerImpl::foldIntrinsicIsFPClass(IntrinsicInst &II) {
  Value *Val = II.getArgOperand(0);
  Value *MaskOp = II.getArgOperand(1);
  Type *ValTy = Val->getType();
  Type *MaskTy = MaskOp->getType();

  const auto Mask =
      static_cast<FPClassTest>(cast<ConstantInt>(MaskOp)->getZExtValue());

  // The NaN part of the mask selects between ordered and unordered compares.
  // A mask with only part of fcNan set is neither.
  const FPClassTest NanPart = Mask & fcNan;
  const bool IsUnordered = NanPart == fcNan;
  const bool IsOrdered = NanPart == fcNone;
  const FPClassTest OrderedMask = Mask & ~fcNan;
  const FPClassTest OrderedInvertedMask = ~OrderedMask & ~fcNan;

  // Rewrites into fcmp are skipped in strictfp functions.
  const bool IsStrict =
      II.getFunction()->getAttributes().hasFnAttr(Attribute::StrictFP);
  const bool CanUseFCmp = !IsStrict;
  const bool CanUseOrderedFCmp = CanUseFCmp && (IsOrdered || IsUnordered);

  // is.fpclass (fneg x), mask -> is.fpclass x, (fneg mask)
  Value *FNegSrc;
  if (match(Val, m_FNeg(m_Value(FNegSrc)))) {
    II.setArgOperand(1, ConstantInt::get(MaskTy, fneg(Mask)));
    return replaceOperand(II, 0, FNegSrc);
  }

  // is.fpclass (fabs x), mask -> is.fpclass x, (inverse_fabs mask)
  Value *FAbsSrc;
  if (match(Val, m_FAbs(m_Value(FAbsSrc)))) {
    II.setArgOperand(1, ConstantInt::get(MaskTy, inverse_fabs(Mask)));
    return replaceOperand(II, 0, FAbsSrc);
  }

  // Tests for "either infinity" or its complement:
  //   is.fpclass(x, fcInf)           -> fcmp oeq fabs(x), +inf
  //   is.fpclass(x, ~fcInf)          -> fcmp one fabs(x), +inf
  //   is.fpclass(x, fcInf|fcNan)     -> fcmp ueq fabs(x), +inf
  //   is.fpclass(x, ~(fcInf|fcNan))  -> fcmp une fabs(x), +inf
  if (CanUseOrderedFCmp &&
      (OrderedMask == fcInf || OrderedInvertedMask == fcInf)) {
    FCmpInst::Predicate Pred;
    if (OrderedInvertedMask == fcInf)
      Pred = IsUnordered ? FCmpInst::FCMP_UNE : FCmpInst::FCMP_ONE;
    else
      Pred = IsUnordered ? FCmpInst::FCMP_UEQ : FCmpInst::FCMP_OEQ;

    Constant *Inf = ConstantFP::getInfinity(ValTy);
    Value *Fabs = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, Val);
    Value *CmpInf = Builder.CreateFCmp(Pred, Fabs, Inf);
    CmpInf->takeName(&II);
    return replaceInstUsesWith(II, CmpInf);
  }

  // Tests for one specific infinity:
  //   is.fpclass(x, fcPosInf)        -> fcmp oeq x, +inf
  //   is.fpclass(x, fcNegInf)        -> fcmp oeq x, -inf
  //   is.fpclass(x, fcPosInf|fcNan)  -> fcmp ueq x, +inf
  //   is.fpclass(x, fcNegInf|fcNan)  -> fcmp ueq x, -inf
  if (CanUseOrderedFCmp &&
      (OrderedMask == fcPosInf || OrderedMask == fcNegInf)) {
    Constant *Inf =
        ConstantFP::getInfinity(ValTy, /*Negative=*/OrderedMask == fcNegInf);
    Value *EqInf = Builder.CreateFCmp(
        IsUnordered ? FCmpInst::FCMP_UEQ : FCmpInst::FCMP_OEQ, Val, Inf);
    EqInf->takeName(&II);
    return replaceInstUsesWith(II, EqInf);
  }

  // Tests for "anything but one specific infinity":
  //   is.fpclass(x, ~fcPosInf)        -> fcmp one x, +inf
  //   is.fpclass(x, ~fcNegInf)        -> fcmp one x, -inf
  //   is.fpclass(x, ~fcPosInf|fcNan)  -> fcmp une x, +inf
  //   is.fpclass(x, ~fcNegInf|fcNan)  -> fcmp une x, -inf
  if (CanUseOrderedFCmp &&
      (OrderedInvertedMask == fcPosInf || OrderedInvertedMask == fcNegInf)) {
    Constant *Inf = ConstantFP::getInfinity(
        ValTy, /*Negative=*/OrderedInvertedMask == fcNegInf);
    Value *NeInf = Builder.CreateFCmp(
        IsUnordered ? FCmpInst::FCMP_UNE : FCmpInst::FCMP_ONE, Val, Inf);
    NeInf->takeName(&II);
    return replaceInstUsesWith(II, NeInf);
  }

  // isnan(x): use a standard fcmp when FP exceptions are of no concern.
  if (CanUseFCmp && Mask == fcNan) {
    Value *IsNan = Builder.CreateFCmpUNO(Val, ConstantFP::getZero(ValTy));
    IsNan->takeName(&II);
    return replaceInstUsesWith(II, IsNan);
  }

  // !isnan(x): likewise a standard fcmp.
  if (CanUseFCmp && Mask == (~fcNan & fcAllFlags)) {
    Value *NotNan = Builder.CreateFCmpORD(Val, ConstantFP::getZero(ValTy));
    NotNan->takeName(&II);
    return replaceInstUsesWith(II, NotNan);
  }

  // Try to express the test as an fcmp against 0:
  //
  //   is.fpclass(x, fcZero)          -> fcmp oeq x, 0.0
  //   is.fpclass(x, fcZero | fcNan)  -> fcmp ueq x, 0.0
  //   is.fpclass(x, ~fcZero & ~fcNan) -> fcmp one x, 0.0
  //   is.fpclass(x, ~fcZero)         -> fcmp une x, 0.0
  //
  //   is.fpclass(x, fcPosSubnormal | fcPosNormal | fcPosInf) -> fcmp ogt x, 0.0
  //   is.fpclass(x, fcPositive | fcNegZero)                  -> fcmp oge x, 0.0
  //
  //   is.fpclass(x, fcNegSubnormal | fcNegNormal | fcNegInf) -> fcmp olt x, 0.0
  //   is.fpclass(x, fcNegative | fcPosZero)                  -> fcmp ole x, 0.0
  if (CanUseOrderedFCmp) {
    FCmpInst::Predicate ZeroPred =
        fpclassTestIsFCmp0(OrderedMask, *II.getFunction(), ValTy);
    if (ZeroPred != FCmpInst::BAD_FCMP_PREDICATE) {
      if (IsUnordered)
        ZeroPred = FCmpInst::getUnorderedPredicate(ZeroPred);
      Constant *Zero = ConstantFP::getZero(ValTy);
      Value *FCmp = Builder.CreateFCmp(ZeroPred, Val, Zero);
      FCmp->takeName(&II);
      return replaceInstUsesWith(II, FCmp);
    }
  }

  KnownFPClass Known = computeKnownFPClass(Val, Mask, &II);
  const FPClassTest Possible = Mask & Known.KnownFPClasses;

  // Remove test bits that the source value is known never to satisfy.
  //   fp_class (nnan x), qnan|snan|other -> fp_class (nnan x), other
  //   fp_class (ninf x), ninf|pinf|other -> fp_class (ninf x), other
  if (Possible != Mask) {
    II.setArgOperand(1, ConstantInt::get(MaskTy, Possible));
    return &II;
  }

  // If no class that would make the test false is possible, fold to true.
  //   fp_class (nnan x), ~(qnan|snan) -> true
  //   fp_class (ninf x), ~(ninf|pinf) -> true
  if (Mask == Known.KnownFPClasses)
    return replaceInstUsesWith(II, ConstantInt::get(II.getType(), true));

  return nullptr;
}


/// Try to determine the sign of \p Op.
///
/// \returns false if the known bits show \p Op is non-negative and true if
/// they show it is negative. Otherwise, when \p Op is `sub nsw X, Y`, returns
/// whatever isImpliedByDomCondition reports for `X <s Y` at SQ.CxtI. In all
/// other cases returns std::nullopt.
static std::optional<bool> getKnownSign(Value *Op, const SimplifyQuery &SQ) {
  const KnownBits Bits = computeKnownBits(Op, /*Depth=*/0, SQ);
  const bool NonNegative = Bits.isNonNegative();
  if (NonNegative || Bits.isNegative())
    return !NonNegative;

  Value *LHS, *RHS;
  if (!match(Op, m_NSWSub(m_Value(LHS), m_Value(RHS))))
    return std::nullopt;

  return isImpliedByDomCondition(ICmpInst::ICMP_SLT, LHS, RHS, SQ.CxtI, SQ.DL);
}


/// Variant of getKnownSign with a weaker fallback.
///
/// \returns the answer of getKnownSign when it has one. Otherwise, when \p Op
/// is `sub nsw X, Y`, returns whatever isImpliedByDomCondition reports for
/// `X <=s Y` at SQ.CxtI. In all other cases returns std::nullopt.
static std::optional<bool> getKnownSignOrZero(Value *Op,
                                              const SimplifyQuery &SQ) {
  const std::optional<bool> Sign = getKnownSign(Op, SQ);
  if (Sign.has_value())
    return Sign;

  Value *LHS, *RHS;
  if (!match(Op, m_NSWSub(m_Value(LHS), m_Value(RHS))))
    return std::nullopt;

  return isImpliedByDomCondition(ICmpInst::ICMP_SLE, LHS, RHS, SQ.CxtI, SQ.DL);
}


/// \returns true only if getKnownSign yields an answer for both \p Op0 and
/// \p Op1 and the two answers agree.
static bool signBitMustBeTheSame(Value *Op0, Value *Op1,
                                 const SimplifyQuery &SQ) {
  // Op1 is queried first; Op0 is only analysed once Op1's sign is known.
  const std::optional<bool> Sign1 = getKnownSign(Op1, SQ);
  if (!Sign1.has_value())
    return false;

  const std::optional<bool> Sign0 = getKnownSign(Op0, SQ);
  return Sign0.has_value() && *Sign0 == *Sign1;
}


/// Try to canonicalize min/max(X + C0, C1) as min/max(X, C1 - C0) + C0, which
/// can expose further combines.
///
/// Requires a one-use add of a constant whose no-wrap flag matches the
/// signedness of the min/max (nsw for smin/smax, nuw for umin/umax).
/// \returns the new add instruction, or nullptr if the pattern does not match.
static Instruction *moveAddAfterMinMax(IntrinsicInst *II,
                                       InstCombiner::BuilderTy &Builder) {
  const Intrinsic::ID MinMaxID = II->getIntrinsicID();
  const bool IsSigned =
      MinMaxID == Intrinsic::smax || MinMaxID == Intrinsic::smin;
  assert((IsSigned || MinMaxID == Intrinsic::umax ||
          MinMaxID == Intrinsic::umin) &&
         "Expected a min or max intrinsic");

  // TODO: Match vectors with undef elements, but undef may not propagate.
  Value *AddOp = II->getArgOperand(0);
  Value *X;
  const APInt *AddC, *LimitC;
  if (!match(AddOp, m_OneUse(m_Add(m_Value(X), m_APInt(AddC)))))
    return nullptr;
  if (!match(II->getArgOperand(1), m_APInt(LimitC)))
    return nullptr;

  // The add must not wrap in the sense that matches the min/max signedness.
  auto *Add = cast<BinaryOperator>(AddOp);
  const bool AddCannotWrap =
      IsSigned ? Add->hasNoSignedWrap() : Add->hasNoUnsignedWrap();
  if (!AddCannotWrap)
    return nullptr;

  // If the constant difference overflowed, instsimplify is expected to have
  // already reduced the min/max to the add or to C1.
  bool Overflow;
  APInt CDiff = IsSigned ? LimitC->ssub_ov(*AddC, Overflow)
                         : LimitC->usub_ov(*AddC, Overflow);
  assert(!Overflow && "Expected simplify of min/max");

  // min/max (add X, C0), C1 --> add (min/max X, C1 - C0), C0
  // Only the no-wrap flag matching the min/max signedness is set on the new
  // add; the "mismatched" flag does not propagate.
  Constant *NewLimit = ConstantInt::get(II->getType(), CDiff);
  Value *NewMinMax = Builder.CreateBinaryIntrinsic(MinMaxID, X, NewLimit);
  Value *AddRHS = Add->getOperand(1);
  if (IsSigned)
    return BinaryOperator::CreateNSWAdd(NewMinMax, AddRHS);
  return BinaryOperator::CreateNUWAdd(NewMinMax, AddRHS);
}

/// Recognise a signed saturating add/sub that was spelled out as a wide
/// add/sub clamped with smin/smax, and replace it with sadd.sat/ssub.sat on a
/// narrower type followed by a sext.
/// \returns the sext instruction, or nullptr if the pattern does not match.
Instruction *InstCombinerImpl::matchSAddSubSat(IntrinsicInst &MinMax1) {
  Type *Ty = MinMax1.getType();

  // The expected shape is
  //   max(INT_MIN, min(INT_MAX, add(sext(A), sext(B))))
  // with the min and the max in either nesting order.
  Instruction *MinMax2;
  BinaryOperator *AddSub;
  const APInt *MinValue, *MaxValue;
  const bool OuterIsSMin =
      match(&MinMax1, m_SMin(m_Instruction(MinMax2), m_APInt(MaxValue)));
  if (OuterIsSMin) {
    if (!match(MinMax2, m_SMax(m_BinOp(AddSub), m_APInt(MinValue))))
      return nullptr;
  } else if (match(&MinMax1,
                   m_SMax(m_Instruction(MinMax2), m_APInt(MinValue)))) {
    if (!match(MinMax2, m_SMin(m_BinOp(AddSub), m_APInt(MaxValue))))
      return nullptr;
  } else {
    return nullptr;
  }

  // The clamp bounds must describe a saturation range: MaxValue + 1 is a power
  // of two and MinValue is its negation.
  const APInt UpperBound = *MaxValue + 1;
  if (!UpperBound.isPowerOf2() || -*MinValue != UpperBound)
    return nullptr;

  // Bit width in which the clamp can be treated as saturating arithmetic.
  const unsigned NewBitWidth = UpperBound.logBase2() + 1;
  // FIXME: This isn't quite right for vectors, but using the scalar type is a
  // good first approximation for what should be done there.
  if (!shouldChangeType(Ty->getScalarType()->getIntegerBitWidth(), NewBitWidth))
    return nullptr;

  // The inner min/max and the add/sub must each have a single use.
  if (!MinMax2->hasOneUse() || !AddSub->hasOneUse())
    return nullptr;

  // Narrow type for the saturating operation (may be a vector type).
  Type *NewTy = Ty->getWithNewBitWidth(NewBitWidth);

  Intrinsic::ID IntrinsicID;
  switch (AddSub->getOpcode()) {
  case Instruction::Add:
    IntrinsicID = Intrinsic::sadd_sat;
    break;
  case Instruction::Sub:
    IntrinsicID = Intrinsic::ssub_sat;
    break;
  default:
    return nullptr;
  }

  // Both add/sub operands must be nsw-truncatable to NewTy, which is usually
  // the case because they are sign-extended from a smaller type.
  Value *LHS = AddSub->getOperand(0);
  Value *RHS = AddSub->getOperand(1);
  auto FitsInNewWidth = [&](Value *V) {
    return ComputeMaxSignificantBits(V, 0, AddSub) <= NewBitWidth;
  };
  if (!FitsInNewWidth(LHS) || !FitsInNewWidth(RHS))
    return nullptr;

  // Emit the saturating intrinsic on truncated operands and extend its result
  // back to the original type.
  Function *F = Intrinsic::getDeclaration(MinMax1.getModule(), IntrinsicID, NewTy);
  Value *AT = Builder.CreateTrunc(LHS, NewTy);
  Value *BT = Builder.CreateTrunc(RHS, NewTy);
  Value *Sat = Builder.CreateCall(F, {AT, BT});
  return CastInst::Create(Instruction::SExt, Sat, Ty);
}


/// Turn a clamp whose result can only be one of two adjacent constants, such
/// as max (min X, 42), 41, into a select between those two constants.
/// \returns the select instruction, or nullptr if the pattern does not match.
static Instruction *foldClampRangeOfTwo(IntrinsicInst *II,
                                        InstCombiner::BuilderTy &Builder) {
  Value *Inner = II->getArgOperand(0);
  Value *OuterOp = II->getArgOperand(1);
  const APInt *InnerC, *OuterC;
  if (!match(OuterOp, m_APInt(OuterC)) || !Inner->hasOneUse())
    return nullptr;

  // For every outer min/max, the inner operand must be the opposite min/max
  // of the same signedness with a constant limit.
  Value *X;
  bool InnerMatches = false;
  bool OuterIsMax = false;
  CmpInst::Predicate Pred = CmpInst::BAD_ICMP_PREDICATE;
  switch (II->getIntrinsicID()) {
  case Intrinsic::smax:
    InnerMatches = match(Inner, m_SMin(m_Value(X), m_APInt(InnerC)));
    OuterIsMax = true;
    Pred = ICmpInst::ICMP_SGT;
    break;
  case Intrinsic::smin:
    InnerMatches = match(Inner, m_SMax(m_Value(X), m_APInt(InnerC)));
    Pred = ICmpInst::ICMP_SLT;
    break;
  case Intrinsic::umax:
    InnerMatches = match(Inner, m_UMin(m_Value(X), m_APInt(InnerC)));
    OuterIsMax = true;
    Pred = ICmpInst::ICMP_UGT;
    break;
  case Intrinsic::umin:
    InnerMatches = match(Inner, m_UMax(m_Value(X), m_APInt(InnerC)));
    Pred = ICmpInst::ICMP_ULT;
    break;
  default:
    llvm_unreachable("Expected min/max intrinsic");
  }
  if (!InnerMatches)
    return nullptr;

  // The two limits must be adjacent: for an outer max the inner limit is one
  // above the outer limit, for an outer min it is one below.
  const bool Adjacent =
      OuterIsMax ? *InnerC == *OuterC + 1 : *OuterC == *InnerC + 1;
  if (!Adjacent)
    return nullptr;

  // max (min X, 42), 41 --> X > 41 ? 42 : 41
  // min (max X, 42), 43 --> X < 43 ? 42 : 43
  Value *Cmp = Builder.CreateICmp(Pred, X, OuterOp);
  Constant *InnerLimit = ConstantInt::get(II->getType(), *InnerC);
  return SelectInst::Create(Cmp, InnerLimit, OuterOp);
}


/// When a min/max with a constant operand has, as its first operand, a
/// compatible min/max that also has a constant operand, combine the two
/// constants so that only a single min/max of X remains.
/// \returns the new intrinsic call, or nullptr if the pattern does not match.
static Value *reassociateMinMaxWithConstants(IntrinsicInst *II,
                                             IRBuilderBase &Builder,
                                             const SimplifyQuery &SQ) {
  auto *Inner = dyn_cast<MinMaxIntrinsic>(II->getArgOperand(0));
  if (!Inner)
    return nullptr;

  Constant *InnerC, *OuterC;
  if (!match(Inner->getArgOperand(1), m_ImmConstant(InnerC)) ||
      !match(II->getArgOperand(1), m_ImmConstant(OuterC)))
    return nullptr;

  // Accepted combinations:
  //   max (max X, C0), C1 --> max X, (max C0, C1)
  //   min (min X, C0), C1 --> min X, (min C0, C1)
  //   umax (smax X, nneg C0), nneg C1 --> smax X, (umax C0, C1)
  //   smin (umin X, nneg C0), nneg C1 --> umin X, (smin C0, C1)
  const Intrinsic::ID OuterID = II->getIntrinsicID();
  const Intrinsic::ID InnerID = Inner->getIntrinsicID();
  if (InnerID != OuterID) {
    const bool MixedSignPair =
        (OuterID == Intrinsic::umax && InnerID == Intrinsic::smax) ||
        (OuterID == Intrinsic::smin && InnerID == Intrinsic::umin);
    // Mixing signedness is only handled for non-negative constants.
    if (!MixedSignPair || !isKnownNonNegative(InnerC, SQ) ||
        !isKnownNonNegative(OuterC, SQ))
      return nullptr;
  }

  // Combine the constants with the outer operation, then apply the inner
  // operation to X and the combined constant.
  ICmpInst::Predicate Pred = MinMaxIntrinsic::getPredicate(OuterID);
  Value *PickInner = Builder.CreateICmp(Pred, InnerC, OuterC);
  Value *MergedC = Builder.CreateSelect(PickInner, InnerC, OuterC);
  return Builder.CreateIntrinsic(InnerID, II->getType(),
                                 {Inner->getArgOperand(0), MergedC});
}


/// When one operand of this min/max is a one-use min/max of the same kind
/// with a constant operand, move that constant out to this instruction:
///   max (max X, C), Y --> max (max X, Y), C
/// This can enable more folds.
/// \returns the new outer call, or nullptr if the pattern does not match.
static Instruction *
reassociateMinMaxWithConstantInOperand(IntrinsicInst *II,
                                       InstCombiner::BuilderTy &Builder) {
  // Capture a candidate inner min/max (in either operand position) together
  // with the remaining operand Y.
  Value *X, *Y;
  Constant *C;
  Instruction *Inner;
  if (!match(II, m_c_MaxOrMin(m_OneUse(m_CombineAnd(
                                  m_Instruction(Inner),
                                  m_MaxOrMin(m_Value(X), m_ImmConstant(C)))),
                              m_Value(Y))))
    return nullptr;

  // The inner operation has to be the same intrinsic as the outer one.
  const Intrinsic::ID MinMaxID = II->getIntrinsicID();
  auto *InnerMM = dyn_cast<IntrinsicInst>(Inner);
  if (!InnerMM || InnerMM->getIntrinsicID() != MinMaxID)
    return nullptr;

  // Reject constant X or Y to avoid infinite loops.
  if (match(X, m_ImmConstant()) || match(Y, m_ImmConstant()))
    return nullptr;

  // max (max X, C), Y --> max (max X, Y), C
  Function *MinMax =
      Intrinsic::getDeclaration(II->getModule(), MinMaxID, II->getType());
  Value *NewInner = Builder.CreateBinaryIntrinsic(MinMaxID, X, Y);
  NewInner->takeName(Inner);
  return CallInst::Create(MinMax, {NewInner, C});
}


/// Simplify a min/max of two min/max calls of the same kind that share an
/// operand: the shared operand only needs to take part once, so one of the
/// two inner calls is reused and combined with the other call's remaining
/// operand.
/// \returns the new call, or nullptr if the pattern does not match.
static Instruction *factorizeMinMaxTree(IntrinsicInst *II) {
  // Both operands must be the same intrinsic as II, e.g. umin(umin(), umin()),
  // and at least one of them must have no other use.
  const Intrinsic::ID MinMaxID = II->getIntrinsicID();
  auto *LHS = dyn_cast<IntrinsicInst>(II->getArgOperand(0));
  auto *RHS = dyn_cast<IntrinsicInst>(II->getArgOperand(1));
  if (!LHS || !RHS)
    return nullptr;
  if (LHS->getIntrinsicID() != MinMaxID || RHS->getIntrinsicID() != MinMaxID)
    return nullptr;

  const bool LHSHasOneUse = LHS->hasOneUse();
  if (!LHSHasOneUse && !RHS->hasOneUse())
    return nullptr;

  Value *A = LHS->getArgOperand(0);
  Value *B = LHS->getArgOperand(1);
  Value *C = RHS->getArgOperand(0);
  Value *D = RHS->getArgOperand(1);

  // Pick the inner call to keep and the one operand of the other inner call
  // that is not shared.
  Value *MinMaxOp = nullptr;
  Value *ThirdOp = nullptr;
  if (LHSHasOneUse) {
    // The LHS is only used in this chain, so keep the RHS (which may have
    // other users); that makes the LHS dead.
    MinMaxOp = RHS;
    if (D == A || C == A) {
      // A is shared:
      //   min(min(a, b), min(c, a)) --> min(min(c, a), b)
      //   min(min(a, b), min(a, d)) --> min(min(a, d), b)
      ThirdOp = B;
    } else if (D == B || C == B) {
      // B is shared:
      //   min(min(a, b), min(c, b)) --> min(min(c, b), a)
      //   min(min(a, b), min(b, d)) --> min(min(b, d), a)
      ThirdOp = A;
    }
  } else {
    assert(RHS->hasOneUse() && "Expected one-use operand");
    // Keep the LHS; that makes the RHS dead.
    MinMaxOp = LHS;
    if (D == A || D == B) {
      // D is shared:
      //   min(min(a, b), min(c, a)) --> min(min(a, b), c)
      //   min(min(a, b), min(c, b)) --> min(min(a, b), c)
      ThirdOp = C;
    } else if (C == A || C == B) {
      // C is shared:
      //   min(min(a, b), min(a, d)) --> min(min(a, b), d)
      //   min(min(a, b), min(b, d)) --> min(min(a, b), d)
      ThirdOp = D;
    }
  }

  // No shared operand was found.
  if (!ThirdOp)
    return nullptr;

  Function *MinMax =
      Intrinsic::getDeclaration(II->getModule(), MinMaxID, II->getType());
  return CallInst::Create(MinMax, {MinMaxOp, ThirdOp});
}


/// When every argument of the intrinsic is a unary shuffle with one and the
/// same mask, apply the intrinsic to the unshuffled sources and shuffle the
/// result instead:
///   intrinsic (shuf X, M), (shuf Y, M), ... --> shuf (intrinsic X, Y, ...), M
/// \returns the new shuffle, or nullptr if the pattern does not match.
static Instruction *
foldShuffledIntrinsicOperands(IntrinsicInst *II,
                              InstCombiner::BuilderTy &Builder) {
  // TODO: This should be extended to handle other intrinsics like fshl, ctpop,
  //       etc. Use llvm::isTriviallyVectorizable() and related to determine
  //       which intrinsics are safe to shuffle?
  const Intrinsic::ID IID = II->getIntrinsicID();
  switch (IID) {
  case Intrinsic::smax:
  case Intrinsic::smin:
  case Intrinsic::umax:
  case Intrinsic::umin:
  case Intrinsic::fma:
  case Intrinsic::fshl:
  case Intrinsic::fshr:
    break;
  default:
    return nullptr;
  }

  // The first argument fixes the mask that all other arguments must share.
  Value *FirstSrc;
  ArrayRef<int> Mask;
  if (!match(II->getArgOperand(0),
             m_Shuffle(m_Value(FirstSrc), m_Undef(), m_Mask(Mask))))
    return nullptr;

  // Two instructions are created, so at least one operand must have a single
  // use.
  if (none_of(II->args(), [](Value *Arg) { return Arg->hasOneUse(); }))
    return nullptr;

  // Gather the shuffle sources; every one must use the same mask and have the
  // same type as the first source.
  Type *SrcTy = FirstSrc->getType();
  SmallVector<Value *, 4> NewArgs;
  NewArgs.push_back(FirstSrc);
  for (unsigned Idx = 1, NumArgs = II->arg_size(); Idx != NumArgs; ++Idx) {
    Value *Src;
    if (!match(II->getArgOperand(Idx),
               m_Shuffle(m_Value(Src), m_Undef(), m_SpecificMask(Mask))))
      return nullptr;
    if (Src->getType() != SrcTy)
      return nullptr;
    NewArgs.push_back(Src);
  }

  // Pass the original call along as the fast-math source when it is an FP
  // operation.
  Instruction *FPI = isa<FPMathOperator>(II) ? II : nullptr;
  Value *NewIntrinsic = Builder.CreateIntrinsic(IID, SrcTy, NewArgs, FPI);
  return new ShuffleVectorInst(NewIntrinsic, Mask);
}


/// Push a bswap/bitreverse through a one-use bitwise logic op whose operands
/// are themselves bswap/bitreverse results. \p V is the operand of the outer
/// bswap/bitreverse; \p IntrID selects which of the two intrinsics is handled:
///   bswap(logic_op(bswap(x), y)) --> logic_op(x, bswap(y))
///   bswap(logic_op(bswap(x), bswap(y))) --> logic_op(x, y) (ignores multiuse)
/// \returns the new logic op, or nullptr if the pattern does not match.
template <Intrinsic::ID IntrID>
static Instruction *foldBitOrderCrossLogicOp(Value *V,
                                             InstCombiner::BuilderTy &Builder) {
  static_assert(IntrID == Intrinsic::bswap || IntrID == Intrinsic::bitreverse,
                "This helper only supports BSWAP and BITREVERSE intrinsics");

  Value *X, *Y;
  if (!match(V, m_OneUse(m_BitwiseLogic(m_Value(X), m_Value(Y)))))
    return nullptr;

  // Insist on a real BinaryOperator so that a ConstantExpr, which is not
  // meaningful for this transform, is never handled.
  auto *Logic = dyn_cast<BinaryOperator>(V);
  if (!Logic)
    return nullptr;
  const BinaryOperator::BinaryOps Op = Logic->getOpcode();

  Value *InnerX, *InnerY;
  const bool XIsReorder = match(X, m_Intrinsic<IntrID>(m_Value(InnerX)));
  const bool YIsReorder = match(Y, m_Intrinsic<IntrID>(m_Value(InnerY)));

  // With both operands reordered the instruction count drops even when the
  // operands have other users.
  if (XIsReorder && YIsReorder)
    return BinaryOperator::Create(Op, InnerX, InnerY);

  // With only one reordered operand, that operand must have a single use.
  if (XIsReorder && X->hasOneUse()) {
    Value *NewReorder = Builder.CreateUnaryIntrinsic(IntrID, Y);
    return BinaryOperator::Create(Op, InnerX, NewReorder);
  }

  if (YIsReorder && Y->hasOneUse()) {
    Value *NewReorder = Builder.CreateUnaryIntrinsic(IntrID, X);
    return BinaryOperator::Create(Op, NewReorder, InnerY);
  }

  return nullptr;
}


/// If \p Arg merely permutes the lanes of another vector (a vector reverse,
/// or a single-source fixed-width shuffle that uses every mask index exactly
/// once), return that other vector. Only attempted when \p CanReorderLanes is
/// true.
/// \returns the unpermuted source vector, or nullptr if no such
/// simplification applies.
static Value *simplifyReductionOperand(Value *Arg, bool CanReorderLanes) {
  if (!CanReorderLanes)
    return nullptr;

  Value *Src;
  if (match(Arg, m_VecReverse(m_Value(Src))))
    return Src;

  if (!isa<FixedVectorType>(Arg->getType()))
    return nullptr;

  ArrayRef<int> Mask;
  if (!match(Arg, m_Shuffle(m_Value(Src), m_Undef(), m_Mask(Mask))))
    return nullptr;
  if (!cast<ShuffleVectorInst>(Arg)->isSingleSource())
    return nullptr;

  // Record which indices the mask selects; a poison element or a repeated
  // index means the shuffle is not a pure permutation.
  int Sz = Mask.size();
  SmallBitVector Seen(Sz);
  for (int Lane : Mask) {
    if (Lane == PoisonMaskElem)
      return nullptr;
    if (Seen.test(Lane))
      return nullptr;
    Seen.set(Lane);
  }

  // The shuffle can be dropped iff it only reorders elements: no repeats, no
  // undefs, no other changes.
  if (!Seen.all())
    return nullptr;
  return Src;
}


/// Fold an unsigned minimum of a trailing/leading zero count and a constant
/// by planting a set bit in the counted value instead:
///   umin(cttz(CtOp, ZeroUndef), ConstOp) --> cttz(CtOp | (1 << ConstOp))
///   umin(ctlz(CtOp, ZeroUndef), ConstOp) --> ctlz(CtOp | (SignedMin
///                                              >> ConstOp))
/// \p I0 and \p I1 are the operands of the umin; \p IntrID selects cttz or
/// ctlz.
/// \returns the new count intrinsic, or nullptr if the pattern does not match.
template <Intrinsic::ID IntrID>
static Value *
foldMinimumOverTrailingOrLeadingZeroCount(Value *I0, Value *I1,
                                          const DataLayout &DL,
                                          InstCombiner::BuilderTy &Builder) {
  static_assert(IntrID == Intrinsic::cttz || IntrID == Intrinsic::ctlz,
                "This helper only supports cttz and ctlz intrinsics");

  Value *CtOp;
  Value *ZeroUndef;
  if (!match(I0,
             m_OneUse(m_Intrinsic<IntrID>(m_Value(CtOp), m_Value(ZeroUndef)))))
    return nullptr;

  Type *Ty = I1->getType();
  const unsigned BitWidth = Ty->getScalarSizeInBits();
  auto BelowBitWidth = [BitWidth](auto &C) { return C.ult(BitWidth); };
  // Give up on a constant >= BitWidth (which can be handled by CVP) and on a
  // non-splat vector that mixes elements < and >= BitWidth.
  if (!match(I1, m_CheckedInt(BelowBitWidth)))
    return nullptr;

  // cttz: shift the lowest bit left; ctlz: shift the sign bit right.
  constexpr bool IsCttz = IntrID == Intrinsic::cttz;
  const Instruction::BinaryOps ShiftOp =
      IsCttz ? Instruction::Shl : Instruction::LShr;
  Constant *Seed =
      IsCttz ? ConstantInt::get(Ty, 1)
             : ConstantInt::get(Ty, APInt::getSignedMinValue(BitWidth));
  Constant *NewConst =
      ConstantFoldBinaryOpOperands(ShiftOp, Seed, cast<Constant>(I1), DL);

  // The new count is emitted with its second argument set to true.
  Value *Marked = Builder.CreateOr(CtOp, NewConst);
  return Builder.CreateBinaryIntrinsic(
      IntrID, Marked, ConstantInt::getTrue(ZeroUndef->getType()));
}


/// CallInst simplification. This mostly only handles folding of intrinsic

/// instructions. For normal calls, it allows visitCallBase to do the heavy

/// lifting.

Instruction *InstCombinerImpl::visitCallInst(CallInst &CI) {

  // Don't try to simplify calls without uses. It will not do anything useful,

  // but will result in the following folds being skipped.

  if (!CI.use_empty()) {

    SmallVector<Value *, 4> Args;

    Args.reserve(CI.arg_size());

    for (Value *Op : CI.args())

      Args.push_back(Op);

    if (Value *V = simplifyCall(&CI, CI.getCalledOperand(), Args,

                                SQ.getWithInstruction(&CI)))

      return replaceInstUsesWith(CI, V);

  }


  if (Value *FreedOp = getFreedOperand(&CI, &TLI))

    return visitFree(CI, FreedOp);


  // If the caller function (i.e. us, the function that contains this CallInst)

  // is nounwind, mark the call as nounwind, even if the callee isn't.

  if (CI.getFunction()->doesNotThrow() && !CI.doesNotThrow()) {

    CI.setDoesNotThrow();

    return &CI;

  }


  IntrinsicInst *II = dyn_cast<IntrinsicInst>(&CI);

  if (!II) return visitCallBase(CI);


  // For atomic unordered mem intrinsics, if the length is negative or is

  // not a multiple of the element size, then the behavior is undefined.

  if (auto *AMI = dyn_cast<AtomicMemIntrinsic>(II))

    if (ConstantInt *NumBytes = dyn_cast<ConstantInt>(AMI->getLength()))

      if (NumBytes->isNegative() ||

          (NumBytes->getZExtValue() % AMI->getElementSizeInBytes() != 0)) {

        CreateNonTerminatorUnreachable(AMI);

        assert(AMI->getType()->isVoidTy() &&

               "non void atomic unordered mem intrinsic");

        return eraseInstFromFunction(*AMI);

      }


  // Intrinsics cannot occur in an invoke or a callbr, so handle them here

  // instead of in visitCallBase.

  if (auto *MI = dyn_cast<AnyMemIntrinsic>(II)) {

    bool Changed = false;


    // memmove/cpy/set of zero bytes is a noop.

    if (Constant *NumBytes = dyn_cast<Constant>(MI->getLength())) {

      if (NumBytes->isNullValue())

        return eraseInstFromFunction(CI);

    }


    // No other transformations apply to volatile transfers.

    if (auto *M = dyn_cast<MemIntrinsic>(MI))

      if (M->isVolatile())

        return nullptr;


    // If we have a memmove and the source operation is a constant global,

    // then the source and dest pointers can't alias, so we can change this

    // into a call to memcpy.

    if (auto *MMI = dyn_cast<AnyMemMoveInst>(MI)) {

      if (GlobalVariable *GVSrc = dyn_cast<GlobalVariable>(MMI->getSource()))

        if (GVSrc->isConstant()) {

          Module *M = CI.getModule();

          Intrinsic::ID MemCpyID =

              isa<AtomicMemMoveInst>(MMI)

                  ? Intrinsic::memcpy_element_unordered_atomic

                  : Intrinsic::memcpy;

          Type *Tys[3] = { CI.getArgOperand(0)->getType(),

                           CI.getArgOperand(1)->getType(),

                           CI.getArgOperand(2)->getType() };

          CI.setCalledFunction(Intrinsic::getDeclaration(M, MemCpyID, Tys));

          Changed = true;

        }

    }


    if (AnyMemTransferInst *MTI = dyn_cast<AnyMemTransferInst>(MI)) {

      // memmove(x,x,size) -> noop.

      if (MTI->getSource() == MTI->getDest())

        return eraseInstFromFunction(CI);

    }


    // If we can determine a pointer alignment that is bigger than currently

    // set, update the alignment.

    if (auto *MTI = dyn_cast<AnyMemTransferInst>(MI)) {

      if (Instruction *I = SimplifyAnyMemTransfer(MTI))

        return I;

    } else if (auto *MSI = dyn_cast<AnyMemSetInst>(MI)) {

      if (Instruction *I = SimplifyAnyMemSet(MSI))

        return I;

    }


    if (Changed) return II;

  }


  // For fixed width vector result intrinsics, use the generic demanded vector

  // support.

  if (auto *IIFVTy = dyn_cast<FixedVectorType>(II->getType())) {

    auto VWidth = IIFVTy->getNumElements();

    APInt PoisonElts(VWidth, 0);

    APInt AllOnesEltMask(APInt::getAllOnes(VWidth));

    if (Value *V = SimplifyDemandedVectorElts(II, AllOnesEltMask, PoisonElts)) {

      if (V != II)

        return replaceInstUsesWith(*II, V);

      return II;

    }

  }


  if (II->isCommutative()) {

    if (auto Pair = matchSymmetricPair(II->getOperand(0), II->getOperand(1))) {

      replaceOperand(*II, 0, Pair->first);

      replaceOperand(*II, 1, Pair->second);

      return II;

    }


    if (CallInst *NewCall = canonicalizeConstantArg0ToArg1(CI))

      return NewCall;

  }


  // Unused constrained FP intrinsic calls may have declared side effect, which

  // prevents it from being removed. In some cases however the side effect is

  // actually absent. To detect this case, call SimplifyConstrainedFPCall. If it

  // returns a replacement, the call may be removed.

  if (CI.use_empty() && isa<ConstrainedFPIntrinsic>(CI)) {

    if (simplifyConstrainedFPCall(&CI, SQ.getWithInstruction(&CI)))

      return eraseInstFromFunction(CI);

  }


  Intrinsic::ID IID = II->getIntrinsicID();

  switch (IID) {

  case Intrinsic::objectsize: {

    SmallVector<Instruction *> InsertedInstructions;

    if (Value *V = lowerObjectSizeCall(II, DL, &TLI, AA, /*MustSucceed=*/false,

                                       &InsertedInstructions)) {

      for (Instruction *Inserted : InsertedInstructions)

        Worklist.add(Inserted);

      return replaceInstUsesWith(CI, V);

    }

    return nullptr;

  }

  case Intrinsic::abs: {

    Value *IIOperand = II->getArgOperand(0);

    bool IntMinIsPoison = cast<Constant>(II->getArgOperand(1))->isOneValue();


    // abs(-x) -> abs(x)

    // TODO: Copy nsw if it was present on the neg?

    Value *X;

    if (match(IIOperand, m_Neg(m_Value(X))))

      return replaceOperand(*II, 0, X);

    if (match(IIOperand, m_Select(m_Value(), m_Value(X), m_Neg(m_Deferred(X)))))

      return replaceOperand(*II, 0, X);

    if (match(IIOperand, m_Select(m_Value(), m_Neg(m_Value(X)), m_Deferred(X))))

      return replaceOperand(*II, 0, X);


    Value *Y;

    // abs(a * abs(b)) -> abs(a * b)

    if (match(IIOperand,

              m_OneUse(m_c_Mul(m_Value(X),

                               m_Intrinsic<Intrinsic::abs>(m_Value(Y)))))) {

      bool NSW =

          cast<Instruction>(IIOperand)->hasNoSignedWrap() && IntMinIsPoison;

      auto *XY = NSW ? Builder.CreateNSWMul(X, Y) : Builder.CreateMul(X, Y);

      return replaceOperand(*II, 0, XY);

    }


    if (std::optional<bool> Known =

            getKnownSignOrZero(IIOperand, SQ.getWithInstruction(II))) {

      // abs(x) -> x if x >= 0 (include abs(x-y) --> x - y where x >= y)

      // abs(x) -> x if x > 0 (include abs(x-y) --> x - y where x > y)

      if (!*Known)

        return replaceInstUsesWith(*II, IIOperand);


      // abs(x) -> -x if x < 0

      // abs(x) -> -x if x <= 0 (include abs(x-y) --> y - x where x <= y)

      if (IntMinIsPoison)

        return BinaryOperator::CreateNSWNeg(IIOperand);

      return BinaryOperator::CreateNeg(IIOperand);

    }


    // abs (sext X) --> zext (abs X*)

    // Clear the IsIntMin (nsw) bit on the abs to allow narrowing.

    if (match(IIOperand, m_OneUse(m_SExt(m_Value(X))))) {

      Value *NarrowAbs =

          Builder.CreateBinaryIntrinsic(Intrinsic::abs, X, Builder.getFalse());

      return CastInst::Create(Instruction::ZExt, NarrowAbs, II->getType());

    }


    // Match a complicated way to check if a number is odd/even:

    // abs (srem X, 2) --> and X, 1

    const APInt *C;

    if (match(IIOperand, m_SRem(m_Value(X), m_APInt(C))) && *C == 2)

      return BinaryOperator::CreateAnd(X, ConstantInt::get(II->getType(), 1));


    break;

  }

  case Intrinsic::umin: {

    Value *I0 = II->getArgOperand(0), *I1 = II->getArgOperand(1);

    // umin(x, 1) == zext(x != 0)

    if (match(I1, m_One())) {

      assert(II->getType()->getScalarSizeInBits() != 1 &&

             "Expected simplify of umin with max constant");

      Value *Zero = Constant::getNullValue(I0->getType());

      Value *Cmp = Builder.CreateICmpNE(I0, Zero);

      return CastInst::Create(Instruction::ZExt, Cmp, II->getType());

    }

    // umin(cttz(x), const) --> cttz(x | (1 << const))

    if (Value *FoldedCttz =

            foldMinimumOverTrailingOrLeadingZeroCount<Intrinsic::cttz>(

                I0, I1, DL, Builder))

      return replaceInstUsesWith(*II, FoldedCttz);

    // umin(ctlz(x), const) --> ctlz(x | (SignedMin >> const))

    if (Value *FoldedCtlz =

            foldMinimumOverTrailingOrLeadingZeroCount<Intrinsic::ctlz>(

                I0, I1, DL, Builder))

      return replaceInstUsesWith(*II, FoldedCtlz);

    [[fallthrough]];

  }

  case Intrinsic::umax: {

    Value *I0 = II->getArgOperand(0), *I1 = II->getArgOperand(1);

    Value *X, *Y;

    if (match(I0, m_ZExt(m_Value(X))) && match(I1, m_ZExt(m_Value(Y))) &&

        (I0->hasOneUse() || I1->hasOneUse()) && X->getType() == Y->getType()) {

      Value *NarrowMaxMin = Builder.CreateBinaryIntrinsic(IID, X, Y);

      return CastInst::Create(Instruction::ZExt, NarrowMaxMin, II->getType());

    }

    Constant *C;

    if (match(I0, m_ZExt(m_Value(X))) && match(I1, m_Constant(C)) &&

        I0->hasOneUse()) {

      if (Constant *NarrowC = getLosslessUnsignedTrunc(C, X->getType())) {

        Value *NarrowMaxMin = Builder.CreateBinaryIntrinsic(IID, X, NarrowC);

        return CastInst::Create(Instruction::ZExt, NarrowMaxMin, II->getType());

      }

    }

    // If both operands of unsigned min/max are sign-extended, it is still ok

    // to narrow the operation.

    [[fallthrough]];

  }

  case Intrinsic::smax:

  case Intrinsic::smin: {

    Value *I0 = II->getArgOperand(0), *I1 = II->getArgOperand(1);

    Value *X, *Y;

    if (match(I0, m_SExt(m_Value(X))) && match(I1, m_SExt(m_Value(Y))) &&

        (I0->hasOneUse() || I1->hasOneUse()) && X->getType() == Y->getType()) {

      Value *NarrowMaxMin = Builder.CreateBinaryIntrinsic(IID, X, Y);

      return CastInst::Create(Instruction::SExt, NarrowMaxMin, II->getType());

    }


    Constant *C;

    if (match(I0, m_SExt(m_Value(X))) && match(I1, m_Constant(C)) &&

        I0->hasOneUse()) {

      if (Constant *NarrowC = getLosslessSignedTrunc(C, X->getType())) {

        Value *NarrowMaxMin = Builder.CreateBinaryIntrinsic(IID, X, NarrowC);

        return CastInst::Create(Instruction::SExt, NarrowMaxMin, II->getType());

      }

    }


    // umin(i1 X, i1 Y) -> and i1 X, Y

    // smax(i1 X, i1 Y) -> and i1 X, Y

    if ((IID == Intrinsic::umin || IID == Intrinsic::smax) &&

        II->getType()->isIntOrIntVectorTy(1)) {

      return BinaryOperator::CreateAnd(I0, I1);

    }


    // umax(i1 X, i1 Y) -> or i1 X, Y

    // smin(i1 X, i1 Y) -> or i1 X, Y

    if ((IID == Intrinsic::umax || IID == Intrinsic::smin) &&

        II->getType()->isIntOrIntVectorTy(1)) {

      return BinaryOperator::CreateOr(I0, I1);

    }


    if (IID == Intrinsic::smax || IID == Intrinsic::smin) {

      // smax (neg nsw X), (neg nsw Y) --> neg nsw (smin X, Y)

      // smin (neg nsw X), (neg nsw Y) --> neg nsw (smax X, Y)

      // TODO: Canonicalize neg after min/max if I1 is constant.

      if (match(I0, m_NSWNeg(m_Value(X))) && match(I1, m_NSWNeg(m_Value(Y))) &&

          (I0->hasOneUse() || I1->hasOneUse())) {

        Intrinsic::ID InvID = getInverseMinMaxIntrinsic(IID);

        Value *InvMaxMin = Builder.CreateBinaryIntrinsic(InvID, X, Y);

        return BinaryOperator::CreateNSWNeg(InvMaxMin);

      }

    }


    // (umax X, (xor X, Pow2))

    //      -> (or X, Pow2)

    // (umin X, (xor X, Pow2))

    //      -> (and X, ~Pow2)

    // (smax X, (xor X, Pos_Pow2))

    //      -> (or X, Pos_Pow2)

    // (smin X, (xor X, Pos_Pow2))

    //      -> (and X, ~Pos_Pow2)

    // (smax X, (xor X, Neg_Pow2))

    //      -> (and X, ~Neg_Pow2)

    // (smin X, (xor X, Neg_Pow2))

    //      -> (or X, Neg_Pow2)

    if ((match(I0, m_c_Xor(m_Specific(I1), m_Value(X))) ||

         match(I1, m_c_Xor(m_Specific(I0), m_Value(X)))) &&

        isKnownToBeAPowerOfTwo(X, /* OrZero */ true)) {

      bool UseOr = IID == Intrinsic::smax || IID == Intrinsic::umax;

      bool UseAndN = IID == Intrinsic::smin || IID == Intrinsic::umin;


      if (IID == Intrinsic::smax || IID == Intrinsic::smin) {

        auto KnownSign = getKnownSign(X, SQ.getWithInstruction(II));

        if (KnownSign == std::nullopt) {

          UseOr = false;

          UseAndN = false;

        } else if (*KnownSign /* true is Signed. */) {

          UseOr ^= true;

          UseAndN ^= true;

          Type *Ty = I0->getType();

          // Negative power of 2 must be IntMin. It's possible to be able to

          // prove negative / power of 2 without actually having known bits, so

          // just get the value by hand.

          X = Constant::getIntegerValue(

              Ty, APInt::getSignedMinValue(Ty->getScalarSizeInBits()));

        }

      }

      if (UseOr)

        return BinaryOperator::CreateOr(I0, X);

      else if (UseAndN)

        return BinaryOperator::CreateAnd(I0, Builder.CreateNot(X));

    }


    // If we can eliminate ~A and Y is free to invert:

    // max ~A, Y --> ~(min A, ~Y)

    //

    // Examples:

    // max ~A, ~Y --> ~(min A, Y)

    // max ~A, C --> ~(min A, ~C)

    // max ~A, (max ~Y, ~Z) --> ~min( A, (min Y, Z))

    auto moveNotAfterMinMax = [&](Value *X, Value *Y) -> Instruction * {

      Value *A;

      if (match(X, m_OneUse(m_Not(m_Value(A)))) &&

          !isFreeToInvert(A, A->hasOneUse())) {

        if (Value *NotY = getFreelyInverted(Y, Y->hasOneUse(), &Builder)) {

          Intrinsic::ID InvID = getInverseMinMaxIntrinsic(IID);

          Value *InvMaxMin = Builder.CreateBinaryIntrinsic(InvID, A, NotY);

          return BinaryOperator::CreateNot(InvMaxMin);

        }

      }

      return nullptr;

    };


    if (Instruction *I = moveNotAfterMinMax(I0, I1))

      return I;

    if (Instruction *I = moveNotAfterMinMax(I1, I0))

      return I;


    if (Instruction *I = moveAddAfterMinMax(II, Builder))

      return I;


    // minmax (X & NegPow2C, Y & NegPow2C) --> minmax(X, Y) & NegPow2C

    const APInt *RHSC;

    if (match(I0, m_OneUse(m_And(m_Value(X), m_NegatedPower2(RHSC)))) &&

        match(I1, m_OneUse(m_And(m_Value(Y), m_SpecificInt(*RHSC)))))

      return BinaryOperator::CreateAnd(Builder.CreateBinaryIntrinsic(IID, X, Y),

                                       ConstantInt::get(II->getType(), *RHSC));


    // smax(X, -X) --> abs(X)

    // smin(X, -X) --> -abs(X)

    // umax(X, -X) --> -abs(X)

    // umin(X, -X) --> abs(X)

    if (isKnownNegation(I0, I1)) {

      // We can choose either operand as the input to abs(), but if we can

      // eliminate the only use of a value, that's better for subsequent

      // transforms/analysis.

      if (I0->hasOneUse() && !I1->hasOneUse())

        std::swap(I0, I1);


      // This is some variant of abs(). See if we can propagate 'nsw' to the abs

      // operation and potentially its negation.

      bool IntMinIsPoison = isKnownNegation(I0, I1, /* NeedNSW */ true);

      Value *Abs = Builder.CreateBinaryIntrinsic(

          Intrinsic::abs, I0,

          ConstantInt::getBool(II->getContext(), IntMinIsPoison));


      // We don't have a "nabs" intrinsic, so negate if needed based on the

      // max/min operation.

      if (IID == Intrinsic::smin || IID == Intrinsic::umax)

        Abs = Builder.CreateNeg(Abs, "nabs", IntMinIsPoison);

      return replaceInstUsesWith(CI, Abs);

    }


    if (Instruction *Sel = foldClampRangeOfTwo(II, Builder))

      return Sel;


    if (Instruction *SAdd = matchSAddSubSat(*II))

      return SAdd;


    if (Value *NewMinMax = reassociateMinMaxWithConstants(II, Builder, SQ))

      return replaceInstUsesWith(*II, NewMinMax);


    if (Instruction *R = reassociateMinMaxWithConstantInOperand(II, Builder))

      return R;


    if (Instruction *NewMinMax = factorizeMinMaxTree(II))

       return NewMinMax;


    // Try to fold minmax with constant RHS based on range information

    if (match(I1, m_APIntAllowPoison(RHSC))) {

      ICmpInst::Predicate Pred =

          ICmpInst::getNonStrictPredicate(MinMaxIntrinsic::getPredicate(IID));

      bool IsSigned = MinMaxIntrinsic::isSigned(IID);

      ConstantRange LHS_CR = computeConstantRangeIncludingKnownBits(

          I0, IsSigned, SQ.getWithInstruction(II));

      if (!LHS_CR.isFullSet()) {

        if (LHS_CR.icmp(Pred, *RHSC))

          return replaceInstUsesWith(*II, I0);

        if (LHS_CR.icmp(ICmpInst::getSwappedPredicate(Pred), *RHSC))

          return replaceInstUsesWith(*II,

                                     ConstantInt::get(II->getType(), *RHSC));

      }

    }


    break;

  }

  case Intrinsic::bitreverse: {

    Value *IIOperand = II->getArgOperand(0);

    // bitrev (zext i1 X to ?) --> X ? SignBitC : 0

    Value *X;

    if (match(IIOperand, m_ZExt(m_Value(X))) &&

        X->getType()->isIntOrIntVectorTy(1)) {

      Type *Ty = II->getType();

      APInt SignBit = APInt::getSignMask(Ty->getScalarSizeInBits());

      return SelectInst::Create(X, ConstantInt::get(Ty, SignBit),

                                ConstantInt::getNullValue(Ty));

    }


    if (Instruction *crossLogicOpFold =

        foldBitOrderCrossLogicOp<Intrinsic::bitreverse>(IIOperand, Builder))

      return crossLogicOpFold;


    break;

  }

  case Intrinsic::bswap: {

    Value *IIOperand = II->getArgOperand(0);


    // Try to canonicalize bswap-of-logical-shift-by-8-bit-multiple as

    // inverse-shift-of-bswap:

    // bswap (shl X, Y) --> lshr (bswap X), Y

    // bswap (lshr X, Y) --> shl (bswap X), Y

    Value *X, *Y;

    if (match(IIOperand, m_OneUse(m_LogicalShift(m_Value(X), m_Value(Y))))) {

      unsigned BitWidth = IIOperand->getType()->getScalarSizeInBits();

      if (MaskedValueIsZero(Y, APInt::getLowBitsSet(BitWidth, 3))) {

        Value *NewSwap = Builder.CreateUnaryIntrinsic(Intrinsic::bswap, X);

        BinaryOperator::BinaryOps InverseShift =

            cast<BinaryOperator>(IIOperand)->getOpcode() == Instruction::Shl

                ? Instruction::LShr

                : Instruction::Shl;

        return BinaryOperator::Create(InverseShift, NewSwap, Y);

      }

    }


    KnownBits Known = computeKnownBits(IIOperand, 0, II);

    uint64_t LZ = alignDown(Known.countMinLeadingZeros(), 8);

    uint64_t TZ = alignDown(Known.countMinTrailingZeros(), 8);

    unsigned BW = Known.getBitWidth();


    // bswap(x) -> shift(x) if x has exactly one "active byte"

    if (BW - LZ - TZ == 8) {

      assert(LZ != TZ && "active byte cannot be in the middle");

      if (LZ > TZ)  // -> shl(x) if the "active byte" is in the low part of x

        return BinaryOperator::CreateNUWShl(

            IIOperand, ConstantInt::get(IIOperand->getType(), LZ - TZ));

      // -> lshr(x) if the "active byte" is in the high part of x

      return BinaryOperator::CreateExactLShr(

            IIOperand, ConstantInt::get(IIOperand->getType(), TZ - LZ));

    }


    // bswap(trunc(bswap(x))) -> trunc(lshr(x, c))

    if (match(IIOperand, m_Trunc(m_BSwap(m_Value(X))))) {

      unsigned C = X->getType()->getScalarSizeInBits() - BW;

      Value *CV = ConstantInt::get(X->getType(), C);

      Value *V = Builder.CreateLShr(X, CV);

      return new TruncInst(V, IIOperand->getType());

    }


    if (Instruction *crossLogicOpFold =

            foldBitOrderCrossLogicOp<Intrinsic::bswap>(IIOperand, Builder)) {

      return crossLogicOpFold;

    }


    // Try to fold into bitreverse if bswap is the root of the expression tree.

    if (Instruction *BitOp = matchBSwapOrBitReverse(*II, /*MatchBSwaps*/ false,

                                                    /*MatchBitReversals*/ true))

      return BitOp;

    break;

  }

  case Intrinsic::masked_load:

    if (Value *SimplifiedMaskedOp = simplifyMaskedLoad(*II))

      return replaceInstUsesWith(CI, SimplifiedMaskedOp);

    break;

  case Intrinsic::masked_store:

    return simplifyMaskedStore(*II);

  case Intrinsic::masked_gather:

    return simplifyMaskedGather(*II);

  case Intrinsic::masked_scatter:

    return simplifyMaskedScatter(*II);

  case Intrinsic::launder_invariant_group:

  case Intrinsic::strip_invariant_group:

    if (auto *SkippedBarrier = simplifyInvariantGroupIntrinsic(*II, *this))

      return replaceInstUsesWith(*II, SkippedBarrier);

    break;

  case Intrinsic::powi:

    if (ConstantInt *Power = dyn_cast<ConstantInt>(II->getArgOperand(1))) {

      // 0 and 1 are handled in instsimplify

      // powi(x, -1) -> 1/x

      if (Power->isMinusOne())

        return BinaryOperator::CreateFDivFMF(ConstantFP::get(CI.getType(), 1.0),

                                             II->getArgOperand(0), II);

      // powi(x, 2) -> x*x

      if (Power->equalsInt(2))

        return BinaryOperator::CreateFMulFMF(II->getArgOperand(0),

                                             II->getArgOperand(0), II);


      if (!Power->getValue()[0]) {

        Value *X;

        // If power is even:

        // powi(-x, p) -> powi(x, p)

        // powi(fabs(x), p) -> powi(x, p)

        // powi(copysign(x, y), p) -> powi(x, p)

        if (match(II->getArgOperand(0), m_FNeg(m_Value(X))) ||

            match(II->getArgOperand(0), m_FAbs(m_Value(X))) ||

            match(II->getArgOperand(0),

                  m_Intrinsic<Intrinsic::copysign>(m_Value(X), m_Value())))

          return replaceOperand(*II, 0, X);

      }

    }

    break;


  case Intrinsic::cttz:

  case Intrinsic::ctlz:

    if (auto *I = foldCttzCtlz(*II, *this))

      return I;

    break;


  case Intrinsic::ctpop:

    if (auto *I = foldCtpop(*II, *this))

      return I;

    break;


  case Intrinsic::fshl:

  case Intrinsic::fshr: {

    Value *Op0 = II->getArgOperand(0), *Op1 = II->getArgOperand(1);

    Type *Ty = II->getType();

    unsigned BitWidth = Ty->getScalarSizeInBits();

    Constant *ShAmtC;

    if (match(II->getArgOperand(2), m_ImmConstant(ShAmtC))) {

      // Canonicalize a shift amount constant operand to modulo the bit-width.

      Constant *WidthC = ConstantInt::get(Ty, BitWidth);

      Constant *ModuloC =

          ConstantFoldBinaryOpOperands(Instruction::URem, ShAmtC, WidthC, DL);

      if (!ModuloC)

        return nullptr;

      if (ModuloC != ShAmtC)

        return replaceOperand(*II, 2, ModuloC);


      assert(match(ConstantFoldCompareInstOperands(ICmpInst::ICMP_UGT, WidthC,

                                                   ShAmtC, DL),

                   m_One()) &&

             "Shift amount expected to be modulo bitwidth");


      // Canonicalize funnel shift right by constant to funnel shift left. This

      // is not entirely arbitrary. For historical reasons, the backend may

      // recognize rotate left patterns but miss rotate right patterns.

      if (IID == Intrinsic::fshr) {

        // fshr X, Y, C --> fshl X, Y, (BitWidth - C) if C is not zero.

        if (!isKnownNonZero(ShAmtC, SQ.getWithInstruction(II)))

          return nullptr;


        Constant *LeftShiftC = ConstantExpr::getSub(WidthC, ShAmtC);

        Module *Mod = II->getModule();

        Function *Fshl = Intrinsic::getDeclaration(Mod, Intrinsic::fshl, Ty);

        return CallInst::Create(Fshl, { Op0, Op1, LeftShiftC });

      }

      assert(IID == Intrinsic::fshl &&

             "All funnel shifts by simple constants should go left");


      // fshl(X, 0, C) --> shl X, C

      // fshl(X, undef, C) --> shl X, C

      if (match(Op1, m_ZeroInt()) || match(Op1, m_Undef()))

        return BinaryOperator::CreateShl(Op0, ShAmtC);


      // fshl(0, X, C) --> lshr X, (BW-C)

      // fshl(undef, X, C) --> lshr X, (BW-C)

      if (match(Op0, m_ZeroInt()) || match(Op0, m_Undef()))

        return BinaryOperator::CreateLShr(Op1,

                                          ConstantExpr::getSub(WidthC, ShAmtC));


      // fshl i16 X, X, 8 --> bswap i16 X (reduce to more-specific form)

      if (Op0 == Op1 && BitWidth == 16 && match(ShAmtC, m_SpecificInt(8))) {

        Module *Mod = II->getModule();

        Function *Bswap = Intrinsic::getDeclaration(Mod, Intrinsic::bswap, Ty);

        return CallInst::Create(Bswap, { Op0 });

      }

      if (Instruction *BitOp =

              matchBSwapOrBitReverse(*II, /*MatchBSwaps*/ true,

                                     /*MatchBitReversals*/ true))

        return BitOp;

    }


    // Left or right might be masked.

    if (SimplifyDemandedInstructionBits(*II))

      return &CI;


    // The shift amount (operand 2) of a funnel shift is modulo the bitwidth,

    // so only the low bits of the shift amount are demanded if the bitwidth is

    // a power-of-2.

    if (!isPowerOf2_32(BitWidth))

      break;

    APInt Op2Demanded = APInt::getLowBitsSet(BitWidth, Log2_32_Ceil(BitWidth));

    KnownBits Op2Known(BitWidth);

    if (SimplifyDemandedBits(II, 2, Op2Demanded, Op2Known))

      return &CI;

    break;

  }

  case Intrinsic::ptrmask: {

    unsigned BitWidth = DL.getPointerTypeSizeInBits(II->getType());

    KnownBits Known(BitWidth);

    if (SimplifyDemandedInstructionBits(*II, Known))

      return II;


    Value *InnerPtr, *InnerMask;

    bool Changed = false;

    // Combine:

    // (ptrmask (ptrmask p, A), B)

    //    -> (ptrmask p, (and A, B))

    if (match(II->getArgOperand(0),

              m_OneUse(m_Intrinsic<Intrinsic::ptrmask>(m_Value(InnerPtr),

                                                       m_Value(InnerMask))))) {

      assert(II->getArgOperand(1)->getType() == InnerMask->getType() &&

             "Mask types must match");

      // TODO: If InnerMask == Op1, we could copy attributes from inner

      // callsite -> outer callsite.

      Value *NewMask = Builder.CreateAnd(II->getArgOperand(1), InnerMask);

      replaceOperand(CI, 0, InnerPtr);

      replaceOperand(CI, 1, NewMask);

      Changed = true;

    }


    // See if we can deduce non-null.

    if (!CI.hasRetAttr(Attribute::NonNull) &&

        (Known.isNonZero() ||

         isKnownNonZero(II, getSimplifyQuery().getWithInstruction(II)))) {

      CI.addRetAttr(Attribute::NonNull);

      Changed = true;

    }


    unsigned NewAlignmentLog =

        std::min(Value::MaxAlignmentExponent,

                 std::min(BitWidth - 1, Known.countMinTrailingZeros()));

    // Known bits will capture if we had alignment information associated with

    // the pointer argument.

    if (NewAlignmentLog > Log2(CI.getRetAlign().valueOrOne())) {

      CI.addRetAttr(Attribute::getWithAlignment(

          CI.getContext(), Align(uint64_t(1) << NewAlignmentLog)));

      Changed = true;

    }

    if (Changed)

      return &CI;

    break;

  }

  case Intrinsic::uadd_with_overflow:

  case Intrinsic::sadd_with_overflow: {

    if (Instruction *I = foldIntrinsicWithOverflowCommon(II))

      return I;


    // Given 2 constant operands whose sum does not overflow:

    // uaddo (X +nuw C0), C1 -> uaddo X, C0 + C1

    // saddo (X +nsw C0), C1 -> saddo X, C0 + C1

    Value *X;

    const APInt *C0, *C1;

    Value *Arg0 = II->getArgOperand(0);

    Value *Arg1 = II->getArgOperand(1);

    bool IsSigned = IID == Intrinsic::sadd_with_overflow;

    bool HasNWAdd = IsSigned

                        ? match(Arg0, m_NSWAddLike(m_Value(X), m_APInt(C0)))

                        : match(Arg0, m_NUWAddLike(m_Value(X), m_APInt(C0)));

    if (HasNWAdd && match(Arg1, m_APInt(C1))) {

      bool Overflow;

      APInt NewC =

          IsSigned ? C1->sadd_ov(*C0, Overflow) : C1->uadd_ov(*C0, Overflow);

      if (!Overflow)

        return replaceInstUsesWith(

            *II, Builder.CreateBinaryIntrinsic(

                     IID, X, ConstantInt::get(Arg1->getType(), NewC)));

    }

    break;

  }


  case Intrinsic::umul_with_overflow:

  case Intrinsic::smul_with_overflow:

  case Intrinsic::usub_with_overflow:

    if (Instruction *I = foldIntrinsicWithOverflowCommon(II))

      return I;

    break;


  case Intrinsic::ssub_with_overflow: {

    if (Instruction *I = foldIntrinsicWithOverflowCommon(II))

      return I;


    Constant *C;

    Value *Arg0 = II->getArgOperand(0);

    Value *Arg1 = II->getArgOperand(1);

    // Given a constant C that is not the minimum signed value

    // for an integer of a given bit width:

    //

    // ssubo X, C -> saddo X, -C

    if (match(Arg1, m_Constant(C)) && C->isNotMinSignedValue()) {

      Value *NegVal = ConstantExpr::getNeg(C);

      // Build a saddo call that is equivalent to the discovered

      // ssubo call.

      return replaceInstUsesWith(

          *II, Builder.CreateBinaryIntrinsic(Intrinsic::sadd_with_overflow,

                                             Arg0, NegVal));

    }


    break;

  }


  case Intrinsic::uadd_sat:

  case Intrinsic::sadd_sat:

  case Intrinsic::usub_sat:

  case Intrinsic::ssub_sat: {

    SaturatingInst *SI = cast<SaturatingInst>(II);

    Type *Ty = SI->getType();

    Value *Arg0 = SI->getLHS();

    Value *Arg1 = SI->getRHS();


    // Make use of known overflow information.

    OverflowResult OR = computeOverflow(SI->getBinaryOp(), SI->isSigned(),

                                        Arg0, Arg1, SI);

    switch (OR) {

      case OverflowResult::MayOverflow:

        break;

      case OverflowResult::NeverOverflows:

        if (SI->isSigned())

          return BinaryOperator::CreateNSW(SI->getBinaryOp(), Arg0, Arg1);

        else

          return BinaryOperator::CreateNUW(SI->getBinaryOp(), Arg0, Arg1);

      case OverflowResult::AlwaysOverflowsLow: {

        unsigned BitWidth = Ty->getScalarSizeInBits();

        APInt Min = APSInt::getMinValue(BitWidth, !SI->isSigned());

        return replaceInstUsesWith(*SI, ConstantInt::get(Ty, Min));

      }

      case OverflowResult::AlwaysOverflowsHigh: {

        unsigned BitWidth = Ty->getScalarSizeInBits();

        APInt Max = APSInt::getMaxValue(BitWidth, !SI->isSigned());

        return replaceInstUsesWith(*SI, ConstantInt::get(Ty, Max));

      }

    }


    // usub_sat((sub nuw C, A), C1) -> usub_sat(usub_sat(C, C1), A)

    // which after that:

    // usub_sat((sub nuw C, A), C1) -> usub_sat(C - C1, A) if C1 u< C

    // usub_sat((sub nuw C, A), C1) -> 0 otherwise

    Constant *C, *C1;

    Value *A;

    if (IID == Intrinsic::usub_sat &&

        match(Arg0, m_NUWSub(m_ImmConstant(C), m_Value(A))) &&

        match(Arg1, m_ImmConstant(C1))) {

      auto *NewC = Builder.CreateBinaryIntrinsic(Intrinsic::usub_sat, C, C1);

      auto *NewSub =

          Builder.CreateBinaryIntrinsic(Intrinsic::usub_sat, NewC, A);

      return replaceInstUsesWith(*SI, NewSub);

    }


    // ssub.sat(X, C) -> sadd.sat(X, -C) if C != MIN

    if (IID == Intrinsic::ssub_sat && match(Arg1, m_Constant(C)) &&

        C->isNotMinSignedValue()) {

      Value *NegVal = ConstantExpr::getNeg(C);

      return replaceInstUsesWith(

          *II, Builder.CreateBinaryIntrinsic(

              Intrinsic::sadd_sat, Arg0, NegVal));

    }


    // sat(sat(X + Val2) + Val) -> sat(X + (Val+Val2))

    // sat(sat(X - Val2) - Val) -> sat(X - (Val+Val2))

    // if Val and Val2 have the same sign

    if (auto *Other = dyn_cast<IntrinsicInst>(Arg0)) {

      Value *X;

      const APInt *Val, *Val2;

      APInt NewVal;

      bool IsUnsigned =

          IID == Intrinsic::uadd_sat || IID == Intrinsic::usub_sat;

      if (Other->getIntrinsicID() == IID &&

          match(Arg1, m_APInt(Val)) &&

          match(Other->getArgOperand(0), m_Value(X)) &&

          match(Other->getArgOperand(1), m_APInt(Val2))) {

        if (IsUnsigned)

          NewVal = Val->uadd_sat(*Val2);

        else if (Val->isNonNegative() == Val2->isNonNegative()) {

          bool Overflow;

          NewVal = Val->sadd_ov(*Val2, Overflow);

          if (Overflow) {

            // Both adds together may add more than SignedMaxValue

            // without saturating the final result.

            break;

          }

        } else {

          // Cannot fold saturated addition with different signs.

          break;

        }


        return replaceInstUsesWith(

            *II, Builder.CreateBinaryIntrinsic(

                     IID, X, ConstantInt::get(II->getType(), NewVal)));

      }

    }

    break;

  }


  case Intrinsic::minnum:

  case Intrinsic::maxnum:

  case Intrinsic::minimum:

  case Intrinsic::maximum: {

    Value *Arg0 = II->getArgOperand(0);

    Value *Arg1 = II->getArgOperand(1);

    Value *X, *Y;

    if (match(Arg0, m_FNeg(m_Value(X))) && match(Arg1, m_FNeg(m_Value(Y))) &&

        (Arg0->hasOneUse() || Arg1->hasOneUse())) {

      // If both operands are negated, invert the call and negate the result:

      // min(-X, -Y) --> -(max(X, Y))

      // max(-X, -Y) --> -(min(X, Y))

      Intrinsic::ID NewIID;

      switch (IID) {

      case Intrinsic::maxnum:

        NewIID = Intrinsic::minnum;

        break;

      case Intrinsic::minnum:

        NewIID = Intrinsic::maxnum;

        break;

      case Intrinsic::maximum:

        NewIID = Intrinsic::minimum;

        break;

      case Intrinsic::minimum:

        NewIID = Intrinsic::maximum;

        break;

      default:

        llvm_unreachable("unexpected intrinsic ID");

      }

      Value *NewCall = Builder.CreateBinaryIntrinsic(NewIID, X, Y, II);

      Instruction *FNeg = UnaryOperator::CreateFNeg(NewCall);

      FNeg->copyIRFlags(II);

      return FNeg;

    }


    // m(m(X, C2), C1) -> m(X, C)

    const APFloat *C1, *C2;

    if (auto *M = dyn_cast<IntrinsicInst>(Arg0)) {

      if (M->getIntrinsicID() == IID && match(Arg1, m_APFloat(C1)) &&

          ((match(M->getArgOperand(0), m_Value(X)) &&

            match(M->getArgOperand(1), m_APFloat(C2))) ||

           (match(M->getArgOperand(1), m_Value(X)) &&

            match(M->getArgOperand(0), m_APFloat(C2))))) {

        APFloat Res(0.0);

        switch (IID) {

        case Intrinsic::maxnum:

          Res = maxnum(*C1, *C2);

          break;

        case Intrinsic::minnum:

          Res = minnum(*C1, *C2);

          break;

        case Intrinsic::maximum:

          Res = maximum(*C1, *C2);

          break;

        case Intrinsic::minimum:

          Res = minimum(*C1, *C2);

          break;

        default:

          llvm_unreachable("unexpected intrinsic ID");

        }

        Value *V = Builder.CreateBinaryIntrinsic(

            IID, X, ConstantFP::get(Arg0->getType(), Res), II);

        // TODO: Conservatively intersecting FMF. If Res == C2, the transform

        //       was a simplification (so Arg0 and its original flags could

        //       propagate?)

        if (auto *CI = dyn_cast<CallInst>(V))

          CI->andIRFlags(M);

        return replaceInstUsesWith(*II, V);

      }

    }


    // m((fpext X), (fpext Y)) -> fpext (m(X, Y))

    if (match(Arg0, m_OneUse(m_FPExt(m_Value(X)))) &&

        match(Arg1, m_OneUse(m_FPExt(m_Value(Y)))) &&

        X->getType() == Y->getType()) {

      Value *NewCall =

          Builder.CreateBinaryIntrinsic(IID, X, Y, II, II->getName());

      return new FPExtInst(NewCall, II->getType());

    }


    // max X, -X --> fabs X

    // min X, -X --> -(fabs X)

    // TODO: Remove one-use limitation? That is obviously better for max,

    // hence why we don't check for one-use for that. However,

    // it would be an extra instruction for min (fnabs), but

    // that is still likely better for analysis and codegen.

    // Returns true when Op0 is `fneg X` and Op1 is that same X; X is bound as
    // a side effect of matching the fneg. For minimum/minnum the fneg must
    // also have a single use, while the other intrinsics accept any use count.
    auto IsMinMaxOrXNegX = [IID, &X](Value *Op0, Value *Op1) {
      const bool IsNegatedPair =
          match(Op0, m_FNeg(m_Value(X))) && match(Op1, m_Specific(X));
      if (!IsNegatedPair)
        return false;

      const bool IsMinFlavor =
          IID == Intrinsic::minimum || IID == Intrinsic::minnum;
      return !IsMinFlavor || Op0->hasOneUse();
    };


    if (IsMinMaxOrXNegX(Arg0, Arg1) || IsMinMaxOrXNegX(Arg1, Arg0)) {

      Value *R = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, X, II);

      if (IID == Intrinsic::minimum || IID == Intrinsic::minnum)

        R = Builder.CreateFNegFMF(R, II);

      return replaceInstUsesWith(*II, R);

    }


    break;

  }

  case Intrinsic::matrix_multiply: {

    // Optimize negation in matrix multiplication.


    // -A * -B -> A * B

    Value *A, *B;

    if (match(II->getArgOperand(0), m_FNeg(m_Value(A))) &&

        match(II->getArgOperand(1), m_FNeg(m_Value(B)))) {

      replaceOperand(*II, 0, A);

      replaceOperand(*II, 1, B);

      return II;

    }


    Value *Op0 = II->getOperand(0);

    Value *Op1 = II->getOperand(1);

    Value *OpNotNeg, *NegatedOp;

    unsigned NegatedOpArg, OtherOpArg;

    if (match(Op0, m_FNeg(m_Value(OpNotNeg)))) {

      NegatedOp = Op0;

      NegatedOpArg = 0;

      OtherOpArg = 1;

    } else if (match(Op1, m_FNeg(m_Value(OpNotNeg)))) {

      NegatedOp = Op1;

      NegatedOpArg = 1;

      OtherOpArg = 0;

    } else

      // Multiplication doesn't have a negated operand.

      break;


    // Only optimize if the negated operand has only one use.

    if (!NegatedOp->hasOneUse())

      break;


    Value *OtherOp = II->getOperand(OtherOpArg);

    VectorType *RetTy = cast<VectorType>(II->getType());

    VectorType *NegatedOpTy = cast<VectorType>(NegatedOp->getType());

    VectorType *OtherOpTy = cast<VectorType>(OtherOp->getType());

    ElementCount NegatedCount = NegatedOpTy->getElementCount();

    ElementCount OtherCount = OtherOpTy->getElementCount();

    ElementCount RetCount = RetTy->getElementCount();

    // (-A) * B -> A * (-B), if it is cheaper to negate B and vice versa.

    if (ElementCount::isKnownGT(NegatedCount, OtherCount) &&

        ElementCount::isKnownLT(OtherCount, RetCount)) {

      Value *InverseOtherOp = Builder.CreateFNeg(OtherOp);

      replaceOperand(*II, NegatedOpArg, OpNotNeg);

      replaceOperand(*II, OtherOpArg, InverseOtherOp);

      return II;

    }

    // (-A) * B -> -(A * B), if it is cheaper to negate the result

    if (ElementCount::isKnownGT(NegatedCount, RetCount)) {

      SmallVector<Value *, 5> NewArgs(II->args());

      NewArgs[NegatedOpArg] = OpNotNeg;

      Instruction *NewMul =

          Builder.CreateIntrinsic(II->getType(), IID, NewArgs, II);

      return replaceInstUsesWith(*II, Builder.CreateFNegFMF(NewMul, II));

    }

    break;

  }

  case Intrinsic::fmuladd: {

    // Try to simplify the underlying FMul.

    if (Value *V = simplifyFMulInst(II->getArgOperand(0), II->getArgOperand(1),

                                    II->getFastMathFlags(),

                                    SQ.getWithInstruction(II))) {

      auto *FAdd = BinaryOperator::CreateFAdd(V, II->getArgOperand(2));

      FAdd->copyFastMathFlags(II);

      return FAdd;

    }


    [[fallthrough]];

  }

  case Intrinsic::fma: {

    // fma fneg(x), fneg(y), z -> fma x, y, z

    Value *Src0 = II->getArgOperand(0);

    Value *Src1 = II->getArgOperand(1);

    Value *Src2 = II->getArgOperand(2);

    Value *X, *Y;

    if (match(Src0, m_FNeg(m_Value(X))) && match(Src1, m_FNeg(m_Value(Y)))) {

      replaceOperand(*II, 0, X);

      replaceOperand(*II, 1, Y);

      return II;

    }


    // fma fabs(x), fabs(x), z -> fma x, x, z

    if (match(Src0, m_FAbs(m_Value(X))) &&

        match(Src1, m_FAbs(m_Specific(X)))) {

      replaceOperand(*II, 0, X);

      replaceOperand(*II, 1, X);

      return II;

    }


    // Try to simplify the underlying FMul. We can only apply simplifications

    // that do not require rounding.

    if (Value *V = simplifyFMAFMul(Src0, Src1, II->getFastMathFlags(),

                                   SQ.getWithInstruction(II))) {

      auto *FAdd = BinaryOperator::CreateFAdd(V, Src2);

      FAdd->copyFastMathFlags(II);

      return FAdd;

    }


    // fma x, y, 0 -> fmul x, y

    // This is always valid for -0.0, but requires nsz for +0.0 as

    // -0.0 + 0.0 = 0.0, which would not be the same as the fmul on its own.

    if (match(Src2, m_NegZeroFP()) ||

        (match(Src2, m_PosZeroFP()) && II->getFastMathFlags().noSignedZeros()))

      return BinaryOperator::CreateFMulFMF(Src0, Src1, II);


    // fma x, -1.0, y -> fsub y, x

    if (match(Src1, m_SpecificFP(-1.0)))

      return BinaryOperator::CreateFSubFMF(Src2, Src0, II);


    break;

  }

  case Intrinsic::copysign: {

    Value *Mag = II->getArgOperand(0), *Sign = II->getArgOperand(1);

    if (std::optional<bool> KnownSignBit = computeKnownFPSignBit(

            Sign, /*Depth=*/0, getSimplifyQuery().getWithInstruction(II))) {

      if (*KnownSignBit) {

        // If we know that the sign argument is negative, reduce to FNABS:

        // copysign Mag, -Sign --> fneg (fabs Mag)

        Value *Fabs = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, Mag, II);

        return replaceInstUsesWith(*II, Builder.CreateFNegFMF(Fabs, II));

      }


      // If we know that the sign argument is positive, reduce to FABS:

      // copysign Mag, +Sign --> fabs Mag

      Value *Fabs = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, Mag, II);

      return replaceInstUsesWith(*II, Fabs);

    }


    // Propagate sign argument through nested calls:

    // copysign Mag, (copysign ?, X) --> copysign Mag, X

    Value *X;

    if (match(Sign, m_Intrinsic<Intrinsic::copysign>(m_Value(), m_Value(X))))

      return replaceOperand(*II, 1, X);


    // Clear sign-bit of constant magnitude:

    // copysign -MagC, X --> copysign MagC, X

    // TODO: Support constant folding for fabs

    const APFloat *MagC;

    if (match(Mag, m_APFloat(MagC)) && MagC->isNegative()) {

      APFloat PosMagC = *MagC;

      PosMagC.clearSign();

      return replaceOperand(*II, 0, ConstantFP::get(Mag->getType(), PosMagC));

    }


    // Peek through changes of magnitude's sign-bit. This call rewrites those:

    // copysign (fabs X), Sign --> copysign X, Sign

    // copysign (fneg X), Sign --> copysign X, Sign

    if (match(Mag, m_FAbs(m_Value(X))) || match(Mag, m_FNeg(m_Value(X))))

      return replaceOperand(*II, 0, X);


    break;

  }

  case Intrinsic::fabs: {

    Value *Cond, *TVal, *FVal;

    Value *Arg = II->getArgOperand(0);

    Value *X;

    // fabs (-X) --> fabs (X)

    if (match(Arg, m_FNeg(m_Value(X)))) {

        CallInst *Fabs = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, X, II);

        return replaceInstUsesWith(CI, Fabs);

    }


    if (match(Arg, m_Select(m_Value(Cond), m_Value(TVal), m_Value(FVal)))) {

      // fabs (select Cond, TrueC, FalseC) --> select Cond, AbsT, AbsF

      if (isa<Constant>(TVal) || isa<Constant>(FVal)) {

        CallInst *AbsT = Builder.CreateCall(II->getCalledFunction(), {TVal});

        CallInst *AbsF = Builder.CreateCall(II->getCalledFunction(), {FVal});

        SelectInst *SI = SelectInst::Create(Cond, AbsT, AbsF);

        FastMathFlags FMF1 = II->getFastMathFlags();

        FastMathFlags FMF2 = cast<SelectInst>(Arg)->getFastMathFlags();

        FMF2.setNoSignedZeros(false);

        SI->setFastMathFlags(FMF1 | FMF2);

        return SI;

      }

      // fabs (select Cond, -FVal, FVal) --> fabs FVal

      if (match(TVal, m_FNeg(m_Specific(FVal))))

        return replaceOperand(*II, 0, FVal);

      // fabs (select Cond, TVal, -TVal) --> fabs TVal

      if (match(FVal, m_FNeg(m_Specific(TVal))))

        return replaceOperand(*II, 0, TVal);

    }


    Value *Magnitude, *Sign;

    if (match(II->getArgOperand(0),

              m_CopySign(m_Value(Magnitude), m_Value(Sign)))) {

      // fabs (copysign x, y) -> (fabs x)

      CallInst *AbsSign =

          Builder.CreateCall(II->getCalledFunction(), {Magnitude});

      AbsSign->copyFastMathFlags(II);

      return replaceInstUsesWith(*II, AbsSign);

    }


    [[fallthrough]];

  }

  case Intrinsic::ceil:

  case Intrinsic::floor:

  case Intrinsic::round:

  case Intrinsic::roundeven:

  case Intrinsic::nearbyint:

  case Intrinsic::rint:

  case Intrinsic::trunc: {

    Value *ExtSrc;

    if (match(II->getArgOperand(0), m_OneUse(m_FPExt(m_Value(ExtSrc))))) {

      // Narrow the call: intrinsic (fpext x) -> fpext (intrinsic x)

      Value *NarrowII = Builder.CreateUnaryIntrinsic(IID, ExtSrc, II);

      return new FPExtInst(NarrowII, II->getType());

    }

    break;

  }

  case Intrinsic::cos:

  case Intrinsic::amdgcn_cos: {

    Value *X, *Sign;

    Value *Src = II->getArgOperand(0);

    if (match(Src, m_FNeg(m_Value(X))) || match(Src, m_FAbs(m_Value(X))) ||

        match(Src, m_CopySign(m_Value(X), m_Value(Sign)))) {

      // cos(-x) --> cos(x)

      // cos(fabs(x)) --> cos(x)

      // cos(copysign(x, y)) --> cos(x)

      return replaceOperand(*II, 0, X);

    }

    break;

  }

  case Intrinsic::sin:

  case Intrinsic::amdgcn_sin: {

    Value *X;

    if (match(II->getArgOperand(0), m_OneUse(m_FNeg(m_Value(X))))) {

      // sin(-x) --> -sin(x)

      Value *NewSin = Builder.CreateUnaryIntrinsic(IID, X, II);

      return UnaryOperator::CreateFNegFMF(NewSin, II);

    }

    break;

  }

  case Intrinsic::ldexp: {

    // ldexp(ldexp(x, a), b) -> ldexp(x, a + b)

    //

    // The danger is if the first ldexp would overflow to infinity or underflow

    // to zero, but the combined exponent avoids it. We ignore this with

    // reassoc.

    //

    // It's also safe to fold if we know both exponents are >= 0 or <= 0 since

    // it would just double down on the overflow/underflow which would occur

    // anyway.

    //

    // TODO: Could do better if we had range tracking for the input value

    // exponent. Also could broaden sign check to cover == 0 case.

    Value *Src = II->getArgOperand(0);

    Value *Exp = II->getArgOperand(1);

    Value *InnerSrc;

    Value *InnerExp;

    if (match(Src, m_OneUse(m_Intrinsic<Intrinsic::ldexp>(

                       m_Value(InnerSrc), m_Value(InnerExp)))) &&

        Exp->getType() == InnerExp->getType()) {

      FastMathFlags FMF = II->getFastMathFlags();

      FastMathFlags InnerFlags = cast<FPMathOperator>(Src)->getFastMathFlags();


      if ((FMF.allowReassoc() && InnerFlags.allowReassoc()) ||

          signBitMustBeTheSame(Exp, InnerExp, SQ.getWithInstruction(II))) {

        // TODO: Add nsw/nuw probably safe if integer type exceeds exponent

        // width.

        Value *NewExp = Builder.CreateAdd(InnerExp, Exp);

        II->setArgOperand(1, NewExp);

        II->setFastMathFlags(InnerFlags); // Or the inner flags.

        return replaceOperand(*II, 0, InnerSrc);

      }

    }


    // ldexp(x, zext(i1 y)) -> fmul x, (select y, 2.0, 1.0)

    // ldexp(x, sext(i1 y)) -> fmul x, (select y, 0.5, 1.0)

    Value *ExtSrc;

    if (match(Exp, m_ZExt(m_Value(ExtSrc))) &&

        ExtSrc->getType()->getScalarSizeInBits() == 1) {

      Value *Select =

          Builder.CreateSelect(ExtSrc, ConstantFP::get(II->getType(), 2.0),

                               ConstantFP::get(II->getType(), 1.0));

      return BinaryOperator::CreateFMulFMF(Src, Select, II);

    }

    if (match(Exp, m_SExt(m_Value(ExtSrc))) &&

        ExtSrc->getType()->getScalarSizeInBits() == 1) {

      Value *Select =

          Builder.CreateSelect(ExtSrc, ConstantFP::get(II->getType(), 0.5),

                               ConstantFP::get(II->getType(), 1.0));

      return BinaryOperator::CreateFMulFMF(Src, Select, II);

    }


    // ldexp(x, c ? exp : 0) -> c ? ldexp(x, exp) : x

    // ldexp(x, c ? 0 : exp) -> c ? x : ldexp(x, exp)

    //

    // TODO: If we cared, should insert a canonicalize for x

    Value *SelectCond, *SelectLHS, *SelectRHS;

    if (match(II->getArgOperand(1),

              m_OneUse(m_Select(m_Value(SelectCond), m_Value(SelectLHS),

                                m_Value(SelectRHS))))) {

      Value *NewLdexp = nullptr;

      Value *Select = nullptr;

      if (match(SelectRHS, m_ZeroInt())) {

        NewLdexp = Builder.CreateLdexp(Src, SelectLHS);

        Select = Builder.CreateSelect(SelectCond, NewLdexp, Src);

      } else if (match(SelectLHS, m_ZeroInt())) {

        NewLdexp = Builder.CreateLdexp(Src, SelectRHS);

        Select = Builder.CreateSelect(SelectCond, Src, NewLdexp);

      }


      if (NewLdexp) {

        Select->takeName(II);

        cast<Instruction>(NewLdexp)->copyFastMathFlags(II);

        return replaceInstUsesWith(*II, Select);

      }

    }


    break;

  }

  case Intrinsic::ptrauth_auth:

  case Intrinsic::ptrauth_resign: {

    // (sign|resign) + (auth|resign) can be folded by omitting the middle

    // sign+auth component if the key and discriminator match.

    bool NeedSign = II->getIntrinsicID() == Intrinsic::ptrauth_resign;

    Value *Ptr = II->getArgOperand(0);

    Value *Key = II->getArgOperand(1);

    Value *Disc = II->getArgOperand(2);


    // AuthKey will be the key we need to end up authenticating against in

    // whatever we replace this sequence with.

    Value *AuthKey = nullptr, *AuthDisc = nullptr, *BasePtr;

    if (const auto *CI = dyn_cast<CallBase>(Ptr)) {

      BasePtr = CI->getArgOperand(0);

      if (CI->getIntrinsicID() == Intrinsic::ptrauth_sign) {

        if (CI->getArgOperand(1) != Key || CI->getArgOperand(2) != Disc)

          break;

      } else if (CI->getIntrinsicID() == Intrinsic::ptrauth_resign) {

        if (CI->getArgOperand(3) != Key || CI->getArgOperand(4) != Disc)

          break;

        AuthKey = CI->getArgOperand(1);

        AuthDisc = CI->getArgOperand(2);

      } else

        break;

    } else if (const auto *PtrToInt = dyn_cast<PtrToIntOperator>(Ptr)) {

      // ptrauth constants are equivalent to a call to @llvm.ptrauth.sign for

      // our purposes, so check for that too.

      const auto *CPA = dyn_cast<ConstantPtrAuth>(PtrToInt->getOperand(0));

      if (!CPA || !CPA->isKnownCompatibleWith(Key, Disc, DL))

        break;


      // resign(ptrauth(p,ks,ds),ks,ds,kr,dr) -> ptrauth(p,kr,dr)

      if (NeedSign && isa<ConstantInt>(II->getArgOperand(4))) {

        auto *SignKey = cast<ConstantInt>(II->getArgOperand(3));

        auto *SignDisc = cast<ConstantInt>(II->getArgOperand(4));

        auto *SignAddrDisc = ConstantPointerNull::get(Builder.getPtrTy());

        auto *NewCPA = ConstantPtrAuth::get(CPA->getPointer(), SignKey,

                                            SignDisc, SignAddrDisc);

        replaceInstUsesWith(

            *II, ConstantExpr::getPointerCast(NewCPA, II->getType()));

        return eraseInstFromFunction(*II);

      }


      // auth(ptrauth(p,k,d),k,d) -> p

      BasePtr = Builder.CreatePtrToInt(CPA->getPointer(), II->getType());

    } else

      break;


    unsigned NewIntrin;

    if (AuthKey && NeedSign) {

      // resign(0,1) + resign(1,2) = resign(0, 2)

      NewIntrin = Intrinsic::ptrauth_resign;

    } else if (AuthKey) {

      // resign(0,1) + auth(1) = auth(0)

      NewIntrin = Intrinsic::ptrauth_auth;

    } else if (NeedSign) {

      // sign(0) + resign(0, 1) = sign(1)

      NewIntrin = Intrinsic::ptrauth_sign;

    } else {

      // sign(0) + auth(0) = nop

      replaceInstUsesWith(*II, BasePtr);

      return eraseInstFromFunction(*II);

    }


    SmallVector<Value *, 4> CallArgs;

    CallArgs.push_back(BasePtr);

    if (AuthKey) {

      CallArgs.push_back(AuthKey);

      CallArgs.push_back(AuthDisc);

    }


    if (NeedSign) {

      CallArgs.push_back(II->getArgOperand(3));

      CallArgs.push_back(II->getArgOperand(4));

    }


    Function *NewFn = Intrinsic::getDeclaration(II->getModule(), NewIntrin);

    return CallInst::Create(NewFn, CallArgs);

  }

  case Intrinsic::arm_neon_vtbl1:

  case Intrinsic::aarch64_neon_tbl1:

    if (Value *V = simplifyNeonTbl1(*II, Builder))

      return replaceInstUsesWith(*II, V);

    break;


  case Intrinsic::arm_neon_vmulls:

  case Intrinsic::arm_neon_vmullu:

  case Intrinsic::aarch64_neon_smull:

  case Intrinsic::aarch64_neon_umull: {

    Value *Arg0 = II->getArgOperand(0);

    Value *Arg1 = II->getArgOperand(1);


    // Handle mul by zero first:

    if (isa<ConstantAggregateZero>(Arg0) || isa<ConstantAggregateZero>(Arg1)) {

      return replaceInstUsesWith(CI, ConstantAggregateZero::get(II->getType()));

    }


    // Check for constant LHS & RHS - in this case we just simplify.

    bool Zext = (IID == Intrinsic::arm_neon_vmullu ||

                 IID == Intrinsic::aarch64_neon_umull);

    VectorType *NewVT = cast<VectorType>(II->getType());

    if (Constant *CV0 = dyn_cast<Constant>(Arg0)) {

      if (Constant *CV1 = dyn_cast<Constant>(Arg1)) {

        Value *V0 = Builder.CreateIntCast(CV0, NewVT, /*isSigned=*/!Zext);

        Value *V1 = Builder.CreateIntCast(CV1, NewVT, /*isSigned=*/!Zext);

        return replaceInstUsesWith(CI, Builder.CreateMul(V0, V1));

      }


      // Couldn't simplify - canonicalize constant to the RHS.

      std::swap(Arg0, Arg1);

    }


    // Handle mul by one:

    if (Constant *CV1 = dyn_cast<Constant>(Arg1))

      if (ConstantInt *Splat =

              dyn_cast_or_null<ConstantInt>(CV1->getSplatValue()))

        if (Splat->isOne())

          return CastInst::CreateIntegerCast(Arg0, II->getType(),

                                             /*isSigned=*/!Zext);


    break;

  }

  case Intrinsic::arm_neon_aesd:

  case Intrinsic::arm_neon_aese:

  case Intrinsic::aarch64_crypto_aesd:

  case Intrinsic::aarch64_crypto_aese: {

    Value *DataArg = II->getArgOperand(0);

    Value *KeyArg  = II->getArgOperand(1);


    // Try to use the builtin XOR in AESE and AESD to eliminate a prior XOR

    Value *Data, *Key;

    if (match(KeyArg, m_ZeroInt()) &&

        match(DataArg, m_Xor(m_Value(Data), m_Value(Key)))) {

      replaceOperand(*II, 0, Data);

      replaceOperand(*II, 1, Key);

      return II;

    }

    break;

  }

  case Intrinsic::hexagon_V6_vandvrt:

  case Intrinsic::hexagon_V6_vandvrt_128B: {

    // Simplify Q -> V -> Q conversion.

    if (auto Op0 = dyn_cast<IntrinsicInst>(II->getArgOperand(0))) {

      Intrinsic::ID ID0 = Op0->getIntrinsicID();

      if (ID0 != Intrinsic::hexagon_V6_vandqrt &&

          ID0 != Intrinsic::hexagon_V6_vandqrt_128B)

        break;

      Value *Bytes = Op0->getArgOperand(1), *Mask = II->getArgOperand(1);

      uint64_t Bytes1 = computeKnownBits(Bytes, 0, Op0).One.getZExtValue();

      uint64_t Mask1 = computeKnownBits(Mask, 0, II).One.getZExtValue();

      // Check if every byte has common bits in Bytes and Mask.

      uint64_t C = Bytes1 & Mask1;

      if ((C & 0xFF) && (C & 0xFF00) && (C & 0xFF0000) && (C & 0xFF000000))

        return replaceInstUsesWith(*II, Op0->getArgOperand(0));

    }

    break;

  }

  case Intrinsic::stackrestore: {

    // Coarse categories for the instructions scanned around a stackrestore.
    enum class ClassifyResult {
      None,                // Anything not covered by the categories below.
      Alloca,              // An alloca instruction.
      StackRestore,        // A call to the stackrestore intrinsic.
      CallWithSideEffects, // A non-intrinsic call, or an intrinsic call that
                           // may have side effects.
    };

    // Maps a single instruction onto one of the ClassifyResult categories.
    auto Classify = [](const Instruction *I) {
      if (isa<AllocaInst>(I))
        return ClassifyResult::Alloca;

      // Everything that is not a call is uninteresting for the scan.
      const auto *Call = dyn_cast<CallInst>(I);
      if (!Call)
        return ClassifyResult::None;

      // Consider all non-intrinsic calls to be side effects.
      const auto *Intr = dyn_cast<IntrinsicInst>(Call);
      if (!Intr)
        return ClassifyResult::CallWithSideEffects;

      if (Intr->getIntrinsicID() == Intrinsic::stackrestore)
        return ClassifyResult::StackRestore;

      return Intr->mayHaveSideEffects() ? ClassifyResult::CallWithSideEffects
                                        : ClassifyResult::None;
    };


    // If the stacksave and the stackrestore are in the same BB, and there is

    // no intervening call, alloca, or stackrestore of a different stacksave,

    // remove the restore. This can happen when variable allocas are DCE'd.

    if (IntrinsicInst *SS = dyn_cast<IntrinsicInst>(II->getArgOperand(0))) {

      if (SS->getIntrinsicID() == Intrinsic::stacksave &&

          SS->getParent() == II->getParent()) {

        BasicBlock::iterator BI(SS);

        bool CannotRemove = false;

        for (++BI; &*BI != II; ++BI) {

          switch (Classify(&*BI)) {

          case ClassifyResult::None:

            // So far so good, look at next instructions.

            break;


          case ClassifyResult::StackRestore:

            // If we found an intervening stackrestore for a different

            // stacksave, we can't remove the stackrestore. Otherwise, continue.

            if (cast<IntrinsicInst>(*BI).getArgOperand(0) != SS)

              CannotRemove = true;

            break;


          case ClassifyResult::Alloca:

          case ClassifyResult::CallWithSideEffects:

            // If we found an alloca, a non-intrinsic call, or an intrinsic

            // call with side effects, we can't remove the stackrestore.

            CannotRemove = true;

            break;

          }

          if (CannotRemove)

            break;

        }


        if (!CannotRemove)

          return eraseInstFromFunction(CI);

      }

    }


    // Scan down this block to see if there is another stack restore in the

    // same block without an intervening call/alloca.

    BasicBlock::iterator BI(II);

    Instruction *TI = II->getParent()->getTerminator();

    bool CannotRemove = false;

    for (++BI; &*BI != TI; ++BI) {

      switch (Classify(&*BI)) {

      case ClassifyResult::None:

        // So far so good, look at next instructions.

        break;


      case ClassifyResult::StackRestore:

        // If there is a stackrestore below this one, remove this one.

        return eraseInstFromFunction(CI);


      case ClassifyResult::Alloca:

      case ClassifyResult::CallWithSideEffects:

        // If we found an alloca, a non-intrinsic call, or an intrinsic call

        // with side effects (such as llvm.stacksave and llvm.read_register),

        // we can't remove the stack restore.

        CannotRemove = true;

        break;

      }

      if (CannotRemove)

        break;

    }


    // If the stack restore is in a return, resume, or unwind block and if there

    // are no allocas or calls between the restore and the return, nuke the

    // restore.

    if (!CannotRemove && (isa<ReturnInst>(TI) || isa<ResumeInst>(TI)))

      return eraseInstFromFunction(CI);

    break;

  }

  case Intrinsic::lifetime_end:

    // Asan needs to poison memory to detect invalid access which is possible

    // even for empty lifetime range.

    if (II->getFunction()->hasFnAttribute(Attribute::SanitizeAddress) ||

        II->getFunction()->hasFnAttribute(Attribute::SanitizeMemory) ||

        II->getFunction()->hasFnAttribute(Attribute::SanitizeHWAddress))

      break;


    if (removeTriviallyEmptyRange(*II, *this, [](const IntrinsicInst &I) {

          return I.getIntrinsicID() == Intrinsic::lifetime_start;

        }))

      return nullptr;

    break;

  case Intrinsic::assume: {

    Value *IIOperand = II->getArgOperand(0);

    SmallVector<OperandBundleDef, 4> OpBundles;

    II->getOperandBundlesAsDefs(OpBundles);


    /// Drops the boolean condition from the assume being visited (II): when
    /// isAssumeWithEmptyBundle() holds for it the call is erased, otherwise
    /// its condition operand is rewritten to `true`. The result is meant to
    /// be returned directly from the visitor.
    /// NOTE(review): \p Assume is only inspected by the assert; the body
    /// operates on II / CI. Confirm that is intended for the caller that
    /// passes the following assume.
    auto RemoveConditionFromAssume = [&](Instruction *Assume) -> Instruction * {
      assert(isa<AssumeInst>(Assume));
      const bool HasEmptyBundle =
          isAssumeWithEmptyBundle(*cast<AssumeInst>(II));
      if (!HasEmptyBundle) {
        // The bundle is not empty: keep the call but neutralize its
        // condition operand.
        replaceUse(II->getOperandUse(0),
                   ConstantInt::getTrue(II->getContext()));
        return nullptr;
      }
      return eraseInstFromFunction(CI);
    };

    // Remove an assume if it is followed by an identical assume.

    // TODO: Do we need this? Unless there are conflicting assumptions, the

    // computeKnownBits(IIOperand) below here eliminates redundant assumes.

    Instruction *Next = II->getNextNonDebugInstruction();

    if (match(Next, m_Intrinsic<Intrinsic::assume>(m_Specific(IIOperand))))

      return RemoveConditionFromAssume(Next);


    // Canonicalize assume(a && b) -> assume(a); assume(b);

    // Note: New assumption intrinsics created here are registered by

    // the InstCombineIRInserter object.

    FunctionType *AssumeIntrinsicTy = II->getFunctionType();

    Value *AssumeIntrinsic = II->getCalledOperand();

    Value *A, *B;

    if (match(IIOperand, m_LogicalAnd(m_Value(A), m_Value(B)))) {

      Builder.CreateCall(AssumeIntrinsicTy, AssumeIntrinsic, A, OpBundles,

                         II->getName());

      Builder.CreateCall(AssumeIntrinsicTy, AssumeIntrinsic, B, II->getName());

      return eraseInstFromFunction(*II);

    }

    // assume(!(a || b)) -> assume(!a); assume(!b);

    if (match(IIOperand, m_Not(m_LogicalOr(m_Value(A), m_Value(B))))) {

      Builder.CreateCall(AssumeIntrinsicTy, AssumeIntrinsic,

                         Builder.CreateNot(A), OpBundles, II->getName());

      Builder.CreateCall(AssumeIntrinsicTy, AssumeIntrinsic,

                         Builder.CreateNot(B), II->getName());

      return eraseInstFromFunction(*II);

    }


    // assume( (load addr) != null ) -> add 'nonnull' metadata to load

    // (if assume is valid at the load)

    CmpInst::Predicate Pred;

    Instruction *LHS;

    if (match(IIOperand, m_ICmp(Pred, m_Instruction(LHS), m_Zero())) &&

        Pred == ICmpInst::ICMP_NE && LHS->getOpcode() == Instruction::Load &&

        LHS->getType()->isPointerTy() &&

        isValidAssumeForContext(II, LHS, &DT)) {

      MDNode *MD = MDNode::get(II->getContext(), std::nullopt);

      LHS->setMetadata(LLVMContext::MD_nonnull, MD);

      LHS->setMetadata(LLVMContext::MD_noundef, MD);

      return RemoveConditionFromAssume(II);


      // TODO: apply nonnull return attributes to calls and invokes

      // TODO: apply range metadata for range check patterns?

    }


    // Separate storage assumptions apply to the underlying allocations, not any

    // particular pointer within them. When evaluating the hints for AA purposes

    // we getUnderlyingObject them; by precomputing the answers here we can

    // avoid having to do so repeatedly there.

    for (unsigned Idx = 0; Idx < II->getNumOperandBundles(); Idx++) {

      OperandBundleUse OBU = II->getOperandBundleAt(Idx);

      if (OBU.getTagName() == "separate_storage") {

        assert(OBU.Inputs.size() == 2);

        // Rewrites the bundle input U to the underlying object of its
        // current value, leaving it untouched when they already coincide.
        auto MaybeSimplifyHint = [&](const Use &U) {
          Value *Original = U.get();
          // Not having a limit is safe because InstCombine removes unreachable
          // code.
          Value *Base = getUnderlyingObject(Original, /*MaxLookup*/ 0);
          if (Base == Original)
            return;
          replaceUse(const_cast<Use &>(U), Base);
        };

        MaybeSimplifyHint(OBU.Inputs[0]);

        MaybeSimplifyHint(OBU.Inputs[1]);

      }

    }


    // Convert nonnull assume like:

    // %A = icmp ne i32* %PTR, null

    // call void @llvm.assume(i1 %A)

    // into

    // call void @llvm.assume(i1 true) [ "nonnull"(i32* %PTR) ]

    if (EnableKnowledgeRetention &&

        match(IIOperand, m_Cmp(Pred, m_Value(A), m_Zero())) &&

        Pred == CmpInst::ICMP_NE && A->getType()->isPointerTy()) {

      if (auto *Replacement = buildAssumeFromKnowledge(

              {RetainedKnowledge{Attribute::NonNull, 0, A}}, Next, &AC, &DT)) {


        Replacement->insertBefore(Next);

        AC.registerAssumption(Replacement);

        return RemoveConditionFromAssume(II);

      }

    }


    // Convert alignment assume like:

    // %B = ptrtoint i32* %A to i64

    // %C = and i64 %B, Constant

    // %D = icmp eq i64 %C, 0

    // call void @llvm.assume(i1 %D)

    // into

    // call void @llvm.assume(i1 true) [ "align"(i32* [[A]], i64  Constant + 1)]

    uint64_t AlignMask;

    if (EnableKnowledgeRetention &&

        match(IIOperand,

              m_Cmp(Pred, m_And(m_Value(A), m_ConstantInt(AlignMask)),

                    m_Zero())) &&

        Pred == CmpInst::ICMP_EQ) {

      if (isPowerOf2_64(AlignMask + 1)) {

        uint64_t Offset = 0;

        match(A, m_Add(m_Value(A), m_ConstantInt(Offset)));

        if (match(A, m_PtrToInt(m_Value(A)))) {

          /// Note: this doesn't preserve the offset information but merges

          /// offset and alignment.

          /// TODO: we can generate a GEP instead of merging the alignment with

          /// the offset.

          RetainedKnowledge RK{Attribute::Alignment,

                               (unsigned)MinAlign(Offset, AlignMask + 1), A};

          if (auto *Replacement =

                  buildAssumeFromKnowledge(RK, Next, &AC, &DT)) {


            Replacement->insertAfter(II);

            AC.registerAssumption(Replacement);

          }

          return RemoveConditionFromAssume(II);

        }

      }

    }


    /// Canonicalize Knowledge in operand bundles.

    if (EnableKnowledgeRetention && II->hasOperandBundles()) {

      for (unsigned Idx = 0; Idx < II->getNumOperandBundles(); Idx++) {

        auto &BOI = II->bundle_op_info_begin()[Idx];

        RetainedKnowledge RK =

          llvm::getKnowledgeFromBundle(cast<AssumeInst>(*II), BOI);

        if (BOI.End - BOI.Begin > 2)

          continue; // Prevent reducing knowledge in an align with offset since

                    // extracting a RetainedKnowledge from them loses offset

                    // information

        RetainedKnowledge CanonRK =

          llvm::simplifyRetainedKnowledge(cast<AssumeInst>(II), RK,

                                          &getAssumptionCache(),

                                          &getDominatorTree());

        if (CanonRK == RK)

          continue;

        if (!CanonRK) {

          if (BOI.End - BOI.Begin > 0) {

            Worklist.pushValue(II->op_begin()[BOI.Begin]);

            Value::dropDroppableUse(II->op_begin()[BOI.Begin]);

          }

          continue;

        }

        assert(RK.AttrKind == CanonRK.AttrKind);

        if (BOI.End - BOI.Begin > 0)

          II->op_begin()[BOI.Begin].set(CanonRK.WasOn);

        if (BOI.End - BOI.Begin > 1)

          II->op_begin()[BOI.Begin + 1].set(ConstantInt::get(

              Type::getInt64Ty(II->getContext()), CanonRK.ArgValue));

        if (RK.WasOn)

          Worklist.pushValue(RK.WasOn);

        return II;

      }

    }


    // If there is a dominating assume with the same condition as this one,

    // then this one is redundant, and should be removed.

    KnownBits Known(1);

    computeKnownBits(IIOperand, Known, 0, II);

    if (Known.isAllOnes() && isAssumeWithEmptyBundle(cast<AssumeInst>(*II)))

      return eraseInstFromFunction(*II);


    // assume(false) is unreachable.

    if (match(IIOperand, m_CombineOr(m_Zero(), m_Undef()))) {

      CreateNonTerminatorUnreachable(II);

      return eraseInstFromFunction(*II);

    }


    // Update the cache of affected values for this assumption (we might be

    // here because we just simplified the condition).

    AC.updateAffectedValues(cast<AssumeInst>(II));

    break;

  }

  case Intrinsic::experimental_guard: {

    // Is this guard followed by another guard?  We scan forward over a small

    // fixed window of instructions to handle common cases with conditions

    // computed between guards.

    Instruction *NextInst = II->getNextNonDebugInstruction();

    for (unsigned i = 0; i < GuardWideningWindow; i++) {

      // Note: Using context-free form to avoid compile time blow up

      if (!isSafeToSpeculativelyExecute(NextInst))

        break;

      NextInst = NextInst->getNextNonDebugInstruction();

    }

    Value *NextCond = nullptr;

    if (match(NextInst,

              m_Intrinsic<Intrinsic::experimental_guard>(m_Value(NextCond)))) {

      Value *CurrCond = II->getArgOperand(0);


      // Remove a guard that is immediately preceded by an identical guard.

      // Otherwise canonicalize guard(a); guard(b) -> guard(a & b).

      if (CurrCond != NextCond) {

        Instruction *MoveI = II->getNextNonDebugInstruction();

        while (MoveI != NextInst) {

          auto *Temp = MoveI;

          MoveI = MoveI->getNextNonDebugInstruction();

          Temp->moveBefore(II);

        }

        replaceOperand(*II, 0, Builder.CreateAnd(CurrCond, NextCond));

      }

      eraseInstFromFunction(*NextInst);

      return II;

    }

    break;

  }

  case Intrinsic::vector_insert: {

    Value *Vec = II->getArgOperand(0);

    Value *SubVec = II->getArgOperand(1);

    Value *Idx = II->getArgOperand(2);

    auto *DstTy = dyn_cast<FixedVectorType>(II->getType());

    auto *VecTy = dyn_cast<FixedVectorType>(Vec->getType());

    auto *SubVecTy = dyn_cast<FixedVectorType>(SubVec->getType());


    // Only canonicalize if the destination vector, Vec, and SubVec are all

    // fixed vectors.

    if (DstTy && VecTy && SubVecTy) {

      unsigned DstNumElts = DstTy->getNumElements();

      unsigned VecNumElts = VecTy->getNumElements();

      unsigned SubVecNumElts = SubVecTy->getNumElements();

      unsigned IdxN = cast<ConstantInt>(Idx)->getZExtValue();


      // An insert that entirely overwrites Vec with SubVec is a nop.

      if (VecNumElts == SubVecNumElts)

        return replaceInstUsesWith(CI, SubVec);


      // Widen SubVec into a vector of the same width as Vec, since

      // shufflevector requires the two input vectors to be the same width.

      // Elements beyond the bounds of SubVec within the widened vector are

      // undefined.

      SmallVector<int, 8> WidenMask;

      unsigned i;

      for (i = 0; i != SubVecNumElts; ++i)

        WidenMask.push_back(i);

      for (; i != VecNumElts; ++i)

        WidenMask.push_back(PoisonMaskElem);


      Value *WidenShuffle = Builder.CreateShuffleVector(SubVec, WidenMask);


      SmallVector<int, 8> Mask;

      for (unsigned i = 0; i != IdxN; ++i)

        Mask.push_back(i);

      for (unsigned i = DstNumElts; i != DstNumElts + SubVecNumElts; ++i)

        Mask.push_back(i);

      for (unsigned i = IdxN + SubVecNumElts; i != DstNumElts; ++i)

        Mask.push_back(i);


      Value *Shuffle = Builder.CreateShuffleVector(Vec, WidenShuffle, Mask);

      return replaceInstUsesWith(CI, Shuffle);

    }

    break;

  }

  case Intrinsic::vector_extract: {

    Value *Vec = II->getArgOperand(0);

    Value *Idx = II->getArgOperand(1);


    Type *ReturnType = II->getType();

    // (extract_vector (insert_vector InsertTuple, InsertValue, InsertIdx),

    // ExtractIdx)

    unsigned ExtractIdx = cast<ConstantInt>(Idx)->getZExtValue();

    Value *InsertTuple, *InsertIdx, *InsertValue;

    if (match(Vec, m_Intrinsic<Intrinsic::vector_insert>(m_Value(InsertTuple),

                                                         m_Value(InsertValue),

                                                         m_Value(InsertIdx))) &&

        InsertValue->getType() == ReturnType) {

      unsigned Index = cast<ConstantInt>(InsertIdx)->getZExtValue();

      // Case where we get the same index right after setting it.

      // extract.vector(insert.vector(InsertTuple, InsertValue, Idx), Idx) -->

      // InsertValue

      if (ExtractIdx == Index)

        return replaceInstUsesWith(CI, InsertValue);

      // If we are getting a different index than what was set in the

      // insert.vector intrinsic. We can just set the input tuple to the one up

      // in the chain. extract.vector(insert.vector(InsertTuple, InsertValue,

      // InsertIndex), ExtractIndex)

      // --> extract.vector(InsertTuple, ExtractIndex)

      else

        return replaceOperand(CI, 0, InsertTuple);

    }


    auto *DstTy = dyn_cast<VectorType>(ReturnType);

    auto *VecTy = dyn_cast<VectorType>(Vec->getType());


    if (DstTy && VecTy) {

      auto DstEltCnt = DstTy->getElementCount();

      auto VecEltCnt = VecTy->getElementCount();

      unsigned IdxN = cast<ConstantInt>(Idx)->getZExtValue();


      // Extracting the entirety of Vec is a nop.

      if (DstEltCnt == VecTy->getElementCount()) {

        replaceInstUsesWith(CI, Vec);

        return eraseInstFromFunction(CI);

      }


      // Only canonicalize to shufflevector if the destination vector and

      // Vec are fixed vectors.

      if (VecEltCnt.isScalable() || DstEltCnt.isScalable())

        break;


      SmallVector<int, 8> Mask;

      for (unsigned i = 0; i != DstEltCnt.getKnownMinValue(); ++i)

        Mask.push_back(IdxN + i);


      Value *Shuffle = Builder.CreateShuffleVector(Vec, Mask);

      return replaceInstUsesWith(CI, Shuffle);

    }

    break;

  }

  case Intrinsic::vector_reverse: {

    Value *BO0, *BO1, *X, *Y;

    Value *Vec = II->getArgOperand(0);

    if (match(Vec, m_OneUse(m_BinOp(m_Value(BO0), m_Value(BO1))))) {

      auto *OldBinOp = cast<BinaryOperator>(Vec);

      if (match(BO0, m_VecReverse(m_Value(X)))) {

        // rev(binop rev(X), rev(Y)) --> binop X, Y

        if (match(BO1, m_VecReverse(m_Value(Y))))

          return replaceInstUsesWith(CI, BinaryOperator::CreateWithCopiedFlags(

                                             OldBinOp->getOpcode(), X, Y,

                                             OldBinOp, OldBinOp->getName(),

                                             II->getIterator()));

        // rev(binop rev(X), BO1Splat) --> binop X, BO1Splat

        if (isSplatValue(BO1))

          return replaceInstUsesWith(CI, BinaryOperator::CreateWithCopiedFlags(

                                             OldBinOp->getOpcode(), X, BO1,

                                             OldBinOp, OldBinOp->getName(),

                                             II->getIterator()));

      }

      // rev(binop BO0Splat, rev(Y)) --> binop BO0Splat, Y

      if (match(BO1, m_VecReverse(m_Value(Y))) && isSplatValue(BO0))

        return replaceInstUsesWith(CI,

                                   BinaryOperator::CreateWithCopiedFlags(

                                       OldBinOp->getOpcode(), BO0, Y, OldBinOp,

                                       OldBinOp->getName(), II->getIterator()));

    }

    // rev(unop rev(X)) --> unop X

    if (match(Vec, m_OneUse(m_UnOp(m_VecReverse(m_Value(X)))))) {

      auto *OldUnOp = cast<UnaryOperator>(Vec);

      auto *NewUnOp = UnaryOperator::CreateWithCopiedFlags(

          OldUnOp->getOpcode(), X, OldUnOp, OldUnOp->getName(),

          II->getIterator());

      return replaceInstUsesWith(CI, NewUnOp);

    }

    break;

  }

  case Intrinsic::vector_reduce_or:

  case Intrinsic::vector_reduce_and: {

    // Canonicalize logical or/and reductions:

    // Or reduction for i1 is represented as:

    // %val = bitcast <ReduxWidth x i1> to iReduxWidth

    // %res = cmp ne iReduxWidth %val, 0

    // And reduction for i1 is represented as:

    // %val = bitcast <ReduxWidth x i1> to iReduxWidth

    // %res = cmp eq iReduxWidth %val, 11111

    Value *Arg = II->getArgOperand(0);

    Value *Vect;


    if (Value *NewOp =

            simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

      replaceUse(II->getOperandUse(0), NewOp);

      return II;

    }


    if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

      if (auto *FTy = dyn_cast<FixedVectorType>(Vect->getType()))

        if (FTy->getElementType() == Builder.getInt1Ty()) {

          Value *Res = Builder.CreateBitCast(

              Vect, Builder.getIntNTy(FTy->getNumElements()));

          if (IID == Intrinsic::vector_reduce_and) {

            Res = Builder.CreateICmpEQ(

                Res, ConstantInt::getAllOnesValue(Res->getType()));

          } else {

            assert(IID == Intrinsic::vector_reduce_or &&

                   "Expected or reduction.");

            Res = Builder.CreateIsNotNull(Res);

          }

          if (Arg != Vect)

            Res = Builder.CreateCast(cast<CastInst>(Arg)->getOpcode(), Res,

                                     II->getType());

          return replaceInstUsesWith(CI, Res);

        }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_add: {

    if (IID == Intrinsic::vector_reduce_add) {

      // Convert vector_reduce_add(ZExt(<n x i1>)) to

      // ZExtOrTrunc(ctpop(bitcast <n x i1> to in)).

      // Convert vector_reduce_add(SExt(<n x i1>)) to

      // -ZExtOrTrunc(ctpop(bitcast <n x i1> to in)).

      // Convert vector_reduce_add(<n x i1>) to

      // Trunc(ctpop(bitcast <n x i1> to in)).

      Value *Arg = II->getArgOperand(0);

      Value *Vect;


      if (Value *NewOp =

              simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

        replaceUse(II->getOperandUse(0), NewOp);

        return II;

      }


      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *FTy = dyn_cast<FixedVectorType>(Vect->getType()))

          if (FTy->getElementType() == Builder.getInt1Ty()) {

            Value *V = Builder.CreateBitCast(

                Vect, Builder.getIntNTy(FTy->getNumElements()));

            Value *Res = Builder.CreateUnaryIntrinsic(Intrinsic::ctpop, V);

            if (Res->getType() != II->getType())

              Res = Builder.CreateZExtOrTrunc(Res, II->getType());

            if (Arg != Vect &&

                cast<Instruction>(Arg)->getOpcode() == Instruction::SExt)

              Res = Builder.CreateNeg(Res);

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_xor: {

    if (IID == Intrinsic::vector_reduce_xor) {

      // Exclusive disjunction reduction over the vector with

      // (potentially-extended) i1 element type is actually a

      // (potentially-extended) arithmetic `add` reduction over the original

      // non-extended value:

      //   vector_reduce_xor(?ext(<n x i1>))

      //     -->

      //   ?ext(vector_reduce_add(<n x i1>))

      Value *Arg = II->getArgOperand(0);

      Value *Vect;


      if (Value *NewOp =

              simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

        replaceUse(II->getOperandUse(0), NewOp);

        return II;

      }


      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *VTy = dyn_cast<VectorType>(Vect->getType()))

          if (VTy->getElementType() == Builder.getInt1Ty()) {

            Value *Res = Builder.CreateAddReduce(Vect);

            if (Arg != Vect)

              Res = Builder.CreateCast(cast<CastInst>(Arg)->getOpcode(), Res,

                                       II->getType());

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_mul: {

    if (IID == Intrinsic::vector_reduce_mul) {

      // Multiplicative reduction over the vector with (potentially-extended)

      // i1 element type is actually a (potentially zero-extended)

      // logical `and` reduction over the original non-extended value:

      //   vector_reduce_mul(?ext(<n x i1>))

      //     -->

      //   zext(vector_reduce_and(<n x i1>))

      Value *Arg = II->getArgOperand(0);

      Value *Vect;


      if (Value *NewOp =

              simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

        replaceUse(II->getOperandUse(0), NewOp);

        return II;

      }


      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *VTy = dyn_cast<VectorType>(Vect->getType()))

          if (VTy->getElementType() == Builder.getInt1Ty()) {

            Value *Res = Builder.CreateAndReduce(Vect);

            if (Res->getType() != II->getType())

              Res = Builder.CreateZExt(Res, II->getType());

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_umin:

  case Intrinsic::vector_reduce_umax: {

    if (IID == Intrinsic::vector_reduce_umin ||

        IID == Intrinsic::vector_reduce_umax) {

      // UMin/UMax reduction over the vector with (potentially-extended)

      // i1 element type is actually a (potentially-extended)

      // logical `and`/`or` reduction over the original non-extended value:

      //   vector_reduce_u{min,max}(?ext(<n x i1>))

      //     -->

      //   ?ext(vector_reduce_{and,or}(<n x i1>))

      Value *Arg = II->getArgOperand(0);

      Value *Vect;


      if (Value *NewOp =

              simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

        replaceUse(II->getOperandUse(0), NewOp);

        return II;

      }


      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *VTy = dyn_cast<VectorType>(Vect->getType()))

          if (VTy->getElementType() == Builder.getInt1Ty()) {

            Value *Res = IID == Intrinsic::vector_reduce_umin

                             ? Builder.CreateAndReduce(Vect)

                             : Builder.CreateOrReduce(Vect);

            if (Arg != Vect)

              Res = Builder.CreateCast(cast<CastInst>(Arg)->getOpcode(), Res,

                                       II->getType());

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_smin:

  case Intrinsic::vector_reduce_smax: {

    if (IID == Intrinsic::vector_reduce_smin ||

        IID == Intrinsic::vector_reduce_smax) {

      // SMin/SMax reduction over the vector with (potentially-extended)

      // i1 element type is actually a (potentially-extended)

      // logical `and`/`or` reduction over the original non-extended value:

      //   vector_reduce_s{min,max}(<n x i1>)

      //     -->

      //   vector_reduce_{or,and}(<n x i1>)

      // and

      //   vector_reduce_s{min,max}(sext(<n x i1>))

      //     -->

      //   sext(vector_reduce_{or,and}(<n x i1>))

      // and

      //   vector_reduce_s{min,max}(zext(<n x i1>))

      //     -->

      //   zext(vector_reduce_{and,or}(<n x i1>))

      Value *Arg = II->getArgOperand(0);

      Value *Vect;


      if (Value *NewOp =

              simplifyReductionOperand(Arg, /*CanReorderLanes=*/true)) {

        replaceUse(II->getOperandUse(0), NewOp);

        return II;

      }


      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *VTy = dyn_cast<VectorType>(Vect->getType()))

          if (VTy->getElementType() == Builder.getInt1Ty()) {

            Instruction::CastOps ExtOpc = Instruction::CastOps::CastOpsEnd;

            if (Arg != Vect)

              ExtOpc = cast<CastInst>(Arg)->getOpcode();

            Value *Res = ((IID == Intrinsic::vector_reduce_smin) ==

                          (ExtOpc == Instruction::CastOps::ZExt))

                             ? Builder.CreateAndReduce(Vect)

                             : Builder.CreateOrReduce(Vect);

            if (Arg != Vect)

              Res = Builder.CreateCast(ExtOpc, Res, II->getType());

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_fmax:

  case Intrinsic::vector_reduce_fmin:

  case Intrinsic::vector_reduce_fadd:

  case Intrinsic::vector_reduce_fmul: {

    bool CanReorderLanes = (IID != Intrinsic::vector_reduce_fadd &&

                            IID != Intrinsic::vector_reduce_fmul) ||

                           II->hasAllowReassoc();

    const unsigned ArgIdx = (IID == Intrinsic::vector_reduce_fadd ||

                             IID == Intrinsic::vector_reduce_fmul)

                                ? 1

                                : 0;

    Value *Arg = II->getArgOperand(ArgIdx);

    if (Value *NewOp = simplifyReductionOperand(Arg, CanReorderLanes)) {

      replaceUse(II->getOperandUse(ArgIdx), NewOp);

      return nullptr;

    }

    break;

  }

  case Intrinsic::is_fpclass: {

    if (Instruction *I = foldIntrinsicIsFPClass(*II))

      return I;

    break;

  }

  case Intrinsic::threadlocal_address: {

    Align MinAlign = getKnownAlignment(II->getArgOperand(0), DL, II, &AC, &DT);

    MaybeAlign Align = II->getRetAlign();

    if (MinAlign > Align.valueOrOne()) {

      II->addRetAttr(Attribute::getWithAlignment(II->getContext(), MinAlign));

      return II;

    }

    break;

  }

  default: {

    // Handle target specific intrinsics

    std::optional<Instruction *> V = targetInstCombineIntrinsic(*II);

    if (V)

      return *V;

    break;

  }

  }


  // Try to fold intrinsic into select operands. This is legal if:

  //  * The intrinsic is speculatable.

  //  * The select condition is not a vector, or the intrinsic does not

  //    perform cross-lane operations.

  switch (IID) {

  case Intrinsic::ctlz:

  case Intrinsic::cttz:

  case Intrinsic::ctpop:

  case Intrinsic::umin:

  case Intrinsic::umax:

  case Intrinsic::smin:

  case Intrinsic::smax:

  case Intrinsic::usub_sat:

  case Intrinsic::uadd_sat:

  case Intrinsic::ssub_sat:

  case Intrinsic::sadd_sat:

    for (Value *Op : II->args())

      if (auto *Sel = dyn_cast<SelectInst>(Op))

        if (Instruction *R = FoldOpIntoSelect(*II, Sel))

          return R;

    [[fallthrough]];

  default:

    break;

  }


  if (Instruction *Shuf = foldShuffledIntrinsicOperands(II, Builder))

    return Shuf;


  // Some intrinsics (like experimental_gc_statepoint) can be used in invoke

  // context, so it is handled in visitCallBase and we should trigger it.

  return visitCallBase(*II);

}


/// Fence instruction simplification.
///
/// Erases \p FI when the neighbouring fence (skipping debug instructions)
/// already makes it redundant. Returns the result of eraseInstFromFunction
/// when the fence is erased, and nullptr when nothing was changed.
Instruction *InstCombinerImpl::visitFenceInst(FenceInst &FI) {
  // True when Candidate is an identical or stronger fence than Other: both
  // must use the same sync scope, that scope must be System or SingleThread,
  // and Candidate's ordering must be at least as strong as Other's.
  auto CoversFence = [](FenceInst *Candidate, FenceInst *Other) {
    const auto Scope = Candidate->getSyncScopeID();
    const bool SameScope = Scope == Other->getSyncScopeID();
    const bool KnownScope =
        Scope == SyncScope::System || Scope == SyncScope::SingleThread;
    if (!SameScope || !KnownScope)
      return false;
    return isAtLeastOrStrongerThan(Candidate->getOrdering(),
                                   Other->getOrdering());
  };

  if (auto *Following =
          dyn_cast<FenceInst>(FI.getNextNonDebugInstruction())) {
    // The isIdenticalTo check is solely here to handle arbitrary
    // target-dependent syncscopes.
    // TODO: Can remove if does not matter in practice.
    if (FI.isIdenticalTo(Following) || CoversFence(Following, &FI))
      return eraseInstFromFunction(FI);
  }

  // The previous instruction may not exist, hence the null-tolerant cast.
  auto *Preceding =
      dyn_cast_or_null<FenceInst>(FI.getPrevNonDebugInstruction());
  if (Preceding && CoversFence(Preceding, &FI))
    return eraseInstFromFunction(FI);

  return nullptr;
}


/// InvokeInst simplification: delegates to the shared visitCallBase handler
/// and returns whatever it returns.
Instruction *InstCombinerImpl::visitInvokeInst(InvokeInst &II) {
  CallBase &Call = II;
  return visitCallBase(Call);
}


/// CallBrInst simplification: delegates to the shared visitCallBase handler
/// and returns whatever it returns.
Instruction *InstCombinerImpl::visitCallBrInst(CallBrInst &CBI) {
  CallBase &Call = CBI;
  return visitCallBase(Call);
}


/// Run LibCallSimplifier on \p CI.
///
/// Returns nullptr when the call has no called function, is a musttail or
/// notail call, or the simplifier produced no replacement. Otherwise bumps
/// NumSimplified and returns \p CI itself if it has no uses, or the result of
/// replacing its uses with the simplified value.
Instruction *InstCombinerImpl::tryOptimizeCall(CallInst *CI) {
  // Skip optimizing notail and musttail calls so
  // LibCallSimplifier::optimizeCall doesn't have to preserve those invariants.
  // LibCallSimplifier::optimizeCall should try to preserve tail calls though.
  const bool HasCallee = CI->getCalledFunction() != nullptr;
  if (!HasCallee || CI->isMustTailCall() || CI->isNoTailCall())
    return nullptr;

  // Callbacks that route the simplifier's replacements and erasures through
  // InstCombine's own helpers. They are kept as named locals so they stay
  // alive for as long as Simplifier does.
  auto ReplaceUsesCB = [this](Instruction *Old, Value *New) {
    replaceInstUsesWith(*Old, New);
  };
  auto EraseCB = [this](Instruction *Dead) { eraseInstFromFunction(*Dead); };

  LibCallSimplifier Simplifier(DL, &TLI, &AC, ORE, BFI, PSI, ReplaceUsesCB,
                               EraseCB);

  Value *With = Simplifier.optimizeCall(CI, Builder);
  if (!With)
    return nullptr;

  ++NumSimplified;
  if (CI->use_empty())
    return CI;
  return replaceInstUsesWith(*CI, With);
}


/// Look for the unique llvm.init.trampoline call among the users of
/// \p TrampMem, where \p TrampMem is an alloca or a pointer cast of one.
///
/// Returns that call only if every user of \p TrampMem is an init.trampoline
/// or adjust.trampoline intrinsic, exactly one init.trampoline is present, and
/// its first operand is \p TrampMem. Returns nullptr in every other case.
static IntrinsicInst *findInitTrampolineFromAlloca(Value *TrampMem) {
  // Strip off at most one level of pointer casts, looking for an alloca.  This
  // is good enough in practice and simpler than handling any number of casts.
  Value *Underlying = TrampMem->stripPointerCasts();
  const bool WasCast = Underlying != TrampMem;
  if (WasCast &&
      !(Underlying->hasOneUse() && Underlying->user_back() == TrampMem))
    return nullptr;
  if (!isa<AllocaInst>(Underlying))
    return nullptr;

  IntrinsicInst *InitTrampoline = nullptr;
  for (User *U : TrampMem->users()) {
    auto *II = dyn_cast<IntrinsicInst>(U);
    if (!II)
      return nullptr;

    switch (II->getIntrinsicID()) {
    case Intrinsic::init_trampoline:
      // More than one init_trampoline writes to this value.  Give up.
      if (InitTrampoline)
        return nullptr;
      InitTrampoline = II;
      break;
    case Intrinsic::adjust_trampoline:
      // Allow any number of calls to adjust.trampoline.
      break;
    default:
      // Any other intrinsic user disqualifies the pattern.
      return nullptr;
    }
  }

  // Fail if no init.trampoline was found, or if the one found does not use
  // the memory as its first operand.
  if (!InitTrampoline || InitTrampoline->getOperand(0) != TrampMem)
    return nullptr;

  return InitTrampoline;
}


/// Walk backwards from \p AdjustTramp to the start of its basic block looking
/// for an llvm.init.trampoline call whose first operand is \p TrampMem.
///
/// Returns that call if it is reached before any instruction that may write
/// to memory. Returns nullptr if such an instruction is hit first or the
/// start of the block is reached.
static IntrinsicInst *findInitTrampolineFromBB(IntrinsicInst *AdjustTramp,
                                               Value *TrampMem) {
  BasicBlock::iterator Cursor = AdjustTramp->getIterator();
  BasicBlock::iterator BlockStart = AdjustTramp->getParent()->begin();

  while (Cursor != BlockStart) {
    --Cursor;
    Instruction &Prev = *Cursor;

    // The init.trampoline check comes first, before the write check below
    // can stop the scan.
    if (auto *II = dyn_cast<IntrinsicInst>(&Prev)) {
      const bool IsInit =
          II->getIntrinsicID() == Intrinsic::init_trampoline;
      if (IsInit && II->getOperand(0) == TrampMem)
        return II;
    }

    // Stop at any other instruction that may write to memory.
    if (Prev.mayWriteToMemory())
      return nullptr;
  }

  return nullptr;
}


// Given a callee that (after stripping pointer casts) is a call to
// llvm.adjust.trampoline, find and return the corresponding call to
// llvm.init.trampoline if the call to the trampoline can be optimized to a
// direct call to a function.  Otherwise return NULL.
//
// The alloca-based lookup is tried first; the same-basic-block backwards scan
// is the fallback.
static IntrinsicInst *findInitTrampoline(Value *Callee) {
  auto *AdjustTramp = dyn_cast<IntrinsicInst>(Callee->stripPointerCasts());
  if (!AdjustTramp)
    return nullptr;
  if (AdjustTramp->getIntrinsicID() != Intrinsic::adjust_trampoline)
    return nullptr;

  Value *TrampMem = AdjustTramp->getOperand(0);

  if (IntrinsicInst *FromAlloca = findInitTrampolineFromAlloca(TrampMem))
    return FromAlloca;

  // Yields nullptr when the block scan also fails.
  return findInitTrampolineFromBB(AdjustTramp, TrampMem);
}


/// Attach return attributes to \p Call based on what getAllocSize and
/// getAllocAlignment report for it.
///
/// A known non-zero size adds dereferenceable(N) when the return is already
/// nonnull, and dereferenceable_or_null(N) otherwise. A constant power-of-two
/// alignment below Value::MaximumAlignment adds an align attribute if it is
/// larger than the existing return alignment.
///
/// Returns true if the call was considered changed.
bool InstCombinerImpl::annotateAnyAllocSite(CallBase &Call,
                                            const TargetLibraryInfo *TLI) {
  // Note: We only handle cases which can't be driven from generic attributes
  // here.  So, for example, nonnull and noalias (which are common properties
  // of some allocation functions) are expected to be handled via annotation
  // of the respective allocator declaration with generic attributes.
  if (!Call.getType()->isPointerTy())
    return false;

  bool Changed = false;
  LLVMContext &Ctx = Call.getContext();

  std::optional<APInt> Size = getAllocSize(&Call, TLI);
  if (Size && *Size != 0) {
    // TODO: We really should just emit deref_or_null here and then
    // let the generic inference code combine that with nonnull.
    const uint64_t Bytes = Size->getLimitedValue();
    const bool RetIsNonNull = Call.hasRetAttr(Attribute::NonNull);
    const Attribute::AttrKind DerefKind =
        RetIsNonNull ? Attribute::Dereferenceable
                     : Attribute::DereferenceableOrNull;

    // Only report a change when the attribute kind was not present before;
    // the attribute itself is (re-)added unconditionally.
    Changed = !Call.hasRetAttr(DerefKind);
    Call.addRetAttr(
        RetIsNonNull
            ? Attribute::getWithDereferenceableBytes(Ctx, Bytes)
            : Attribute::getWithDereferenceableOrNullBytes(Ctx, Bytes));
  }

  // Add alignment attribute if alignment is a power of two constant.
  auto *AlignOpC =
      dyn_cast_or_null<ConstantInt>(getAllocAlignment(&Call, TLI));
  if (!AlignOpC ||
      !AlignOpC->getValue().ult(llvm::Value::MaximumAlignment))
    return Changed;

  const uint64_t AlignmentVal = AlignOpC->getZExtValue();
  if (!llvm::isPowerOf2_64(AlignmentVal))
    return Changed;

  const Align NewAlign(AlignmentVal);
  if (NewAlign > Call.getRetAlign().valueOrOne()) {
    Call.addRetAttr(Attribute::getWithAlignment(Ctx, NewAlign));
    Changed = true;
  }
  return Changed;
}


/// Improvements for call, callbr and invoke instructions.
///
/// The steps below run in order and several of them return early:
///  - annotate allocation sites and mark known-non-null pointer arguments;
///  - try to fold a cast on the callee into the arguments;
///  - for direct callees, drop a stale convergent attribute and turn calls
///    with an incompatible calling convention into unreachable code;
///  - treat calls through null (where null is not defined) or undef as
///    unreachable;
///  - rewrite calls through a trampoline, mark non-throwing inline asm as
///    nounwind, and hand plain calls to tryOptimizeCall;
///  - replace uses with the operand reported by getReturnedArgOperand();
///  - drop kcfi bundles on calls that are no longer indirect;
///  - handle removable allocations and gc.statepoint cleanup.
///
/// \returns a replacement/new instruction produced by one of the steps,
/// \p Call itself when it was only modified in place, or nullptr otherwise.

Instruction *InstCombinerImpl::visitCallBase(CallBase &Call) {

  bool Changed = annotateAnyAllocSite(Call, &TLI);


  // Mark any parameters that are known to be non-null with the nonnull

  // attribute.  This is helpful for inlining calls to functions with null

  // checks on their arguments.

  SmallVector<unsigned, 4> ArgNos;

  unsigned ArgNo = 0;


  for (Value *V : Call.args()) {

    if (V->getType()->isPointerTy() &&

        !Call.paramHasAttr(ArgNo, Attribute::NonNull) &&

        isKnownNonZero(V, getSimplifyQuery().getWithInstruction(&Call)))

      ArgNos.push_back(ArgNo);

    ArgNo++;

  }


  assert(ArgNo == Call.arg_size() && "Call arguments not processed correctly.");


  if (!ArgNos.empty()) {

    AttributeList AS = Call.getAttributes();

    LLVMContext &Ctx = Call.getContext();

    AS = AS.addParamAttribute(Ctx, ArgNos,

                              Attribute::get(Ctx, Attribute::NonNull));

    Call.setAttributes(AS);

    Changed = true;

  }


  // If the callee is a pointer to a function, attempt to move any casts to the

  // arguments of the call/callbr/invoke.

  Value *Callee = Call.getCalledOperand();

  Function *CalleeF = dyn_cast<Function>(Callee);

  // On success transformConstExprCastCall has already replaced and erased the
  // original call, so there is no instruction left to hand back.

  if ((!CalleeF || CalleeF->getFunctionType() != Call.getFunctionType()) &&

      transformConstExprCastCall(Call))

    return nullptr;


  if (CalleeF) {

    // Remove the convergent attr on calls when the callee is not convergent.

    if (Call.isConvergent() && !CalleeF->isConvergent() &&

        !CalleeF->isIntrinsic()) {

      LLVM_DEBUG(dbgs() << "Removing convergent attr from instr " << Call

                        << "\n");

      Call.setNotConvergent();

      return &Call;

    }


    // If the call and callee calling conventions don't match, and neither one

    // of the calling conventions is compatible with C calling convention

    // this call must be unreachable, as the call is undefined.

    if ((CalleeF->getCallingConv() != Call.getCallingConv() &&

         !(CalleeF->getCallingConv() == llvm::CallingConv::C &&

           TargetLibraryInfoImpl::isCallingConvCCompatible(&Call)) &&

         !(Call.getCallingConv() == llvm::CallingConv::C &&

           TargetLibraryInfoImpl::isCallingConvCCompatible(CalleeF))) &&

        // Only do this for calls to a function with a body.  A prototype may

        // not actually end up matching the implementation's calling conv for a

        // variety of reasons (e.g. it may be written in assembly).

        !CalleeF->isDeclaration()) {

      Instruction *OldCall = &Call;

      CreateNonTerminatorUnreachable(OldCall);

      // If OldCall does not return void then replaceInstUsesWith poison.

      // This allows ValueHandlers and custom metadata to adjust itself.

      if (!OldCall->getType()->isVoidTy())

        replaceInstUsesWith(*OldCall, PoisonValue::get(OldCall->getType()));

      if (isa<CallInst>(OldCall))

        return eraseInstFromFunction(*OldCall);


      // We cannot remove an invoke or a callbr, because it would change the

      // CFG, just change the callee to a null pointer.

      cast<CallBase>(OldCall)->setCalledFunction(

          CalleeF->getFunctionType(),

          Constant::getNullValue(CalleeF->getType()));

      return nullptr;

    }

  }


  // Calling a null function pointer is undefined if a null address isn't

  // dereferenceable.

  if ((isa<ConstantPointerNull>(Callee) &&

       !NullPointerIsDefined(Call.getFunction())) ||

      isa<UndefValue>(Callee)) {

    // If Call does not return void then replaceInstUsesWith poison.

    // This allows ValueHandlers and custom metadata to adjust itself.

    if (!Call.getType()->isVoidTy())

      replaceInstUsesWith(Call, PoisonValue::get(Call.getType()));


    if (Call.isTerminator()) {

      // Can't remove an invoke or callbr because we cannot change the CFG.

      return nullptr;

    }


    // This instruction is not reachable, just remove it.

    CreateNonTerminatorUnreachable(&Call);

    return eraseInstFromFunction(Call);

  }


  if (IntrinsicInst *II = findInitTrampoline(Callee))

    return transformCallThroughTrampoline(Call, *II);


  if (isa<InlineAsm>(Callee) && !Call.doesNotThrow()) {

    InlineAsm *IA = cast<InlineAsm>(Callee);

    if (!IA->canThrow()) {

      // Normal inline asm calls cannot throw - mark them

      // 'nounwind'.

      Call.setDoesNotThrow();

      Changed = true;

    }

  }


  // Try to optimize the call if possible, we require DataLayout for most of

  // this.  None of these calls are seen as possibly dead so go ahead and

  // delete the instruction now.

  if (CallInst *CI = dyn_cast<CallInst>(&Call)) {

    Instruction *I = tryOptimizeCall(CI);

    // If we changed something return the result, etc. Otherwise let

    // the fallthrough check.

    if (I) return eraseInstFromFunction(*I);

  }


  // Forward the operand reported by getReturnedArgOperand() to the users of
  // the call when its type can be bitcast losslessly to the call's type.
  // Skipped for musttail calls and for calls without uses.

  if (!Call.use_empty() && !Call.isMustTailCall())

    if (Value *ReturnedArg = Call.getReturnedArgOperand()) {

      Type *CallTy = Call.getType();

      Type *RetArgTy = ReturnedArg->getType();

      if (RetArgTy->canLosslesslyBitCastTo(CallTy))

        return replaceInstUsesWith(

            Call, Builder.CreateBitOrPointerCast(ReturnedArg, CallTy));

    }


  // Drop unnecessary kcfi operand bundles from calls that were converted

  // into direct calls.

  auto Bundle = Call.getOperandBundle(LLVMContext::OB_kcfi);

  if (Bundle && !Call.isIndirectCall()) {

    DEBUG_WITH_TYPE(DEBUG_TYPE "-kcfi", {

      if (CalleeF) {

        ConstantInt *FunctionType = nullptr;

        ConstantInt *ExpectedType = cast<ConstantInt>(Bundle->Inputs[0]);


        if (MDNode *MD = CalleeF->getMetadata(LLVMContext::MD_kcfi_type))

          FunctionType = mdconst::extract<ConstantInt>(MD->getOperand(0));


        if (FunctionType &&

            FunctionType->getZExtValue() != ExpectedType->getZExtValue())

          dbgs() << Call.getModule()->getName()

                 << ": warning: kcfi: " << Call.getCaller()->getName()

                 << ": call to " << CalleeF->getName()

                 << " using a mismatching function pointer type\n";

      }

    });


    return CallBase::removeOperandBundle(&Call, LLVMContext::OB_kcfi);

  }


  if (isRemovableAlloc(&Call, &TLI))

    return visitAllocSite(Call);


  // Handle intrinsics which can be used in both call and invoke context.

  switch (Call.getIntrinsicID()) {

  case Intrinsic::experimental_gc_statepoint: {

    GCStatepointInst &GCSP = *cast<GCStatepointInst>(&Call);

    // Base and derived pointers still referenced by a gc.relocate that
    // survives the cleanup loop below.

    SmallPtrSet<Value *, 32> LiveGcValues;

    for (const GCRelocateInst *Reloc : GCSP.getGCRelocates()) {

      GCRelocateInst &GCR = *const_cast<GCRelocateInst *>(Reloc);


      // Remove the relocation if unused.

      if (GCR.use_empty()) {

        eraseInstFromFunction(GCR);

        continue;

      }


      Value *DerivedPtr = GCR.getDerivedPtr();

      Value *BasePtr = GCR.getBasePtr();


      // Undef is undef, even after relocation.

      if (isa<UndefValue>(DerivedPtr) || isa<UndefValue>(BasePtr)) {

        replaceInstUsesWith(GCR, UndefValue::get(GCR.getType()));

        eraseInstFromFunction(GCR);

        continue;

      }


      if (auto *PT = dyn_cast<PointerType>(GCR.getType())) {

        // The relocation of null will be null for most any collector.

        // TODO: provide a hook for this in GCStrategy.  There might be some

        // weird collector this property does not hold for.

        if (isa<ConstantPointerNull>(DerivedPtr)) {

          // Use null-pointer of gc_relocate's type to replace it.

          replaceInstUsesWith(GCR, ConstantPointerNull::get(PT));

          eraseInstFromFunction(GCR);

          continue;

        }


        // isKnownNonNull -> nonnull attribute

        if (!GCR.hasRetAttr(Attribute::NonNull) &&

            isKnownNonZero(DerivedPtr,

                           getSimplifyQuery().getWithInstruction(&Call))) {

          GCR.addRetAttr(Attribute::NonNull);

          // We discovered new fact, re-check users.

          Worklist.pushUsersToWorkList(GCR);

        }

      }


      // If we have two copies of the same pointer in the statepoint argument

      // list, canonicalize to one.  This may let us common gc.relocates.

      if (GCR.getBasePtr() == GCR.getDerivedPtr() &&

          GCR.getBasePtrIndex() != GCR.getDerivedPtrIndex()) {

        auto *OpIntTy = GCR.getOperand(2)->getType();

        GCR.setOperand(2, ConstantInt::get(OpIntTy, GCR.getBasePtrIndex()));

      }


      // TODO: bitcast(relocate(p)) -> relocate(bitcast(p))

      // Canonicalize on the type from the uses to the defs


      // TODO: relocate((gep p, C, C2, ...)) -> gep(relocate(p), C, C2, ...)

      LiveGcValues.insert(BasePtr);

      LiveGcValues.insert(DerivedPtr);

    }

    std::optional<OperandBundleUse> Bundle =

        GCSP.getOperandBundle(LLVMContext::OB_gc_live);

    unsigned NumOfGCLives = LiveGcValues.size();

    if (!Bundle || NumOfGCLives == Bundle->Inputs.size())

      break;

    // We can reduce the size of gc live bundle.

    // Val2Idx maps each bundle input to its position in the pruned list;
    // NumOfGCLives is stored for inputs that are not in LiveGcValues and is
    // what the asserts below test against.

    DenseMap<Value *, unsigned> Val2Idx;

    std::vector<Value *> NewLiveGc;

    for (Value *V : Bundle->Inputs) {

      if (Val2Idx.count(V))

        continue;

      if (LiveGcValues.count(V)) {

        Val2Idx[V] = NewLiveGc.size();

        NewLiveGc.push_back(V);

      } else

        Val2Idx[V] = NumOfGCLives;

    }

    // Update all gc.relocates

    for (const GCRelocateInst *Reloc : GCSP.getGCRelocates()) {

      GCRelocateInst &GCR = *const_cast<GCRelocateInst *>(Reloc);

      Value *BasePtr = GCR.getBasePtr();

      assert(Val2Idx.count(BasePtr) && Val2Idx[BasePtr] != NumOfGCLives &&

             "Missed live gc for base pointer");

      auto *OpIntTy1 = GCR.getOperand(1)->getType();

      GCR.setOperand(1, ConstantInt::get(OpIntTy1, Val2Idx[BasePtr]));

      Value *DerivedPtr = GCR.getDerivedPtr();

      assert(Val2Idx.count(DerivedPtr) && Val2Idx[DerivedPtr] != NumOfGCLives &&

             "Missed live gc for derived pointer");

      auto *OpIntTy2 = GCR.getOperand(2)->getType();

      GCR.setOperand(2, ConstantInt::get(OpIntTy2, Val2Idx[DerivedPtr]));

    }

    // Create new statepoint instruction.

    OperandBundleDef NewBundle("gc-live", NewLiveGc);

    return CallBase::Create(&Call, NewBundle);

  }

  default: { break; }

  }


  // No step produced a replacement; report in-place attribute changes, if any.

  return Changed ? &Call : nullptr;

}


/// If the callee is a constexpr cast of a function, attempt to move the cast to

/// the arguments of the call/invoke.

/// CallBrInst is not supported.
///
/// The first half of the function is a sequence of legality checks that leave
/// the IR untouched and return false on failure. Once they all pass, a new
/// direct call/invoke to the stripped callee is built, arguments and the
/// return value are cast as needed, uses are redirected and the original
/// instruction is erased.
///
/// \returns true if \p Call was replaced and erased, false if it was left
/// unchanged.

bool InstCombinerImpl::transformConstExprCastCall(CallBase &Call) {

  auto *Callee =

      dyn_cast<Function>(Call.getCalledOperand()->stripPointerCasts());

  if (!Callee)

    return false;


  assert(!isa<CallBrInst>(Call) &&

         "CallBr's don't have a single point after a def to insert at");


  // If this is a call to a thunk function, don't remove the cast. Thunks are

  // used to transparently forward all incoming parameters and outgoing return

  // values, so it's important to leave the cast in place.

  if (Callee->hasFnAttribute("thunk"))

    return false;


  // If this is a call to a naked function, the assembly might be

  // using an argument, or otherwise rely on the frame layout,

  // the function prototype will mismatch.

  if (Callee->hasFnAttribute(Attribute::Naked))

    return false;


  // If this is a musttail call, the callee's prototype must match the caller's

  // prototype with the exception of pointee types. The code below doesn't

  // implement that, so we can't do this transform.

  // TODO: Do the transform if it only requires adding pointer casts.

  if (Call.isMustTailCall())

    return false;


  Instruction *Caller = &Call;

  const AttributeList &CallerPAL = Call.getAttributes();


  // Okay, this is a cast from a function to a different type.  Unless doing so

  // would cause a type conversion of one of our arguments, change this call to

  // be a direct call with arguments casted to the appropriate types.

  FunctionType *FT = Callee->getFunctionType();

  Type *OldRetTy = Caller->getType();

  Type *NewRetTy = FT->getReturnType();


  // Check to see if we are changing the return type...

  if (OldRetTy != NewRetTy) {


    if (NewRetTy->isStructTy())

      return false; // TODO: Handle multiple return values.


    if (!CastInst::isBitOrNoopPointerCastable(NewRetTy, OldRetTy, DL)) {

      if (Callee->isDeclaration())

        return false;   // Cannot transform this return value.


      if (!Caller->use_empty() &&

          // void -> non-void is handled specially

          !NewRetTy->isVoidTy())

        return false;   // Cannot transform this return value.

    }


    if (!CallerPAL.isEmpty() && !Caller->use_empty()) {

      AttrBuilder RAttrs(FT->getContext(), CallerPAL.getRetAttrs());

      if (RAttrs.overlaps(AttributeFuncs::typeIncompatible(NewRetTy)))

        return false;   // Attribute not compatible with transformed value.

    }


    // If the callbase is an invoke instruction, and the return value is

    // used by a PHI node in a successor, we cannot change the return type of

    // the call because there is no place to put the cast instruction (without

    // breaking the critical edge).  Bail out in this case.

    if (!Caller->use_empty()) {

      BasicBlock *PhisNotSupportedBlock = nullptr;

      if (auto *II = dyn_cast<InvokeInst>(Caller))

        PhisNotSupportedBlock = II->getNormalDest();

      if (PhisNotSupportedBlock)

        for (User *U : Caller->users())

          if (PHINode *PN = dyn_cast<PHINode>(U))

            if (PN->getParent() == PhisNotSupportedBlock)

              return false;

    }

  }


  // Arguments that exist both at the call site and in the callee's fixed
  // parameter list; only these are type-checked and cast below.

  unsigned NumActualArgs = Call.arg_size();

  unsigned NumCommonArgs = std::min(FT->getNumParams(), NumActualArgs);


  // Prevent us turning:

  // declare void @takes_i32_inalloca(i32* inalloca)

  //  call void bitcast (void (i32*)* @takes_i32_inalloca to void (i32)*)(i32 0)

  //

  // into:

  //  call void @takes_i32_inalloca(i32* null)

  //

  //  Similarly, avoid folding away bitcasts of byval calls.

  if (Callee->getAttributes().hasAttrSomewhere(Attribute::InAlloca) ||

      Callee->getAttributes().hasAttrSomewhere(Attribute::Preallocated))

    return false;


  // Validation pass over the common arguments; nothing is modified here.

  auto AI = Call.arg_begin();

  for (unsigned i = 0, e = NumCommonArgs; i != e; ++i, ++AI) {

    Type *ParamTy = FT->getParamType(i);

    Type *ActTy = (*AI)->getType();


    if (!CastInst::isBitOrNoopPointerCastable(ActTy, ParamTy, DL))

      return false;   // Cannot transform this parameter value.


    // Check if there are any incompatible attributes we cannot drop safely.

    if (AttrBuilder(FT->getContext(), CallerPAL.getParamAttrs(i))

            .overlaps(AttributeFuncs::typeIncompatible(

                ParamTy, AttributeFuncs::ASK_UNSAFE_TO_DROP)))

      return false;   // Attribute not compatible with transformed value.


    if (Call.isInAllocaArgument(i) ||

        CallerPAL.hasParamAttr(i, Attribute::Preallocated))

      return false; // Cannot transform to and from inalloca/preallocated.


    if (CallerPAL.hasParamAttr(i, Attribute::SwiftError))

      return false;


    if (CallerPAL.hasParamAttr(i, Attribute::ByVal) !=

        Callee->getAttributes().hasParamAttr(i, Attribute::ByVal))

      return false; // Cannot transform to or from byval.

  }


  if (Callee->isDeclaration()) {

    // Do not delete arguments unless we have a function body.

    if (FT->getNumParams() < NumActualArgs && !FT->isVarArg())

      return false;


    // If the callee is just a declaration, don't change the varargsness of the

    // call.  We don't want to introduce a varargs call where one doesn't

    // already exist.

    if (FT->isVarArg() != Call.getFunctionType()->isVarArg())

      return false;


    // If both the callee and the cast type are varargs, we still have to make

    // sure the number of fixed parameters are the same or we have the same

    // ABI issues as if we introduce a varargs call.

    if (FT->isVarArg() && Call.getFunctionType()->isVarArg() &&

        FT->getNumParams() != Call.getFunctionType()->getNumParams())

      return false;

  }


  if (FT->getNumParams() < NumActualArgs && FT->isVarArg() &&

      !CallerPAL.isEmpty()) {

    // In this case we have more arguments than the new function type, but we

    // won't be dropping them.  Check that these extra arguments have attributes

    // that are compatible with being a vararg call argument.

    unsigned SRetIdx;

    if (CallerPAL.hasAttrSomewhere(Attribute::StructRet, &SRetIdx) &&

        SRetIdx - AttributeList::FirstArgIndex >= FT->getNumParams())

      return false;

  }


  // Okay, we decided that this is a safe thing to do: go ahead and start

  // inserting cast instructions as necessary.

  SmallVector<Value *, 8> Args;

  SmallVector<AttributeSet, 8> ArgAttrs;

  Args.reserve(NumActualArgs);

  ArgAttrs.reserve(NumActualArgs);


  // Get any return attributes.

  AttrBuilder RAttrs(FT->getContext(), CallerPAL.getRetAttrs());


  // If the return value is not being used, the type may not be compatible

  // with the existing attributes.  Wipe out any problematic attributes.

  RAttrs.remove(AttributeFuncs::typeIncompatible(NewRetTy));


  LLVMContext &Ctx = Call.getContext();

  AI = Call.arg_begin();

  for (unsigned i = 0; i != NumCommonArgs; ++i, ++AI) {

    Type *ParamTy = FT->getParamType(i);


    Value *NewArg = *AI;

    if ((*AI)->getType() != ParamTy)

      NewArg = Builder.CreateBitOrPointerCast(*AI, ParamTy);

    Args.push_back(NewArg);


    // Add any parameter attributes except the ones incompatible with the new

    // type. Note that we made sure all incompatible ones are safe to drop.

    AttributeMask IncompatibleAttrs = AttributeFuncs::typeIncompatible(

        ParamTy, AttributeFuncs::ASK_SAFE_TO_DROP);

    ArgAttrs.push_back(

        CallerPAL.getParamAttrs(i).removeAttributes(Ctx, IncompatibleAttrs));

  }


  // If the function takes more arguments than the call was taking, add them

  // now.

  for (unsigned i = NumCommonArgs; i != FT->getNumParams(); ++i) {

    Args.push_back(Constant::getNullValue(FT->getParamType(i)));

    ArgAttrs.push_back(AttributeSet());

  }


  // If we are removing arguments to the function, emit an obnoxious warning.

  // Surplus arguments are forwarded only when the callee is vararg; for a
  // non-vararg callee they are not added to Args at all.

  if (FT->getNumParams() < NumActualArgs) {

    // TODO: if (!FT->isVarArg()) this call may be unreachable. PR14722

    if (FT->isVarArg()) {

      // Add all of the arguments in their promoted form to the arg list.

      for (unsigned i = FT->getNumParams(); i != NumActualArgs; ++i, ++AI) {

        Type *PTy = getPromotedType((*AI)->getType());

        Value *NewArg = *AI;

        if (PTy != (*AI)->getType()) {

          // Must promote to pass through va_arg area!

          Instruction::CastOps opcode =

            CastInst::getCastOpcode(*AI, false, PTy, false);

          NewArg = Builder.CreateCast(opcode, *AI, PTy);

        }

        Args.push_back(NewArg);


        // Add any parameter attributes.

        ArgAttrs.push_back(CallerPAL.getParamAttrs(i));

      }

    }

  }


  AttributeSet FnAttrs = CallerPAL.getFnAttrs();


  if (NewRetTy->isVoidTy())

    Caller->setName("");   // Void type should not have a name.


  assert((ArgAttrs.size() == FT->getNumParams() || FT->isVarArg()) &&

         "missing argument attributes");

  AttributeList NewCallerPAL = AttributeList::get(

      Ctx, FnAttrs, AttributeSet::get(Ctx, RAttrs), ArgAttrs);


  SmallVector<OperandBundleDef, 1> OpBundles;

  Call.getOperandBundlesAsDefs(OpBundles);


  // Build the replacement as the same kind of instruction as the original
  // (callbr was ruled out by the assert at the top).

  CallBase *NewCall;

  if (InvokeInst *II = dyn_cast<InvokeInst>(Caller)) {

    NewCall = Builder.CreateInvoke(Callee, II->getNormalDest(),

                                   II->getUnwindDest(), Args, OpBundles);

  } else {

    NewCall = Builder.CreateCall(Callee, Args, OpBundles);

    cast<CallInst>(NewCall)->setTailCallKind(

        cast<CallInst>(Caller)->getTailCallKind());

  }

  NewCall->takeName(Caller);

  NewCall->setCallingConv(Call.getCallingConv());

  NewCall->setAttributes(NewCallerPAL);


  // Preserve prof metadata if any.

  NewCall->copyMetadata(*Caller, {LLVMContext::MD_prof});


  // Insert a cast of the return type as necessary.

  Instruction *NC = NewCall;

  Value *NV = NC;

  if (OldRetTy != NV->getType() && !Caller->use_empty()) {

    if (!NV->getType()->isVoidTy()) {

      NV = NC = CastInst::CreateBitOrPointerCast(NC, OldRetTy);

      NC->setDebugLoc(Caller->getDebugLoc());


      auto OptInsertPt = NewCall->getInsertionPointAfterDef();

      assert(OptInsertPt && "No place to insert cast");

      InsertNewInstBefore(NC, *OptInsertPt);

      Worklist.pushUsersToWorkList(*Caller);

    } else {

      // The new call produces void, so there is no value to cast; the
      // remaining users of the old result receive poison instead.

      NV = PoisonValue::get(Caller->getType());

    }

  }


  if (!Caller->use_empty())

    replaceInstUsesWith(*Caller, NV);

  else if (Caller->hasValueHandle()) {

    if (OldRetTy == NV->getType())

      ValueHandleBase::ValueIsRAUWd(Caller, NV);

    else

      // We cannot call ValueIsRAUWd with a different type, and the

      // actual tracked value will disappear.

      ValueHandleBase::ValueIsDeleted(Caller);

  }


  eraseInstFromFunction(*Caller);

  return true;

}


/// Turn a call to a function created by init_trampoline / adjust_trampoline
/// intrinsic pair into a direct call to the underlying function.
///
/// \param Call  the call, invoke or callbr whose callee goes through the
///              trampoline.
/// \param Tramp the init-trampoline intrinsic; its operand 1 (after stripping
///              pointer casts) is the target function and its operand 2 is the
///              chain value passed for the 'nest' parameter.
/// \returns nullptr if \p Call already has a 'nest' attribute somewhere; a
///          newly created call/invoke/callbr to the target when the target has
///          a 'nest' parameter; otherwise \p Call itself after its callee has
///          been redirected in place.
Instruction *
InstCombinerImpl::transformCallThroughTrampoline(CallBase &Call,
                                                 IntrinsicInst &Tramp) {
  FunctionType *FTy = Call.getFunctionType();
  AttributeList Attrs = Call.getAttributes();

  // If the call already has the 'nest' attribute somewhere then give up -
  // otherwise 'nest' would occur twice after splicing in the chain.
  if (Attrs.hasAttrSomewhere(Attribute::Nest))
    return nullptr;

  Function *NestF = cast<Function>(Tramp.getArgOperand(1)->stripPointerCasts());
  FunctionType *NestFTy = NestF->getFunctionType();

  // Look for a parameter of the target marked with the 'nest' attribute and
  // remember its position, type and attribute set.
  unsigned NestArgNo = 0;
  Type *NestTy = nullptr;
  AttributeSet NestAttr;
  AttributeList NestAttrs = NestF->getAttributes();
  if (!NestAttrs.isEmpty()) {
    for (FunctionType::param_iterator I = NestFTy->param_begin(),
                                      E = NestFTy->param_end();
         I != E; ++I, ++NestArgNo) {
      AttributeSet AS = NestAttrs.getParamAttrs(NestArgNo);
      if (!AS.hasAttribute(Attribute::Nest))
        continue;
      NestTy = *I;
      NestAttr = AS;
      break;
    }
  }

  if (!NestTy) {
    // Replace the trampoline call with a direct call.  Since there is no
    // 'nest' parameter, there is no need to adjust the argument list.  Let the
    // generic code sort out any function type mismatches.
    Call.setCalledFunction(FTy, NestF);
    return &Call;
  }

  // Insert the nest argument into the call argument list, which may mean
  // appending it.  Likewise for attributes.  Both vectors can grow by one.
  std::vector<Value *> NewArgs;
  std::vector<AttributeSet> NewArgAttrs;
  NewArgs.reserve(Call.arg_size() + 1);
  NewArgAttrs.reserve(Call.arg_size() + 1);

  // Adds the chain argument (cast to the 'nest' parameter type if needed)
  // together with the attributes of the 'nest' parameter.
  auto AddChainArg = [&] {
    Value *NestVal = Tramp.getArgOperand(2);
    if (NestVal->getType() != NestTy)
      NestVal = Builder.CreateBitCast(NestVal, NestTy, "nest");
    NewArgs.push_back(NestVal);
    NewArgAttrs.push_back(NestAttr);
  };

  unsigned ArgNo = 0;
  for (Value *Arg : Call.args()) {
    if (ArgNo == NestArgNo)
      AddChainArg();
    // Add the original argument and attributes.
    NewArgs.push_back(Arg);
    NewArgAttrs.push_back(Attrs.getParamAttrs(ArgNo));
    ++ArgNo;
  }
  // The 'nest' slot sits right after the last actual argument: append.  If it
  // lies even further out, the chain is not inserted at all.
  if (ArgNo == NestArgNo)
    AddChainArg();

  // The trampoline may have been bitcast to a bogus type (FTy).
  // Handle this by synthesizing a new function type, equal to FTy
  // with the chain parameter inserted.
  std::vector<Type *> NewTypes;
  NewTypes.reserve(FTy->getNumParams() + 1);

  unsigned ParamNo = 0;
  for (FunctionType::param_iterator I = FTy->param_begin(),
                                    E = FTy->param_end();
       I != E; ++I, ++ParamNo) {
    if (ParamNo == NestArgNo)
      NewTypes.push_back(NestTy); // Add the chain's type.
    NewTypes.push_back(*I);       // Add the original type.
  }
  if (ParamNo == NestArgNo)
    NewTypes.push_back(NestTy);

  // Replace the trampoline call with a direct call.  Let the generic
  // code sort out any function type mismatches.
  FunctionType *NewFTy =
      FunctionType::get(FTy->getReturnType(), NewTypes, FTy->isVarArg());
  AttributeList NewPAL =
      AttributeList::get(FTy->getContext(), Attrs.getFnAttrs(),
                         Attrs.getRetAttrs(), NewArgAttrs);

  SmallVector<OperandBundleDef, 1> OpBundles;
  Call.getOperandBundlesAsDefs(OpBundles);

  // Create the same kind of call-like instruction as the original.
  CallBase *NewCaller;
  if (InvokeInst *II = dyn_cast<InvokeInst>(&Call)) {
    NewCaller = InvokeInst::Create(NewFTy, NestF, II->getNormalDest(),
                                   II->getUnwindDest(), NewArgs, OpBundles);
  } else if (CallBrInst *CBI = dyn_cast<CallBrInst>(&Call)) {
    NewCaller = CallBrInst::Create(NewFTy, NestF, CBI->getDefaultDest(),
                                   CBI->getIndirectDests(), NewArgs, OpBundles);
  } else {
    CallInst *NewCI = CallInst::Create(NewFTy, NestF, NewArgs, OpBundles);
    NewCI->setTailCallKind(cast<CallInst>(Call).getTailCallKind());
    NewCaller = NewCI;
  }

  // Calling convention, attributes and debug location carry over identically
  // for all three instruction kinds.
  NewCaller->setCallingConv(Call.getCallingConv());
  NewCaller->setAttributes(NewPAL);
  NewCaller->setDebugLoc(Call.getDebugLoc());

  return NewCaller;
}

Intr
unsigned Intr
Definition: AMDGPUBaseInfo.cpp:2910

Select
amdgpu AMDGPU Register Bank Select
Definition: AMDGPURegBankSelect.cpp:46

APFloat.h
This file declares a class to represent arbitrary precision floating point values and provide a varie...

APInt.h
This file implements a class to represent arbitrary precision integral constant values and operations...

APSInt.h
This file implements the APSInt class, which is a simple class that represents an arbitrary sized int...

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition: ARMSLSHardening.cpp:73

IT
static cl::opt< ITMode > IT(cl::desc("IT block support"), cl::Hidden, cl::init(DefaultIT), cl::values(clEnumValN(DefaultIT, "arm-default-it", "Generate any type of IT block"), clEnumValN(RestrictedIT, "arm-restrict-it", "Disallow complex IT blocks")))

AliasAnalysis.h

ArrayRef.h

AssumeBundleBuilder.h

AssumeBundleQueries.h

AssumptionCache.h

AtomicOrdering.h
Atomic ordering constants.

AttributeMask.h

Attributes.h
This file contains the simple types necessary to represent the attributes associated with functions a...

BasicBlock.h

From
BlockVerifier::State From
Definition: BlockVerifier.cpp:57

B
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")

A
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")

D
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")

Casting.h

CommandLine.h

Compiler.h

Constant.h

Constants.h
This file contains the declarations for the subclasses of Constant, which represent the different fla...

foldBitOrderCrossLogicOp
static SDValue foldBitOrderCrossLogicOp(SDNode *N, SelectionDAG &DAG)
Definition: DAGCombiner.cpp:10278

DataLayout.h

RetTy
return RetTy
Definition: DeadArgumentElimination.cpp:360

Idx
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
Definition: DeadArgumentElimination.cpp:352

Debug.h

LLVM_DEBUG
#define LLVM_DEBUG(X)
Definition: Debug.h:101

DEBUG_WITH_TYPE
#define DEBUG_WITH_TYPE(TYPE, X)
DEBUG_WITH_TYPE macro - This macro should be used by passes to emit debug information.
Definition: Debug.h:64

DerivedTypes.h

Size
uint64_t Size
Definition: ELFObjHandler.cpp:81

X
static GCMetadataPrinterRegistry::Add< ErlangGCPrinter > X("erlang", "erlang-compatible garbage collector")

Function.h

DEBUG_TYPE
#define DEBUG_TYPE
Definition: GenericCycleImpl.h:30

GlobalVariable.h

MI
IRTranslator LLVM IR MI
Definition: IRTranslator.cpp:113

Instruction.h

InlineAsm.h

getPromotedType
static Type * getPromotedType(Type *Ty)
Return the specified type promoted as it would be to pass though a va_arg area.
Definition: InstCombineCalls.cpp:94

createOverflowTuple
static Instruction * createOverflowTuple(IntrinsicInst *II, Value *Result, Constant *Overflow)
Creates a result tuple for an overflow intrinsic II with a given Result and a constant Overflow value...
Definition: InstCombineCalls.cpp:814

findInitTrampolineFromAlloca
static IntrinsicInst * findInitTrampolineFromAlloca(Value *TrampMem)
Definition: InstCombineCalls.cpp:3693

removeTriviallyEmptyRange
static bool removeTriviallyEmptyRange(IntrinsicInst &EndI, InstCombinerImpl &IC, std::function< bool(const IntrinsicInst &)> IsStart)
Definition: InstCombineCalls.cpp:766

inputDenormalIsDAZ
static bool inputDenormalIsDAZ(const Function &F, const Type *Ty)
Definition: InstCombineCalls.cpp:838

reassociateMinMaxWithConstantInOperand
static Instruction * reassociateMinMaxWithConstantInOperand(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
If this min/max has a matching min/max operand with a constant, try to push the constant operand into...
Definition: InstCombineCalls.cpp:1259

signBitMustBeTheSame
static bool signBitMustBeTheSame(Value *Op0, Value *Op1, const SimplifyQuery &SQ)
Return true if two values Op0 and Op1 are known to have the same sign.
Definition: InstCombineCalls.cpp:1071

moveAddAfterMinMax
static Instruction * moveAddAfterMinMax(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
Try to canonicalize min/max(X + C0, C1) as min/max(X, C1 - C0) + C0.
Definition: InstCombineCalls.cpp:1084

simplifyInvariantGroupIntrinsic
static Instruction * simplifyInvariantGroupIntrinsic(IntrinsicInst &II, InstCombinerImpl &IC)
This function transforms launder.invariant.group and strip.invariant.group like: launder(launder(x)) ...
Definition: InstCombineCalls.cpp:451

haveSameOperands
static bool haveSameOperands(const IntrinsicInst &I, const IntrinsicInst &E, unsigned NumOperands)
Definition: InstCombineCalls.cpp:746

getKnownSign
static std::optional< bool > getKnownSign(Value *Op, const SimplifyQuery &SQ)
Definition: InstCombineCalls.cpp:1044

GuardWideningWindow
static cl::opt< unsigned > GuardWideningWindow("instcombine-guard-widening-window", cl::init(3), cl::desc("How wide an instruction window to bypass looking for " "another guard"))

hasUndefSource
static bool hasUndefSource(AnyMemTransferInst *MI)
Recognize a memcpy/memmove from a trivially otherwise unused alloca.
Definition: InstCombineCalls.cpp:105

foldShuffledIntrinsicOperands
static Instruction * foldShuffledIntrinsicOperands(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
If all arguments of the intrinsic are unary shuffles with the same mask, try to shuffle after the int...
Definition: InstCombineCalls.cpp:1346

factorizeMinMaxTree
static Instruction * factorizeMinMaxTree(IntrinsicInst *II)
Reduce a sequence of min/max intrinsics with a common operand.
Definition: InstCombineCalls.cpp:1287

simplifyNeonTbl1
static Value * simplifyNeonTbl1(const IntrinsicInst &II, InstCombiner::BuilderTy &Builder)
Convert a table lookup to shufflevector if the mask is constant.
Definition: InstCombineCalls.cpp:710

foldClampRangeOfTwo
static Instruction * foldClampRangeOfTwo(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
If we have a clamp pattern like max (min X, 42), 41 – where the output can only be one of two possibl...
Definition: InstCombineCalls.cpp:1185

simplifyReductionOperand
static Value * simplifyReductionOperand(Value *Arg, bool CanReorderLanes)
Definition: InstCombineCalls.cpp:1432

findInitTrampolineFromBB
static IntrinsicInst * findInitTrampolineFromBB(IntrinsicInst *AdjustTramp, Value *TrampMem)
Definition: InstCombineCalls.cpp:3732

getKnownSignOrZero
static std::optional< bool > getKnownSignOrZero(Value *Op, const SimplifyQuery &SQ)
Definition: InstCombineCalls.cpp:1058

foldMinimumOverTrailingOrLeadingZeroCount
static Value * foldMinimumOverTrailingOrLeadingZeroCount(Value *I0, Value *I1, const DataLayout &DL, InstCombiner::BuilderTy &Builder)
Fold an unsigned minimum of trailing or leading zero bits counts: umin(cttz(CtOp, ZeroUndef),...
Definition: InstCombineCalls.cpp:1465

foldCtpop
static Instruction * foldCtpop(IntrinsicInst &II, InstCombinerImpl &IC)
Definition: InstCombineCalls.cpp:629

foldCttzCtlz
static Instruction * foldCttzCtlz(IntrinsicInst &II, InstCombinerImpl &IC)
Definition: InstCombineCalls.cpp:481

findInitTrampoline
static IntrinsicInst * findInitTrampoline(Value *Callee)
Definition: InstCombineCalls.cpp:3753

fpclassTestIsFCmp0
static FCmpInst::Predicate fpclassTestIsFCmp0(FPClassTest Mask, const Function &F, Type *Ty)
Definition: InstCombineCalls.cpp:846

reassociateMinMaxWithConstants
static Value * reassociateMinMaxWithConstants(IntrinsicInst *II, IRBuilderBase &Builder, const SimplifyQuery &SQ)
If this min/max has a constant operand and an operand that is a matching min/max with a constant oper...
Definition: InstCombineCalls.cpp:1225

canonicalizeConstantArg0ToArg1
static CallInst * canonicalizeConstantArg0ToArg1(CallInst &Call)
Definition: InstCombineCalls.cpp:801

InstCombineInternal.h
This file provides internal interfaces used to implement the InstCombine.

InstCombiner.h
This file provides the interface for the instcombine pass implementation.

InstrTypes.h

InstructionSimplify.h

InstructionWorklist.h

Instructions.h

IntrinsicInst.h

Intrinsics.h

KnownBits.h

LLVMContext.h

Loads.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

MathExtras.h

MemoryBuiltins.h

Metadata.h
This file contains the declarations for metadata subclasses.

Range
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))

II
uint64_t IntrinsicInst * II
Definition: NVVMIntrRange.cpp:52

Y
static GCMetadataPrinterRegistry::Add< OcamlGCMetadataPrinter > Y("ocaml", "ocaml 3.10-compatible collector")

PatternMatch.h

Cond
const SmallVectorImpl< MachineOperand > & Cond
Definition: RISCVRedundantCopyElimination.cpp:75

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

STLFunctionalExtras.h

SimplifyLibCalls.h

SmallBitVector.h
This file implements the SmallBitVector class.

SmallVector.h
This file defines the SmallVector class.

Statepoint.h

Statistic.h
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...

STATISTIC
#define STATISTIC(VARNAME, DESC)
Definition: Statistic.h:167

Ptr
@ Ptr
Definition: TargetLibraryInfo.cpp:77

Struct
@ Struct
Definition: TargetLibraryInfo.cpp:78

Local.h

Type.h

User.h

getOpcode
static std::optional< unsigned > getOpcode(ArrayRef< VPValue * > Values)
Returns the opcode of Values or ~0 if they do not all agree.
Definition: VPlanSLP.cpp:191

ValueHandle.h

inputDenormalIsIEEE
static bool inputDenormalIsIEEE(const Function &F, const Type *Ty)
Return true if it's possible to assume IEEE treatment of input denormals in F for Val.
Definition: ValueTracking.cpp:4221

ValueTracking.h

Value.h

VectorUtils.h

RHS
Value * RHS
Definition: X86PartialReduction.cpp:76

LHS
Value * LHS
Definition: X86PartialReduction.cpp:75

FunctionType
Definition: ItaniumDemangle.h:799

VectorType
Definition: ItaniumDemangle.h:1149

llvm::AAResults::getModRefInfoMask
ModRefInfo getModRefInfoMask(const MemoryLocation &Loc, bool IgnoreLocals=false)
Returns a bitmask that should be unconditionally applied to the ModRef info of a memory location.
Definition: AliasAnalysis.cpp:149

llvm::APFloat
Definition: APFloat.h:811

llvm::APFloat::isNegative
bool isNegative() const
Definition: APFloat.h:1354

llvm::APFloat::clearSign
void clearSign()
Definition: APFloat.h:1209

llvm::APInt
Class for arbitrary precision integers.
Definition: APInt.h:78

llvm::APInt::getAllOnes
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
Definition: APInt.h:214

llvm::APInt::getSignMask
static APInt getSignMask(unsigned BitWidth)
Get the SignMask for a specific bit width.
Definition: APInt.h:209

llvm::APInt::usub_ov
APInt usub_ov(const APInt &RHS, bool &Overflow) const
Definition: APInt.cpp:1918

llvm::APInt::isZero
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
Definition: APInt.h:360

llvm::APInt::getBitWidth
unsigned getBitWidth() const
Return the number of bits in the APInt.
Definition: APInt.h:1448

llvm::APInt::ult
bool ult(const APInt &RHS) const
Unsigned less than comparison.
Definition: APInt.h:1091

llvm::APInt::sadd_ov
APInt sadd_ov(const APInt &RHS, bool &Overflow) const
Definition: APInt.cpp:1898

llvm::APInt::uadd_ov
APInt uadd_ov(const APInt &RHS, bool &Overflow) const
Definition: APInt.cpp:1905

llvm::APInt::getSignedMinValue
static APInt getSignedMinValue(unsigned numBits)
Gets minimum signed value of APInt for a specific bit width.
Definition: APInt.h:199

llvm::APInt::uadd_sat
APInt uadd_sat(const APInt &RHS) const
Definition: APInt.cpp:2006

llvm::APInt::isNonNegative
bool isNonNegative() const
Determine if this APInt Value is non-negative (>= 0)
Definition: APInt.h:314

llvm::APInt::getLowBitsSet
static APInt getLowBitsSet(unsigned numBits, unsigned loBitsSet)
Constructs an APInt value that has the bottom loBitsSet bits set.
Definition: APInt.h:286

llvm::APInt::ssub_ov
APInt ssub_ov(const APInt &RHS, bool &Overflow) const
Definition: APInt.cpp:1911

llvm::APSInt::getMinValue
static APSInt getMinValue(uint32_t numBits, bool Unsigned)
Return the APSInt representing the minimum integer value with the given bit width and signedness.
Definition: APSInt.h:311

llvm::APSInt::getMaxValue
static APSInt getMaxValue(uint32_t numBits, bool Unsigned)
Return the APSInt representing the maximum integer value with the given bit width and signedness.
Definition: APSInt.h:303

llvm::AnyMemSetInst
This class represents any memset intrinsic.
Definition: IntrinsicInst.h:1348

llvm::AnyMemTransferInst
Definition: IntrinsicInst.h:1368

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41

llvm::AssumptionCache::registerAssumption
void registerAssumption(AssumeInst *CI)
Add an @llvm.assume intrinsic to this function's cache.
Definition: AssumptionCache.cpp:187

llvm::AssumptionCache::updateAffectedValues
void updateAffectedValues(AssumeInst *CI)
Update the cache of values being affected by this assumption (i.e.
Definition: AssumptionCache.cpp:99

llvm::AttrBuilder
Definition: Attributes.h:1033

llvm::AttrBuilder::overlaps
bool overlaps(const AttributeMask &AM) const
Return true if the builder has any attribute that's in the specified builder.
Definition: Attributes.cpp:2053

llvm::AttributeList
Definition: Attributes.h:468

llvm::AttributeList::getFnAttrs
AttributeSet getFnAttrs() const
The function attributes are returned.
Definition: Attributes.cpp:1628

llvm::AttributeList::get
static AttributeList get(LLVMContext &C, ArrayRef< std::pair< unsigned, Attribute > > Attrs)
Create an AttributeList with the specified parameters in it.
Definition: Attributes.cpp:1291

llvm::AttributeList::isEmpty
bool isEmpty() const
Return true if there are no attributes.
Definition: Attributes.h:994

llvm::AttributeList::getRetAttrs
AttributeSet getRetAttrs() const
The attributes for the ret value are returned.
Definition: Attributes.cpp:1624

llvm::AttributeList::hasAttrSomewhere
bool hasAttrSomewhere(Attribute::AttrKind Kind, unsigned *Index=nullptr) const
Return true if the specified attribute is set for at least one parameter or for the return value.
Definition: Attributes.cpp:1653

llvm::AttributeList::hasParamAttr
bool hasParamAttr(unsigned ArgNo, Attribute::AttrKind Kind) const
Return true if the attribute exists for the given argument.
Definition: Attributes.h:805

llvm::AttributeList::getParamAttrs
AttributeSet getParamAttrs(unsigned ArgNo) const
The attributes for the argument or parameter at the given index are returned.
Definition: Attributes.cpp:1620

llvm::AttributeList::addParamAttribute
AttributeList addParamAttribute(LLVMContext &C, unsigned ArgNo, Attribute::AttrKind Kind) const
Add an argument attribute to the list.
Definition: Attributes.h:606

llvm::AttributeList::FirstArgIndex
@ FirstArgIndex
Definition: Attributes.h:473

llvm::AttributeMask
Definition: AttributeMask.h:29

llvm::AttributeSet
Definition: Attributes.h:330

llvm::AttributeSet::hasAttribute
bool hasAttribute(Attribute::AttrKind Kind) const
Return true if the attribute exists in this set.
Definition: Attributes.cpp:909

llvm::AttributeSet::removeAttributes
AttributeSet removeAttributes(LLVMContext &C, const AttributeMask &AttrsToRemove) const
Remove the specified attributes from this set.
Definition: Attributes.cpp:894

llvm::AttributeSet::get
static AttributeSet get(LLVMContext &C, const AttrBuilder &B)
Definition: Attributes.cpp:842

llvm::Attribute::get
static Attribute get(LLVMContext &Context, AttrKind Kind, uint64_t Val=0)
Return a uniquified Attribute object.
Definition: Attributes.cpp:94

llvm::Attribute::getWithDereferenceableBytes
static Attribute getWithDereferenceableBytes(LLVMContext &Context, uint64_t Bytes)
Definition: Attributes.cpp:242

llvm::Attribute::getWithDereferenceableOrNullBytes
static Attribute getWithDereferenceableOrNullBytes(LLVMContext &Context, uint64_t Bytes)
Definition: Attributes.cpp:248

llvm::Attribute::getWithAlignment
static Attribute getWithAlignment(LLVMContext &Context, Align Alignment)
Return a uniquified Attribute object that has the specific alignment set.
Definition: Attributes.cpp:232

llvm::BasicBlock
LLVM Basic Block Representation.
Definition: BasicBlock.h:61

llvm::BasicBlock::reverse_iterator
InstListType::reverse_iterator reverse_iterator
Definition: BasicBlock.h:169

llvm::BasicBlock::iterator
InstListType::iterator iterator
Instruction iterators...
Definition: BasicBlock.h:167

llvm::BinaryOpIntrinsic::getRHS
Value * getRHS() const
Definition: IntrinsicInst.h:904

llvm::BinaryOpIntrinsic::isSigned
bool isSigned() const
Whether the intrinsic is signed or unsigned.
Definition: IntrinsicInst.cpp:868

llvm::BinaryOpIntrinsic::getBinaryOp
Instruction::BinaryOps getBinaryOp() const
Returns the binary operation underlying the intrinsic.
Definition: IntrinsicInst.cpp:848

llvm::BinaryOpIntrinsic::getLHS
Value * getLHS() const
Definition: IntrinsicInst.h:903

llvm::BinaryOperator
Definition: InstrTypes.h:188

llvm::BinaryOperator::CreateNeg
static BinaryOperator * CreateNeg(Value *Op, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Helper functions to construct and inspect unary operations (NEG and NOT) via binary operators SUB and...
Definition: Instructions.cpp:2647

llvm::BinaryOperator::CreateNSW
static BinaryOperator * CreateNSW(BinaryOps Opc, Value *V1, Value *V2, const Twine &Name="")
Definition: InstrTypes.h:306

llvm::BinaryOperator::CreateNot
static BinaryOperator * CreateNot(Value *Op, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Definition: Instructions.cpp:2660

llvm::BinaryOperator::Create
static BinaryOperator * Create(BinaryOps Op, Value *S1, Value *S2, const Twine &Name=Twine(), InsertPosition InsertBefore=nullptr)
Construct a binary instruction, given the opcode and the two operands.
Definition: Instructions.cpp:2639

llvm::BinaryOperator::CreateNUW
static BinaryOperator * CreateNUW(BinaryOps Opc, Value *V1, Value *V2, const Twine &Name="")
Definition: InstrTypes.h:331

llvm::BinaryOperator::CreateFMulFMF
static BinaryOperator * CreateFMulFMF(Value *V1, Value *V2, FastMathFlags FMF, const Twine &Name="")
Definition: InstrTypes.h:271

llvm::BinaryOperator::CreateFDivFMF
static BinaryOperator * CreateFDivFMF(Value *V1, Value *V2, FastMathFlags FMF, const Twine &Name="")
Definition: InstrTypes.h:275

llvm::BinaryOperator::CreateFSubFMF
static BinaryOperator * CreateFSubFMF(Value *V1, Value *V2, FastMathFlags FMF, const Twine &Name="")
Definition: InstrTypes.h:267

llvm::BinaryOperator::CreateWithCopiedFlags
static BinaryOperator * CreateWithCopiedFlags(BinaryOps Opc, Value *V1, Value *V2, Value *CopyO, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Definition: InstrTypes.h:246

llvm::BinaryOperator::CreateNSWNeg
static BinaryOperator * CreateNSWNeg(Value *Op, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Definition: Instructions.cpp:2654

llvm::CallBase
Base class for all callable instructions (InvokeInst and CallInst). Holds everything related to callin...
Definition: InstrTypes.h:1236

llvm::CallBase::setCallingConv
void setCallingConv(CallingConv::ID CC)
Definition: InstrTypes.h:1527

llvm::CallBase::setDoesNotThrow
void setDoesNotThrow()
Definition: InstrTypes.h:2016

llvm::CallBase::getRetAlign
MaybeAlign getRetAlign() const
Extract the alignment of the return value.
Definition: InstrTypes.h:1829

llvm::CallBase::getOperandBundle
std::optional< OperandBundleUse > getOperandBundle(StringRef Name) const
Return an operand bundle by name, if present.
Definition: InstrTypes.h:2143

llvm::CallBase::getCalledFunction
Function * getCalledFunction() const
Returns the function called, or null if this is an indirect function invocation or the function signa...
Definition: InstrTypes.h:1465

llvm::CallBase::hasRetAttr
bool hasRetAttr(Attribute::AttrKind Kind) const
Determine whether the return value has the given attribute.
Definition: InstrTypes.h:1673

llvm::CallBase::getCalledOperand
Value * getCalledOperand() const
Definition: InstrTypes.h:1458

llvm::CallBase::setAttributes
void setAttributes(AttributeList A)
Set the parameter attributes for this call.
Definition: InstrTypes.h:1546

llvm::CallBase::doesNotThrow
bool doesNotThrow() const
Determine if the call cannot unwind.
Definition: InstrTypes.h:2015

llvm::CallBase::addRetAttr
void addRetAttr(Attribute::AttrKind Kind)
Adds the attribute to the return value.
Definition: InstrTypes.h:1584

llvm::CallBase::getArgOperand
Value * getArgOperand(unsigned i) const
Definition: InstrTypes.h:1410

llvm::CallBase::getIntrinsicID
Intrinsic::ID getIntrinsicID() const
Returns the intrinsic ID of the intrinsic called or Intrinsic::not_intrinsic if the called function i...
Definition: Instructions.cpp:353

llvm::CallBase::Create
static CallBase * Create(CallBase *CB, ArrayRef< OperandBundleDef > Bundles, InsertPosition InsertPt=nullptr)
Create a clone of CB with a different set of operand bundles and insert it before InsertPt.
Definition: Instructions.cpp:298

llvm::CallBase::args
iterator_range< User::op_iterator > args()
Iteration adapter for range-for loops.
Definition: InstrTypes.h:1401

llvm::CallBase::removeOperandBundle
static CallBase * removeOperandBundle(CallBase *CB, uint32_t ID, InsertPosition InsertPt=nullptr)
Create a clone of CB with operand bundle ID removed.
Definition: Instructions.cpp:571

llvm::CallBase::arg_size
unsigned arg_size() const
Definition: InstrTypes.h:1408

llvm::CallBase::setCalledFunction
void setCalledFunction(Function *Fn)
Sets the function called, including updating the function type.
Definition: InstrTypes.h:1504

llvm::CallBrInst
CallBr instruction, tracking function calls that may not return control but instead transfer it to a ...
Definition: Instructions.h:3729

llvm::CallBrInst::Create
static CallBrInst * Create(FunctionType *Ty, Value *Func, BasicBlock *DefaultDest, ArrayRef< BasicBlock * > IndirectDests, ArrayRef< Value * > Args, const Twine &NameStr, InsertPosition InsertBefore=nullptr)
Definition: Instructions.h:3763

llvm::CallInst
This class represents a function call, abstracting a target machine's calling convention.
Definition: Instructions.h:1398

llvm::CallInst::isNoTailCall
bool isNoTailCall() const
Definition: Instructions.h:1510

llvm::CallInst::setTailCallKind
void setTailCallKind(TailCallKind TCK)
Definition: Instructions.h:1512

llvm::CallInst::Create
static CallInst * Create(FunctionType *Ty, Value *F, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Definition: Instructions.h:1431

llvm::CallInst::isMustTailCall
bool isMustTailCall() const
Definition: Instructions.h:1508

llvm::CastInst::getCastOpcode
static Instruction::CastOps getCastOpcode(const Value *Val, bool SrcIsSigned, Type *Ty, bool DstIsSigned)
Returns the opcode necessary to cast Val into Ty using usual casting rules.
Definition: Instructions.cpp:3147

llvm::CastInst::CreateIntegerCast
static CastInst * CreateIntegerCast(Value *S, Type *Ty, bool isSigned, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Create a ZExt, BitCast, or Trunc for int -> int casts.
Definition: Instructions.cpp:3058

llvm::CastInst::isBitOrNoopPointerCastable
static bool isBitOrNoopPointerCastable(Type *SrcTy, Type *DestTy, const DataLayout &DL)
Check whether a bitcast, inttoptr, or ptrtoint cast between these types is valid and a no-op.
Definition: Instructions.cpp:3125

llvm::CastInst::CreateBitOrPointerCast
static CastInst * CreateBitOrPointerCast(Value *S, Type *Ty, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Create a BitCast, a PtrToInt, or an IntToPtr cast instruction.
Definition: Instructions.cpp:3047

llvm::CastInst::Create
static CastInst * Create(Instruction::CastOps, Value *S, Type *Ty, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Provides a way to construct any of the CastInst subclasses using an opcode instead of the subclass's ...
Definition: Instructions.cpp:2972

llvm::CmpInst::Predicate
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition: InstrTypes.h:757

llvm::CmpInst::FCMP_OEQ
@ FCMP_OEQ
0 0 0 1 True if ordered and equal
Definition: InstrTypes.h:760

llvm::CmpInst::BAD_ICMP_PREDICATE
@ BAD_ICMP_PREDICATE
Definition: InstrTypes.h:790

llvm::CmpInst::ICMP_SLT
@ ICMP_SLT
signed less than
Definition: InstrTypes.h:786

llvm::CmpInst::ICMP_SLE
@ ICMP_SLE
signed less or equal
Definition: InstrTypes.h:787

llvm::CmpInst::FCMP_OLT
@ FCMP_OLT
0 1 0 0 True if ordered and less than
Definition: InstrTypes.h:763

llvm::CmpInst::FCMP_OGT
@ FCMP_OGT
0 0 1 0 True if ordered and greater than
Definition: InstrTypes.h:761

llvm::CmpInst::FCMP_OGE
@ FCMP_OGE
0 0 1 1 True if ordered and greater than or equal
Definition: InstrTypes.h:762

llvm::CmpInst::ICMP_UGT
@ ICMP_UGT
unsigned greater than
Definition: InstrTypes.h:780

llvm::CmpInst::ICMP_SGT
@ ICMP_SGT
signed greater than
Definition: InstrTypes.h:784

llvm::CmpInst::FCMP_ONE
@ FCMP_ONE
0 1 1 0 True if ordered and operands are unequal
Definition: InstrTypes.h:765

llvm::CmpInst::FCMP_UEQ
@ FCMP_UEQ
1 0 0 1 True if unordered or equal
Definition: InstrTypes.h:768

llvm::CmpInst::ICMP_ULT
@ ICMP_ULT
unsigned less than
Definition: InstrTypes.h:782

llvm::CmpInst::FCMP_OLE
@ FCMP_OLE
0 1 0 1 True if ordered and less than or equal
Definition: InstrTypes.h:764

llvm::CmpInst::ICMP_EQ
@ ICMP_EQ
equal
Definition: InstrTypes.h:778

llvm::CmpInst::ICMP_NE
@ ICMP_NE
not equal
Definition: InstrTypes.h:779

llvm::CmpInst::FCMP_UNE
@ FCMP_UNE
1 1 1 0 True if unordered or not equal
Definition: InstrTypes.h:773

llvm::CmpInst::BAD_FCMP_PREDICATE
@ BAD_FCMP_PREDICATE
Definition: InstrTypes.h:777

llvm::CmpInst::getSwappedPredicate
Predicate getSwappedPredicate() const
For example, EQ->EQ, SLE->SGE, ULT->UGT, OEQ->OEQ, ULE->UGE, OLT->OGT, etc.
Definition: InstrTypes.h:909

llvm::CmpInst::getNonStrictPredicate
Predicate getNonStrictPredicate() const
For example, SGT -> SGE, SLT -> SLE, ULT -> ULE, UGT -> UGE.
Definition: InstrTypes.h:953

llvm::CmpInst::getUnorderedPredicate
Predicate getUnorderedPredicate() const
Definition: InstrTypes.h:893

llvm::ConstantAggregateZero::get
static ConstantAggregateZero * get(Type *Ty)
Definition: Constants.cpp:1650

llvm::ConstantExpr::getPointerCast
static Constant * getPointerCast(Constant *C, Type *Ty)
Create a BitCast, AddrSpaceCast, or a PtrToInt cast constant expression.
Definition: Constants.cpp:2215

llvm::ConstantExpr::getSub
static Constant * getSub(Constant *C1, Constant *C2, bool HasNUW=false, bool HasNSW=false)
Definition: Constants.cpp:2606

llvm::ConstantExpr::getNeg
static Constant * getNeg(Constant *C, bool HasNSW=false)
Definition: Constants.cpp:2587

llvm::ConstantFP::getInfinity
static Constant * getInfinity(Type *Ty, bool Negative=false)
Definition: Constants.cpp:1084

llvm::ConstantFP::getZero
static Constant * getZero(Type *Ty, bool Negative=false)
Definition: Constants.cpp:1038

llvm::ConstantInt
This is the shared class of boolean and integer constants.
Definition: Constants.h:81

llvm::ConstantInt::getLimitedValue
uint64_t getLimitedValue(uint64_t Limit=~0ULL) const
getLimitedValue - If the value is smaller than the specified limit, return it, otherwise return the l...
Definition: Constants.h:256

llvm::ConstantInt::getTrue
static ConstantInt * getTrue(LLVMContext &Context)
Definition: Constants.cpp:850

llvm::ConstantInt::getZExtValue
uint64_t getZExtValue() const
Return the constant as a 64-bit unsigned integer value after it has been zero extended as appropriate...
Definition: Constants.h:155

llvm::ConstantInt::getValue
const APInt & getValue() const
Return the constant as an APInt value reference.
Definition: Constants.h:146

llvm::ConstantInt::getBool
static ConstantInt * getBool(LLVMContext &Context, bool V)
Definition: Constants.cpp:864

llvm::ConstantPointerNull::get
static ConstantPointerNull * get(PointerType *T)
Static factory methods - Return objects of the specified value.
Definition: Constants.cpp:1800

llvm::ConstantPtrAuth::get
static ConstantPtrAuth * get(Constant *Ptr, ConstantInt *Key, ConstantInt *Disc, Constant *AddrDisc)
Return a pointer signed with the specified parameters.
Definition: Constants.cpp:2046

llvm::ConstantRange
This class represents a range of values.
Definition: ConstantRange.h:47

llvm::ConstantRange::isFullSet
bool isFullSet() const
Return true if this set contains all of the elements possible for this data-type.
Definition: ConstantRange.cpp:413

llvm::ConstantRange::icmp
bool icmp(CmpInst::Predicate Pred, const ConstantRange &Other) const
Does the predicate Pred hold between ranges this and Other? NOTE: false does not mean that inverse pr...
Definition: ConstantRange.cpp:242

llvm::ConstantStruct::get
static Constant * get(StructType *T, ArrayRef< Constant * > V)
Definition: Constants.cpp:1357

llvm::Constant
This is an important base class in LLVM.
Definition: Constant.h:42

llvm::Constant::getIntegerValue
static Constant * getIntegerValue(Type *Ty, const APInt &V)
Return the value for an integer or pointer constant, or a vector thereof, with the given scalar value...
Definition: Constants.cpp:400

llvm::Constant::getAllOnesValue
static Constant * getAllOnesValue(Type *Ty)
Definition: Constants.cpp:417

llvm::Constant::getNullValue
static Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
Definition: Constants.cpp:370

llvm::DWARFExpression::Operation
This class represents an Operation in the Expression.
Definition: DWARFExpression.h:32

llvm::DataLayout
A parsed version of the target data layout string, and methods for querying it.
Definition: DataLayout.h:110

llvm::DataLayout::getPointerTypeSizeInBits
unsigned getPointerTypeSizeInBits(Type *) const
Layout pointer size, in bits, based on the type.
Definition: DataLayout.cpp:763

llvm::DenseMapBase::size
unsigned size() const
Definition: DenseMap.h:99

llvm::DenseMapBase::count
size_type count(const_arg_type_t< KeyT > Val) const
Return 1 if the specified key is in the map, 0 otherwise.
Definition: DenseMap.h:151

llvm::DenseMap
Definition: DenseMap.h:758

llvm::ElementCount
Definition: TypeSize.h:300

llvm::FPExtInst
This class represents an extension of floating point types.
Definition: Instructions.h:4551

llvm::FastMathFlags
Convenience struct for specifying and reasoning about fast-math flags.
Definition: FMF.h:20

llvm::FastMathFlags::setNoSignedZeros
void setNoSignedZeros(bool B=true)
Definition: FMF.h:85

llvm::FastMathFlags::allowReassoc
bool allowReassoc() const
Flag queries.
Definition: FMF.h:65

llvm::FenceInst
An instruction for ordering other memory operations.
Definition: Instructions.h:420

llvm::FenceInst::getSyncScopeID
SyncScope::ID getSyncScopeID() const
Returns the synchronization scope ID of this fence instruction.
Definition: Instructions.h:454

llvm::FenceInst::getOrdering
AtomicOrdering getOrdering() const
Returns the ordering constraint of this fence instruction.
Definition: Instructions.h:443

llvm::FunctionType
Class to represent function types.
Definition: DerivedTypes.h:103

llvm::FunctionType::param_iterator
Type::subtype_iterator param_iterator
Definition: DerivedTypes.h:126

llvm::FunctionType::get
static FunctionType * get(Type *Result, ArrayRef< Type * > Params, bool isVarArg)
This static method is the primary way of constructing a FunctionType.

llvm::Function
Definition: Function.h:64

llvm::Function::isConvergent
bool isConvergent() const
Determine if the call is convergent.
Definition: Function.h:602

llvm::Function::getFunctionType
FunctionType * getFunctionType() const
Returns the FunctionType for me.
Definition: Function.h:207

llvm::Function::getCallingConv
CallingConv::ID getCallingConv() const
getCallingConv()/setCallingConv(CC) - These methods get and set the calling convention of this functio...
Definition: Function.h:274

llvm::Function::getAttributes
AttributeList getAttributes() const
Return the attribute list for this Function.
Definition: Function.h:350

llvm::Function::doesNotThrow
bool doesNotThrow() const
Determine if the function cannot unwind.
Definition: Function.h:586

llvm::Function::isIntrinsic
bool isIntrinsic() const
isIntrinsic - Returns true if the function's name starts with "llvm.".
Definition: Function.h:247

llvm::GCRelocateInst
Represents calls to the gc.relocate intrinsic.
Definition: IntrinsicInst.h:1739

llvm::GCRelocateInst::getBasePtr
Value * getBasePtr() const
Definition: IntrinsicInst.cpp:913

llvm::GCRelocateInst::getBasePtrIndex
unsigned getBasePtrIndex() const
The index into the associated statepoint's argument list which contains the base pointer of the pointe...
Definition: IntrinsicInst.h:1752

llvm::GCRelocateInst::getDerivedPtr
Value * getDerivedPtr() const
Definition: IntrinsicInst.cpp:924

llvm::GCRelocateInst::getDerivedPtrIndex
unsigned getDerivedPtrIndex() const
The index into the associated statepoint's argument list which contains the pointer whose relocation t...
Definition: IntrinsicInst.h:1758

llvm::GCStatepointInst
Represents a gc.statepoint intrinsic call.
Definition: Statepoint.h:61

llvm::GCStatepointInst::getGCRelocates
std::vector< const GCRelocateInst * > getGCRelocates() const
Get list of all gc relocates linked to this statepoint. May contain several relocations for the same b...
Definition: Statepoint.h:206

llvm::GlobalObject::getMetadata
MDNode * getMetadata(unsigned KindID) const
Get the current metadata attachments for the given kind, if any.
Definition: Value.h:565

llvm::GlobalValue::isDeclaration
bool isDeclaration() const
Return true if the primary definition of this global value is outside of the current translation unit...
Definition: Globals.cpp:290

llvm::GlobalValue::getType
PointerType * getType() const
Global values are always pointers.
Definition: GlobalValue.h:294

llvm::GlobalVariable
Definition: GlobalVariable.h:39

llvm::IRBuilderBase
Common base class shared among various IRBuilders.
Definition: IRBuilder.h:91

llvm::IRBuilderBase::CreateFCmpONE
Value * CreateFCmpONE(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2311

llvm::IRBuilderBase::CreateUnaryIntrinsic
CallInst * CreateUnaryIntrinsic(Intrinsic::ID ID, Value *V, Instruction *FMFSource=nullptr, const Twine &Name="")
Create a call to intrinsic ID with 1 operand which is mangled on its type.
Definition: IRBuilder.cpp:914

llvm::IRBuilderBase::CreateLaunderInvariantGroup
Value * CreateLaunderInvariantGroup(Value *Ptr)
Create a launder.invariant.group intrinsic call.
Definition: IRBuilder.cpp:1118

llvm::IRBuilderBase::CreateBinaryIntrinsic
Value * CreateBinaryIntrinsic(Intrinsic::ID ID, Value *LHS, Value *RHS, Instruction *FMFSource=nullptr, const Twine &Name="")
Create a call to intrinsic ID with 2 operands which is mangled on the first type.
Definition: IRBuilder.cpp:922

llvm::IRBuilderBase::CreateFCmp
Value * CreateFCmp(CmpInst::Predicate P, Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2366

llvm::IRBuilderBase::getInt1Ty
IntegerType * getInt1Ty()
Fetch the type representing a single bit.
Definition: IRBuilder.h:508

llvm::IRBuilderBase::CreateExtractElement
Value * CreateExtractElement(Value *Vec, Value *Idx, const Twine &Name="")
Definition: IRBuilder.h:2465

llvm::IRBuilderBase::getIntNTy
IntegerType * getIntNTy(unsigned N)
Fetch the type representing an N-bit integer.
Definition: IRBuilder.h:536

llvm::IRBuilderBase::CreateAlignedLoad
LoadInst * CreateAlignedLoad(Type *Ty, Value *Ptr, MaybeAlign Align, const char *Name)
Definition: IRBuilder.h:1812

llvm::IRBuilderBase::CreateFCmpORD
Value * CreateFCmpORD(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2316

llvm::IRBuilderBase::CreateZExtOrTrunc
Value * CreateZExtOrTrunc(Value *V, Type *DestTy, const Twine &Name="")
Create a ZExt or Trunc from the integer value V to DestTy.
Definition: IRBuilder.h:2044

llvm::IRBuilderBase::CreateAndReduce
CallInst * CreateAndReduce(Value *Src)
Create a vector int AND reduction intrinsic of the source vector.
Definition: IRBuilder.cpp:442

llvm::IRBuilderBase::CreateVectorSplat
Value * CreateVectorSplat(unsigned NumElts, Value *V, const Twine &Name="")
Return a vector value that contains V broadcasted to NumElts elements.
Definition: IRBuilder.cpp:1193

llvm::IRBuilderBase::getTrue
ConstantInt * getTrue()
Get the constant value for i1 true.
Definition: IRBuilder.h:463

llvm::IRBuilderBase::CreateIntrinsic
CallInst * CreateIntrinsic(Intrinsic::ID ID, ArrayRef< Type * > Types, ArrayRef< Value * > Args, Instruction *FMFSource=nullptr, const Twine &Name="")
Create a call to intrinsic ID with Args, mangled using Types.
Definition: IRBuilder.cpp:933

llvm::IRBuilderBase::CreateFNegFMF
Value * CreateFNegFMF(Value *V, Instruction *FMFSource, const Twine &Name="")
Copy fast-math-flags from an instruction rather than using the builder's default FMF.
Definition: IRBuilder.h:1745

llvm::IRBuilderBase::CreateSelect
Value * CreateSelect(Value *C, Value *True, Value *False, const Twine &Name="", Instruction *MDFrom=nullptr)
Definition: IRBuilder.cpp:1091

llvm::IRBuilderBase::CreateInvoke
InvokeInst * CreateInvoke(FunctionType *Ty, Value *Callee, BasicBlock *NormalDest, BasicBlock *UnwindDest, ArrayRef< Value * > Args, ArrayRef< OperandBundleDef > OpBundles, const Twine &Name="")
Create an invoke instruction.
Definition: IRBuilder.h:1163

llvm::IRBuilderBase::CreateFCmpUNE
Value * CreateFCmpUNE(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2351

llvm::IRBuilderBase::CreateAddReduce
CallInst * CreateAddReduce(Value *Src)
Create a vector int add reduction intrinsic of the source vector.
Definition: IRBuilder.cpp:434

llvm::IRBuilderBase::CreateLShr
Value * CreateLShr(Value *LHS, Value *RHS, const Twine &Name="", bool isExact=false)
Definition: IRBuilder.h:1442

llvm::IRBuilderBase::getInt32Ty
IntegerType * getInt32Ty()
Fetch the type representing a 32-bit integer.
Definition: IRBuilder.h:523

llvm::IRBuilderBase::CreateNSWMul
Value * CreateNSWMul(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1375

llvm::IRBuilderBase::CreateICmpNE
Value * CreateICmpNE(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2250

llvm::IRBuilderBase::CreateNeg
Value * CreateNeg(Value *V, const Twine &Name="", bool HasNSW=false)
Definition: IRBuilder.h:1726

llvm::IRBuilderBase::CreateOrReduce
CallInst * CreateOrReduce(Value *Src)
Create a vector int OR reduction intrinsic of the source vector.
Definition: IRBuilder.cpp:446

llvm::IRBuilderBase::CreateLdexp
Value * CreateLdexp(Value *Src, Value *Exp, Instruction *FMFSource=nullptr, const Twine &Name="")
Create call to the ldexp intrinsic.
Definition: IRBuilder.h:1027

llvm::IRBuilderBase::getInt32
ConstantInt * getInt32(uint32_t C)
Get a constant 32-bit value.
Definition: IRBuilder.h:483

llvm::IRBuilderBase::CreateBitOrPointerCast
Value * CreateBitOrPointerCast(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2210

llvm::IRBuilderBase::CreateNot
Value * CreateNot(Value *V, const Twine &Name="")
Definition: IRBuilder.h:1754

llvm::IRBuilderBase::CreateICmpEQ
Value * CreateICmpEQ(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2246

llvm::IRBuilderBase::CreateFCmpUEQ
Value * CreateFCmpUEQ(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2326

llvm::IRBuilderBase::CreateSub
Value * CreateSub(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1349

llvm::IRBuilderBase::CreateBitCast
Value * CreateBitCast(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2132

llvm::IRBuilderBase::CreateLoad
LoadInst * CreateLoad(Type *Ty, Value *Ptr, const char *Name)
Provided to resolve 'CreateLoad(Ty, Ptr, "...")' correctly, instead of converting the string to 'bool...
Definition: IRBuilder.h:1795

llvm::IRBuilderBase::CreateZExt
Value * CreateZExt(Value *V, Type *DestTy, const Twine &Name="", bool IsNonNeg=false)
Definition: IRBuilder.h:2026

llvm::IRBuilderBase::CreateShuffleVector
Value * CreateShuffleVector(Value *V1, Value *V2, Value *Mask, const Twine &Name="")
Definition: IRBuilder.h:2499

llvm::IRBuilderBase::CreateFCmpOEQ
Value * CreateFCmpOEQ(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2286

llvm::IRBuilderBase::CreateAnd
Value * CreateAnd(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1480

llvm::IRBuilderBase::CreateStore
StoreInst * CreateStore(Value *Val, Value *Ptr, bool isVolatile=false)
Definition: IRBuilder.h:1808

llvm::IRBuilderBase::CreateAdd
Value * CreateAdd(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1332

llvm::IRBuilderBase::CreatePtrToInt
Value * CreatePtrToInt(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2122

llvm::IRBuilderBase::getFalse
ConstantInt * getFalse()
Get the constant value for i1 false.
Definition: IRBuilder.h:468

llvm::IRBuilderBase::CreateIsNotNull
Value * CreateIsNotNull(Value *Arg, const Twine &Name="")
Return a boolean value testing if Arg != 0.
Definition: IRBuilder.h:2554

llvm::IRBuilderBase::CreateTrunc
Value * CreateTrunc(Value *V, Type *DestTy, const Twine &Name="", bool IsNUW=false, bool IsNSW=false)
Definition: IRBuilder.h:2012

llvm::IRBuilderBase::CreateOr
Value * CreateOr(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1502

llvm::IRBuilderBase::getPtrTy
PointerType * getPtrTy(unsigned AddrSpace=0)
Fetch the type representing a pointer.
Definition: IRBuilder.h:566

llvm::IRBuilderBase::CreateElementCount
Value * CreateElementCount(Type *DstType, ElementCount EC)
Create an expression which evaluates to the number of elements in EC at runtime.
Definition: IRBuilder.cpp:100

llvm::IRBuilderBase::CreateCast
Value * CreateCast(Instruction::CastOps Op, Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2166

llvm::IRBuilderBase::CreateIntCast
Value * CreateIntCast(Value *V, Type *DestTy, bool isSigned, const Twine &Name="")
Definition: IRBuilder.h:2201

llvm::IRBuilderBase::CreateFCmpUNO
Value * CreateFCmpUNO(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2321

llvm::IRBuilderBase::CreateCall
CallInst * CreateCall(FunctionType *FTy, Value *Callee, ArrayRef< Value * > Args=std::nullopt, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2417

llvm::IRBuilderBase::CreateICmp
Value * CreateICmp(CmpInst::Predicate P, Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2356

llvm::IRBuilderBase::CreateFNeg
Value * CreateFNeg(Value *V, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:1735

llvm::IRBuilderBase::CreateAddrSpaceCast
Value * CreateAddrSpaceCast(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2137

llvm::IRBuilderBase::CreateMul
Value * CreateMul(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1366

llvm::IRBuilderBase::CreateStripInvariantGroup
Value * CreateStripInvariantGroup(Value *Ptr)
Create a strip.invariant.group intrinsic call.
Definition: IRBuilder.cpp:1134

llvm::IRBuilder< TargetFolder, IRBuilderCallbackInserter >

llvm::InlineAsm
Definition: InlineAsm.h:34

llvm::InsertValueInst::Create
static InsertValueInst * Create(Value *Agg, Value *Val, ArrayRef< unsigned > Idxs, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Definition: Instructions.h:2422

llvm::InstCombinerImpl
Definition: InstCombineInternal.h:64

llvm::InstCombinerImpl::FoldOpIntoSelect
Instruction * FoldOpIntoSelect(Instruction &Op, SelectInst *SI, bool FoldWithMultiUse=false)
Given an instruction with a select as one operand and a constant as the other operand,...
Definition: InstructionCombining.cpp:1685

llvm::InstCombinerImpl::computeKnownFPClass
KnownFPClass computeKnownFPClass(Value *Val, FastMathFlags FMF, FPClassTest Interested=fcAllFlags, const Instruction *CtxI=nullptr, unsigned Depth=0) const
Definition: InstCombineInternal.h:202

llvm::InstCombinerImpl::SimplifyDemandedVectorElts
Value * SimplifyDemandedVectorElts(Value *V, APInt DemandedElts, APInt &PoisonElts, unsigned Depth=0, bool AllowMultipleUsers=false) override
The specified value produces a vector with any number of elements.
Definition: InstCombineSimplifyDemanded.cpp:1393

llvm::InstCombinerImpl::SimplifyAnyMemSet
Instruction * SimplifyAnyMemSet(AnyMemSetInst *MI)
Definition: InstCombineCalls.cpp:217

llvm::InstCombinerImpl::getLosslessUnsignedTrunc
Constant * getLosslessUnsignedTrunc(Constant *C, Type *TruncTy)
Definition: InstCombineInternal.h:233

llvm::InstCombinerImpl::visitFree
Instruction * visitFree(CallInst &FI, Value *FreedOp)
Definition: InstructionCombining.cpp:3452

llvm::InstCombinerImpl::visitCallBrInst
Instruction * visitCallBrInst(CallBrInst &CBI)
Definition: InstCombineCalls.cpp:3664

llvm::InstCombinerImpl::eraseInstFromFunction
Instruction * eraseInstFromFunction(Instruction &I) override
Combiner aware instruction erasure.
Definition: InstCombineInternal.h:473

llvm::InstCombinerImpl::SimplifyDemandedBits
bool SimplifyDemandedBits(Instruction *I, unsigned Op, const APInt &DemandedMask, KnownBits &Known, unsigned Depth, const SimplifyQuery &Q) override
This form of SimplifyDemandedBits simplifies the specified instruction operand if possible,...
Definition: InstCombineSimplifyDemanded.cpp:89

llvm::InstCombinerImpl::visitFenceInst
Instruction * visitFenceInst(FenceInst &FI)
Definition: InstCombineCalls.cpp:3631

llvm::InstCombinerImpl::visitInvokeInst
Instruction * visitInvokeInst(InvokeInst &II)
Definition: InstCombineCalls.cpp:3659

llvm::InstCombinerImpl::getLosslessSignedTrunc
Constant * getLosslessSignedTrunc(Constant *C, Type *TruncTy)
Definition: InstCombineInternal.h:237

llvm::InstCombinerImpl::SimplifyDemandedInstructionBits
bool SimplifyDemandedInstructionBits(Instruction &Inst)
Tries to simplify operands to an integer instruction based on its demanded bits.
Definition: InstCombineSimplifyDemanded.cpp:81

llvm::InstCombinerImpl::CreateNonTerminatorUnreachable
void CreateNonTerminatorUnreachable(Instruction *InsertAt)
Create and insert the idiom we use to indicate a block is unreachable without having to rewrite the C...
Definition: InstCombineInternal.h:460

llvm::InstCombinerImpl::visitVAEndInst
Instruction * visitVAEndInst(VAEndInst &I)
Definition: InstCombineCalls.cpp:793

llvm::InstCombinerImpl::matchBSwapOrBitReverse
Instruction * matchBSwapOrBitReverse(Instruction &I, bool MatchBSwaps, bool MatchBitReversals)
Given an initial instruction, check to see if it is the root of a bswap/bitreverse idiom.
Definition: InstCombineAndOrXor.cpp:2825

llvm::InstCombinerImpl::visitAllocSite
Instruction * visitAllocSite(Instruction &FI)
Definition: InstructionCombining.cpp:3236

llvm::InstCombinerImpl::SimplifyAnyMemTransfer
Instruction * SimplifyAnyMemTransfer(AnyMemTransferInst *MI)
Definition: InstCombineCalls.cpp:115

llvm::InstCombinerImpl::computeOverflow
OverflowResult computeOverflow(Instruction::BinaryOps BinaryOp, bool IsSigned, Value *LHS, Value *RHS, Instruction *CxtI) const
Definition: InstCombineCompares.cpp:6058

llvm::InstCombinerImpl::visitCallInst
Instruction * visitCallInst(CallInst &CI)
CallInst simplification.
Definition: InstCombineCalls.cpp:1499

llvm::InstCombiner::SQ
SimplifyQuery SQ
Definition: InstCombiner.h:76

llvm::InstCombiner::isFreeToInvert
bool isFreeToInvert(Value *V, bool WillInvertAllUses, bool &DoesConsume)
Return true if the specified value is free to invert (apply ~ to).
Definition: InstCombiner.h:232

llvm::InstCombiner::getDominatorTree
DominatorTree & getDominatorTree() const
Definition: InstCombiner.h:340

llvm::InstCombiner::BFI
BlockFrequencyInfo * BFI
Definition: InstCombiner.h:78

llvm::InstCombiner::TLI
TargetLibraryInfo & TLI
Definition: InstCombiner.h:73

llvm::InstCombiner::isKnownToBeAPowerOfTwo
bool isKnownToBeAPowerOfTwo(const Value *V, bool OrZero=false, unsigned Depth=0, const Instruction *CxtI=nullptr)
Definition: InstCombiner.h:441

llvm::InstCombiner::InsertNewInstBefore
Instruction * InsertNewInstBefore(Instruction *New, BasicBlock::iterator Old)
Inserts an instruction New before instruction Old.
Definition: InstCombiner.h:366

llvm::InstCombiner::AA
AAResults * AA
Definition: InstCombiner.h:69

llvm::InstCombiner::replaceInstUsesWith
Instruction * replaceInstUsesWith(Instruction &I, Value *V)
A combiner-aware RAUW-like routine.
Definition: InstCombiner.h:386

llvm::InstCombiner::LI
LoopInfo * LI
Definition: InstCombiner.h:85

llvm::InstCombiner::replaceUse
void replaceUse(Use &U, Value *NewValue)
Replace use and add the previously used value to the worklist.
Definition: InstCombiner.h:418

llvm::InstCombiner::Worklist
InstructionWorklist & Worklist
A worklist of the instructions that need to be simplified.
Definition: InstCombiner.h:64

llvm::InstCombiner::DL
const DataLayout & DL
Definition: InstCombiner.h:75

llvm::InstCombiner::targetInstCombineIntrinsic
std::optional< Instruction * > targetInstCombineIntrinsic(IntrinsicInst &II)
Definition: InstructionCombining.cpp:156

llvm::InstCombiner::AC
AssumptionCache & AC
Definition: InstCombiner.h:72

llvm::InstCombiner::replaceOperand
Instruction * replaceOperand(Instruction &I, unsigned OpNum, Value *V)
Replace operand of instruction and add old operand to the worklist.
Definition: InstCombiner.h:410

llvm::InstCombiner::DT
DominatorTree & DT
Definition: InstCombiner.h:74

llvm::InstCombiner::PSI
ProfileSummaryInfo * PSI
Definition: InstCombiner.h:80

llvm::InstCombiner::computeKnownBits
void computeKnownBits(const Value *V, KnownBits &Known, unsigned Depth, const Instruction *CxtI) const
Definition: InstCombiner.h:431

llvm::InstCombiner::Builder
BuilderTy & Builder
Definition: InstCombiner.h:60

llvm::InstCombiner::getAssumptionCache
AssumptionCache & getAssumptionCache() const
Definition: InstCombiner.h:338

llvm::InstCombiner::MaskedValueIsZero
bool MaskedValueIsZero(const Value *V, const APInt &Mask, unsigned Depth=0, const Instruction *CxtI=nullptr) const
Definition: InstCombiner.h:447

llvm::InstCombiner::ORE
OptimizationRemarkEmitter & ORE
Definition: InstCombiner.h:77

llvm::InstCombiner::getFreelyInverted
Value * getFreelyInverted(Value *V, bool WillInvertAllUses, BuilderTy *Builder, bool &DoesConsume)
Definition: InstCombiner.h:213

llvm::InstCombiner::getSimplifyQuery
const SimplifyQuery & getSimplifyQuery() const
Definition: InstCombiner.h:342

llvm::InstCombiner::ComputeMaxSignificantBits
unsigned ComputeMaxSignificantBits(const Value *Op, unsigned Depth=0, const Instruction *CxtI=nullptr) const
Definition: InstCombiner.h:457

llvm::InstructionWorklist::pushValue
void pushValue(Value *V)
Definition: InstructionWorklist.h:68

llvm::InstructionWorklist::pushUsersToWorkList
void pushUsersToWorkList(Instruction &I)
When an instruction is simplified, add all users of the instruction to the work lists because they mi...
Definition: InstructionWorklist.h:106

llvm::InstructionWorklist::add
void add(Instruction *I)
Add instruction to the worklist.
Definition: InstructionWorklist.h:44

llvm::Instruction
Definition: Instruction.h:68

llvm::Instruction::copyFastMathFlags
void copyFastMathFlags(FastMathFlags FMF)
Convenience function for transferring all fast-math flag values to this instruction,...
Definition: Instruction.cpp:565

llvm::Instruction::mayWriteToMemory
bool mayWriteToMemory() const LLVM_READONLY
Return true if this instruction may modify memory.
Definition: Instruction.cpp:949

llvm::Instruction::copyIRFlags
void copyIRFlags(const Value *V, bool IncludeWrapFlags=true)
Convenience method to copy supported exact, fast-math, and (optionally) wrapping flags from V to this...
Definition: Instruction.cpp:619

llvm::Instruction::getModule
const Module * getModule() const
Return the module owning the function this instruction belongs to or nullptr if the function does not...
Definition: Instruction.cpp:66

llvm::Instruction::setAAMetadata
void setAAMetadata(const AAMDNodes &N)
Sets the AA metadata on this instruction from the AAMDNodes structure.
Definition: Metadata.cpp:1720

llvm::Instruction::andIRFlags
void andIRFlags(const Value *V)
Logical 'and' of any supported wrapping, exact, and fast-math flags of V and this instruction.
Definition: Instruction.cpp:659

llvm::Instruction::getPrevNonDebugInstruction
const Instruction * getPrevNonDebugInstruction(bool SkipPseudoOp=false) const
Return a pointer to the previous non-debug instruction in the same basic block as 'this',...
Definition: Instruction.cpp:1172

llvm::Instruction::getFunction
const Function * getFunction() const
Return the function this instruction belongs to.
Definition: Instruction.cpp:70

llvm::Instruction::getNextNonDebugInstruction
const Instruction * getNextNonDebugInstruction(bool SkipPseudoOp=false) const
Return a pointer to the next non-debug instruction in the same basic block as 'this',...
Definition: Instruction.cpp:1164

llvm::Instruction::setMetadata
void setMetadata(unsigned KindID, MDNode *Node)
Set the metadata of the specified kind to the specified node.
Definition: Metadata.cpp:1635

llvm::Instruction::getOpcode
unsigned getOpcode() const
Returns a member of one of the enums like Instruction::Add.
Definition: Instruction.h:274

llvm::Instruction::BinaryOps
BinaryOps
Definition: Instruction.h:959

llvm::Instruction::getInsertionPointAfterDef
std::optional< InstListType::iterator > getInsertionPointAfterDef()
Get the first insertion point at which the result of this instruction is defined.
Definition: Instruction.cpp:328

llvm::Instruction::isIdenticalTo
bool isIdenticalTo(const Instruction *I) const LLVM_READONLY
Return true if the specified instruction is exactly identical to the current one.
Definition: Instruction.cpp:855

llvm::Instruction::setDebugLoc
void setDebugLoc(DebugLoc Loc)
Set the debug location information for this instruction.
Definition: Instruction.h:463

llvm::Instruction::copyMetadata
void copyMetadata(const Instruction &SrcInst, ArrayRef< unsigned > WL=ArrayRef< unsigned >())
Copy metadata from SrcInst to this instruction.
Definition: Instruction.cpp:1280

llvm::Instruction::moveBefore
void moveBefore(Instruction *MovePos)
Unlink this instruction from its current basic block and insert it into the basic block that MovePos ...
Definition: Instruction.cpp:167

llvm::Instruction::CastOps
CastOps
Definition: Instruction.h:973

llvm::IntegerType
Class to represent integer types.
Definition: DerivedTypes.h:40

llvm::IntegerType::get
static IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition: Type.cpp:278

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition: IntrinsicInst.h:48

llvm::IntrinsicInst::getIntrinsicID
Intrinsic::ID getIntrinsicID() const
Return the intrinsic ID of this intrinsic.
Definition: IntrinsicInst.h:55

llvm::InvokeInst
Invoke instruction.
Definition: Instructions.h:3569

llvm::InvokeInst::Create
static InvokeInst * Create(FunctionType *Ty, Value *Func, BasicBlock *IfNormal, BasicBlock *IfException, ArrayRef< Value * > Args, const Twine &NameStr, InsertPosition InsertBefore=nullptr)
Definition: Instructions.h:3608

llvm::LLVMContext
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:67

llvm::LLVMContext::OB_kcfi
@ OB_kcfi
Definition: LLVMContext.h:97

llvm::LLVMContext::OB_gc_live
@ OB_gc_live
Definition: LLVMContext.h:94

llvm::LibCallSimplifier
LibCallSimplifier - This class implements a collection of optimizations that replace well formed call...
Definition: SimplifyLibCalls.h:101

llvm::LoadInst
An instruction for reading from memory.
Definition: Instructions.h:174

llvm::MDNode
Metadata node.
Definition: Metadata.h:1067

llvm::MDNode::get
static MDTuple * get(LLVMContext &Context, ArrayRef< Metadata * > MDs)
Definition: Metadata.h:1541

llvm::MinMaxIntrinsic::getPredicate
ICmpInst::Predicate getPredicate() const
Returns the comparison predicate underlying the intrinsic.
Definition: IntrinsicInst.h:788

llvm::MinMaxIntrinsic::isSigned
bool isSigned() const
Whether the intrinsic is signed or unsigned.
Definition: IntrinsicInst.h:798

llvm::Module
A Module instance is used to store all the information related to an LLVM module.
Definition: Module.h:65

llvm::OperandBundleDefT
A container for an operand bundle being viewed as a set of values rather than a set of uses.
Definition: InstrTypes.h:1189

llvm::PHINode
Definition: Instructions.h:2505

llvm::PoisonValue::get
static PoisonValue * get(Type *T)
Static factory methods - Return a 'poison' object of the specified type.
Definition: Constants.cpp:1852

llvm::SaturatingInst
Represents a saturating add/sub intrinsic.
Definition: IntrinsicInst.h:938

llvm::SelectInst
This class represents the LLVM 'select' instruction.
Definition: Instructions.h:1572

llvm::SelectInst::Create
static SelectInst * Create(Value *C, Value *S1, Value *S2, const Twine &NameStr="", InsertPosition InsertBefore=nullptr, Instruction *MDFrom=nullptr)
Definition: Instructions.h:1596

llvm::ShuffleVectorInst
This instruction constructs a fixed permutation of two input vectors.
Definition: Instructions.h:1808

llvm::SmallBitVector
This is a 'bitvector' (really, a variable-sized bit array), optimized for the case when the array is ...
Definition: SmallBitVector.h:35

llvm::SmallBitVector::set
SmallBitVector & set()
Definition: SmallBitVector.h:366

llvm::SmallBitVector::test
bool test(unsigned Idx) const
Definition: SmallBitVector.h:472

llvm::SmallBitVector::all
bool all() const
Returns true if all bits are set.
Definition: SmallBitVector.h:216

llvm::SmallPtrSetImplBase::size
size_type size() const
Definition: SmallPtrSet.h:94

llvm::SmallPtrSetImpl::count
size_type count(ConstPtrType Ptr) const
count - Return 1 if the specified pointer is in the set, 0 otherwise.
Definition: SmallPtrSet.h:412

llvm::SmallPtrSetImpl::insert
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
Definition: SmallPtrSet.h:344

llvm::SmallPtrSet
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or fewer elements.
Definition: SmallPtrSet.h:479

llvm::SmallVectorBase::empty
bool empty() const
Definition: SmallVector.h:94

llvm::SmallVectorBase::size
size_t size() const
Definition: SmallVector.h:91

llvm::SmallVectorImpl::reserve
void reserve(size_type N)
Definition: SmallVector.h:676

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:426

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1209

llvm::StoreInst
An instruction for storing to memory.
Definition: Instructions.h:290

llvm::StoreInst::setVolatile
void setVolatile(bool V)
Specify whether this is a volatile store or not.
Definition: Instructions.h:324

llvm::StoreInst::setAlignment
void setAlignment(Align Align)
Definition: Instructions.h:333

llvm::StoreInst::setOrdering
void setOrdering(AtomicOrdering Ordering)
Sets the ordering constraint of this store instruction.
Definition: Instructions.h:344

llvm::StructType
Class to represent struct types.
Definition: DerivedTypes.h:216

llvm::TargetLibraryInfoImpl::isCallingConvCCompatible
static bool isCallingConvCCompatible(CallBase *CI)
Returns true if call site / callee has cdecl-compatible calling conventions.
Definition: TargetLibraryInfo.cpp:152

llvm::TargetLibraryInfo
Provides information about what library functions are available for the current target.
Definition: TargetLibraryInfo.h:281

llvm::TruncInst
This class represents a truncation of integer types.
Definition: Instructions.h:4393

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Type::getIntegerBitWidth
unsigned getIntegerBitWidth() const

llvm::Type::getFltSemantics
const fltSemantics & getFltSemantics() const

llvm::Type::isPointerTy
bool isPointerTy() const
True if this is an instance of PointerType.
Definition: Type.h:255

llvm::Type::getScalarSizeInBits
unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.

llvm::Type::isStructTy
bool isStructTy() const
True if this is an instance of StructType.
Definition: Type.h:249

llvm::Type::getWithNewBitWidth
Type * getWithNewBitWidth(unsigned NewBitWidth) const
Given an integer or vector type, change the lane bitwidth to NewBitwidth, whilst keeping the old numb...

llvm::Type::getContext
LLVMContext & getContext() const
Return the LLVMContext in which this type was uniqued.
Definition: Type.h:129

llvm::Type::canLosslesslyBitCastTo
bool canLosslesslyBitCastTo(Type *Ty) const
Return true if this type could be converted with a lossless BitCast to type 'Ty'.

llvm::Type::getInt32Ty
static IntegerType * getInt32Ty(LLVMContext &C)

llvm::Type::getInt64Ty
static IntegerType * getInt64Ty(LLVMContext &C)

llvm::Type::isIntegerTy
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition: Type.h:228

llvm::Type::isVoidTy
bool isVoidTy() const
Return true if this is 'void'.
Definition: Type.h:140

llvm::Type::getScalarType
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
Definition: Type.h:348

llvm::UnaryOperator::CreateWithCopiedFlags
static UnaryOperator * CreateWithCopiedFlags(UnaryOps Opc, Value *V, Instruction *CopyO, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Definition: InstrTypes.h:156

llvm::UnaryOperator::CreateFNegFMF
static UnaryOperator * CreateFNegFMF(Value *Op, Instruction *FMFSource, const Twine &Name="", InsertPosition InsertBefore=nullptr)
Definition: InstrTypes.h:164

llvm::UndefValue::get
static UndefValue * get(Type *T)
Static factory methods - Return an 'undef' object of the specified type.
Definition: Constants.cpp:1833

llvm::Use
A Use represents the edge between a Value definition and its users.
Definition: Use.h:43

llvm::User
Definition: User.h:44

llvm::User::setOperand
void setOperand(unsigned i, Value *Val)
Definition: User.h:174

llvm::User::getOperand
Value * getOperand(unsigned i) const
Definition: User.h:169

llvm::VAEndInst
This represents the llvm.va_end intrinsic.
Definition: IntrinsicInst.h:1440

llvm::ValueHandleBase::ValueIsDeleted
static void ValueIsDeleted(Value *V)
Definition: Value.cpp:1202

llvm::ValueHandleBase::ValueIsRAUWd
static void ValueIsRAUWd(Value *Old, Value *New)
Definition: Value.cpp:1255

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition: Value.h:255

llvm::Value::MaximumAlignment
static constexpr uint64_t MaximumAlignment
Definition: Value.h:807

llvm::Value::setMetadata
void setMetadata(unsigned KindID, MDNode *Node)
Set a particular kind of metadata attachment.
Definition: Metadata.cpp:1487

llvm::Value::hasOneUse
bool hasOneUse() const
Return true if there is exactly one use of this value.
Definition: Value.h:434

llvm::Value::users
iterator_range< user_iterator > users()
Definition: Value.h:421

llvm::Value::dropDroppableUse
static void dropDroppableUse(Use &U)
Remove the droppable use U.
Definition: Value.cpp:217

llvm::Value::stripPointerCasts
const Value * stripPointerCasts() const
Strip off pointer casts, all-zero GEPs and address space casts.
Definition: Value.cpp:694

llvm::Value::use_empty
bool use_empty() const
Definition: Value.h:344

llvm::Value::getContext
LLVMContext & getContext() const
All values hold a context through their type.
Definition: Value.cpp:1075

llvm::Value::MaxAlignmentExponent
static constexpr unsigned MaxAlignmentExponent
The maximum alignment for instructions.
Definition: Value.h:806

llvm::Value::getName
StringRef getName() const
Return a constant reference to the value's name.
Definition: Value.cpp:309

llvm::Value::takeName
void takeName(Value *V)
Transfer the name from V to this value.
Definition: Value.cpp:383

llvm::VectorType
Base class of all SIMD vector types.
Definition: DerivedTypes.h:403

llvm::VectorType::getElementCount
ElementCount getElementCount() const
Return an ElementCount instance to represent the (possibly scalable) number of elements in the vector...
Definition: DerivedTypes.h:641

llvm::WithOverflowInst
Represents an op.with.overflow intrinsic.
Definition: IntrinsicInst.h:917

llvm::cl::opt
Definition: CommandLine.h:1423

llvm::details::FixedOrScalableQuantity< ElementCount, unsigned >::isKnownLT
static constexpr bool isKnownLT(const FixedOrScalableQuantity &LHS, const FixedOrScalableQuantity &RHS)
Definition: TypeSize.h:218

llvm::details::FixedOrScalableQuantity< ElementCount, unsigned >::isKnownGT
static constexpr bool isKnownGT(const FixedOrScalableQuantity &LHS, const FixedOrScalableQuantity &RHS)
Definition: TypeSize.h:225

llvm::ilist_detail::node_parent_access::getParent
const ParentTy * getParent() const
Definition: ilist_node.h:32

llvm::ilist_node_impl::getIterator
self_iterator getIterator()
Definition: ilist_node.h:132

uint32_t

uint64_t

unsigned

DebugInfo.h

ErrorHandling.h

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition: ErrorHandling.h:143

llvm::AArch64PACKey::IA
@ IA
Definition: AArch64BaseInfo.h:820

llvm::AMDGPU::HSAMD::Kernel::Key::Args
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
Definition: AMDGPUMetadata.h:395

llvm::AMDGPU::HSAMD::Kernel::Key::Attrs
constexpr char Attrs[]
Key for Kernel::Metadata::mAttrs.
Definition: AMDGPUMetadata.h:393

llvm::AttributeFuncs::ASK_UNSAFE_TO_DROP
@ ASK_UNSAFE_TO_DROP
Definition: Attributes.h:1259

llvm::AttributeFuncs::ASK_SAFE_TO_DROP
@ ASK_SAFE_TO_DROP
Definition: Attributes.h:1258

llvm::AttributeFuncs::typeIncompatible
AttributeMask typeIncompatible(Type *Ty, AttributeSafetyKind ASK=ASK_ALL)
Which attributes cannot be applied to a type.
Definition: Attributes.cpp:2099

llvm::BitmaskEnumDetail::Mask
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
Definition: BitmaskEnum.h:121

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34

llvm::Intrinsic::getDeclaration
Function * getDeclaration(Module *M, ID id, ArrayRef< Type * > Tys=std::nullopt)
Create or insert an LLVM Function declaration for an intrinsic, and return it.
Definition: Function.cpp:1513

llvm::M68k::MemAddrModeKind::V
@ V

llvm::M68k::MemAddrModeKind::L
@ L

llvm::MCID::Call
@ Call
Definition: MCInstrDesc.h:156

llvm::PatternMatch::m_AllOnes
cst_pred_ty< is_all_ones > m_AllOnes()
Match an integer or vector with all bits set.
Definition: PatternMatch.h:524

llvm::PatternMatch::m_And
BinaryOp_match< LHS, RHS, Instruction::And > m_And(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1206

llvm::PatternMatch::m_Add
BinaryOp_match< LHS, RHS, Instruction::Add > m_Add(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1092

llvm::PatternMatch::m_BinOp
class_match< BinaryOperator > m_BinOp()
Match an arbitrary binary operation and ignore it.
Definition: PatternMatch.h:100

llvm::PatternMatch::m_BitReverse
m_Intrinsic_Ty< Opnd0 >::Ty m_BitReverse(const Opnd0 &Op0)
Definition: PatternMatch.h:2604

llvm::PatternMatch::m_Constant
class_match< Constant > m_Constant()
Match an arbitrary Constant and ignore it.
Definition: PatternMatch.h:165

llvm::PatternMatch::m_c_And
BinaryOp_match< LHS, RHS, Instruction::And, true > m_c_And(const LHS &L, const RHS &R)
Matches an And with LHS and RHS in either order.
Definition: PatternMatch.h:2711

llvm::PatternMatch::m_Trunc
CastInst_match< OpTy, TruncInst > m_Trunc(const OpTy &Op)
Matches Trunc.
Definition: PatternMatch.h:2013

llvm::PatternMatch::m_Xor
BinaryOp_match< LHS, RHS, Instruction::Xor > m_Xor(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1218

llvm::PatternMatch::m_NSWSub
OverflowingBinaryOp_match< LHS, RHS, Instruction::Sub, OverflowingBinaryOperator::NoSignedWrap > m_NSWSub(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1279

llvm::PatternMatch::m_SpecificInt
specific_intval< false > m_SpecificInt(const APInt &V)
Match a specific integer value or vector with all elements equal to the value.
Definition: PatternMatch.h:972

llvm::PatternMatch::match
bool match(Val *V, const Pattern &P)
Definition: PatternMatch.h:49

llvm::PatternMatch::m_Instruction
bind_ty< Instruction > m_Instruction(Instruction *&I)
Match an instruction, capturing it if we match.
Definition: PatternMatch.h:816

llvm::PatternMatch::m_Specific
specificval_ty m_Specific(const Value *V)
Match if we have a specific specified value.
Definition: PatternMatch.h:875

llvm::PatternMatch::m_NSWNeg
OverflowingBinaryOp_match< cst_pred_ty< is_zero_int >, ValTy, Instruction::Sub, OverflowingBinaryOperator::NoSignedWrap > m_NSWNeg(const ValTy &V)
Matches a 'Neg' as 'sub nsw 0, V'.
Definition: PatternMatch.h:2742

llvm::PatternMatch::m_ConstantInt
class_match< ConstantInt > m_ConstantInt()
Match an arbitrary ConstantInt and ignore it.
Definition: PatternMatch.h:168

llvm::PatternMatch::m_One
cst_pred_ty< is_one > m_One()
Match an integer 1 or a vector with all elements equal to 1.
Definition: PatternMatch.h:592

llvm::PatternMatch::m_Select
ThreeOps_match< Cond, LHS, RHS, Instruction::Select > m_Select(const Cond &C, const LHS &L, const RHS &R)
Matches SelectInst.
Definition: PatternMatch.h:1745

llvm::PatternMatch::m_NegZeroFP
cstfp_pred_ty< is_neg_zero_fp > m_NegZeroFP()
Match a floating-point negative zero.
Definition: PatternMatch.h:782

llvm::PatternMatch::m_SpecificFP
specific_fpval m_SpecificFP(double V)
Match a specific floating point value or vector with all elements equal to the value.
Definition: PatternMatch.h:918

llvm::PatternMatch::m_LogicalShift
BinOpPred_match< LHS, RHS, is_logical_shift_op > m_LogicalShift(const LHS &L, const RHS &R)
Matches logical shift operations.
Definition: PatternMatch.h:1495

llvm::PatternMatch::m_CombineAnd
match_combine_and< LTy, RTy > m_CombineAnd(const LTy &L, const RTy &R)
Combine two pattern matchers matching L && R.
Definition: PatternMatch.h:245

llvm::PatternMatch::m_SMin
MaxMin_match< ICmpInst, LHS, RHS, smin_pred_ty > m_SMin(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2286

llvm::PatternMatch::m_c_Xor
BinaryOp_match< LHS, RHS, Instruction::Xor, true > m_c_Xor(const LHS &L, const RHS &R)
Matches an Xor with LHS and RHS in either order.
Definition: PatternMatch.h:2725

llvm::PatternMatch::m_Deferred
deferredval_ty< Value > m_Deferred(Value *const &V)
Like m_Specific(), but works if the specific value to match is determined as part of the same match()...
Definition: PatternMatch.h:893

llvm::PatternMatch::m_ZeroInt
cst_pred_ty< is_zero_int > m_ZeroInt()
Match an integer 0 or a vector with all elements equal to 0.
Definition: PatternMatch.h:599

llvm::PatternMatch::m_APIntAllowPoison
apint_match m_APIntAllowPoison(const APInt *&Res)
Match APInt while allowing poison in splat vector constants.
Definition: PatternMatch.h:305

llvm::PatternMatch::m_ICmp
CmpClass_match< LHS, RHS, ICmpInst, ICmpInst::Predicate > m_ICmp(ICmpInst::Predicate &Pred, const LHS &L, const RHS &R)
Definition: PatternMatch.h:1589

llvm::PatternMatch::m_ZExtOrSExtOrSelf
match_combine_or< match_combine_or< CastInst_match< OpTy, ZExtInst >, CastInst_match< OpTy, SExtInst > >, OpTy > m_ZExtOrSExtOrSelf(const OpTy &Op)
Definition: PatternMatch.h:2084

llvm::PatternMatch::m_OneUse
OneUse_match< T > m_OneUse(const T &SubPattern)
Definition: PatternMatch.h:67

llvm::PatternMatch::m_LogicalOr
auto m_LogicalOr()
Matches L || R where L and R are arbitrary values.
Definition: PatternMatch.h:3001

llvm::PatternMatch::m_Neg
BinaryOp_match< cst_pred_ty< is_zero_int >, ValTy, Instruction::Sub > m_Neg(const ValTy &V)
Matches a 'Neg' as 'sub 0, V'.
Definition: PatternMatch.h:2733

llvm::PatternMatch::m_Shuffle
TwoOps_match< V1_t, V2_t, Instruction::ShuffleVector > m_Shuffle(const V1_t &v1, const V2_t &v2)
Matches ShuffleVectorInst independently of mask value.
Definition: PatternMatch.h:1849

llvm::PatternMatch::m_ImmConstant
match_combine_and< class_match< Constant >, match_unless< constantexpr_match > > m_ImmConstant()
Match an arbitrary immediate Constant and ignore it.
Definition: PatternMatch.h:854

llvm::PatternMatch::m_FPExt
CastInst_match< OpTy, FPExtInst > m_FPExt(const OpTy &Op)
Definition: PatternMatch.h:2114

llvm::PatternMatch::m_ZExt
CastInst_match< OpTy, ZExtInst > m_ZExt(const OpTy &Op)
Matches ZExt.
Definition: PatternMatch.h:2045

llvm::PatternMatch::m_NUWShl
OverflowingBinaryOp_match< LHS, RHS, Instruction::Shl, OverflowingBinaryOperator::NoUnsignedWrap > m_NUWShl(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1338

llvm::PatternMatch::m_UMax
MaxMin_match< ICmpInst, LHS, RHS, umax_pred_ty > m_UMax(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2292

llvm::PatternMatch::m_Cmp
class_match< CmpInst > m_Cmp()
Matches any compare instruction and ignore it.
Definition: PatternMatch.h:105

llvm::PatternMatch::m_NegatedPower2
cst_pred_ty< is_negated_power2 > m_NegatedPower2()
Match an integer or vector negated power-of-2.
Definition: PatternMatch.h:627

llvm::PatternMatch::m_CheckedInt
cst_pred_ty< custom_checkfn< APInt > > m_CheckedInt(function_ref< bool(const APInt &)> CheckFn)
Match an integer or vector where CheckFn(ele) for each element is true.
Definition: PatternMatch.h:481

llvm::PatternMatch::m_FShl
m_Intrinsic_Ty< Opnd0, Opnd1, Opnd2 >::Ty m_FShl(const Opnd0 &Op0, const Opnd1 &Op1, const Opnd2 &Op2)
Definition: PatternMatch.h:2637

llvm::PatternMatch::m_c_MaxOrMin
match_combine_or< match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, smax_pred_ty, true >, MaxMin_match< ICmpInst, LHS, RHS, smin_pred_ty, true > >, match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, umax_pred_ty, true >, MaxMin_match< ICmpInst, LHS, RHS, umin_pred_ty, true > > > m_c_MaxOrMin(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2777

llvm::PatternMatch::m_UnOp
class_match< UnaryOperator > m_UnOp()
Match an arbitrary unary operation and ignore it.
Definition: PatternMatch.h:95

llvm::PatternMatch::m_NUWSub
OverflowingBinaryOp_match< LHS, RHS, Instruction::Sub, OverflowingBinaryOperator::NoUnsignedWrap > m_NUWSub(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1322

llvm::PatternMatch::m_SMax
MaxMin_match< ICmpInst, LHS, RHS, smax_pred_ty > m_SMax(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2280

llvm::PatternMatch::m_APInt
apint_match m_APInt(const APInt *&Res)
Match a ConstantInt or splatted ConstantVector, binding the specified pointer to the contained APInt.
Definition: PatternMatch.h:299

llvm::PatternMatch::m_NSWAddLike
match_combine_or< OverflowingBinaryOp_match< LHS, RHS, Instruction::Add, OverflowingBinaryOperator::NoSignedWrap >, DisjointOr_match< LHS, RHS > > m_NSWAddLike(const LHS &L, const RHS &R)
Match either "add nsw" or "or disjoint".
Definition: PatternMatch.h:1409

llvm::PatternMatch::m_Value
class_match< Value > m_Value()
Match an arbitrary value and ignore it.
Definition: PatternMatch.h:92

llvm::PatternMatch::m_LShr
BinaryOp_match< LHS, RHS, Instruction::LShr > m_LShr(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1230

llvm::PatternMatch::m_Exact
Exact_match< T > m_Exact(const T &SubPattern)
Definition: PatternMatch.h:1542

llvm::PatternMatch::m_FNeg
FNeg_match< OpTy > m_FNeg(const OpTy &X)
Match 'fneg X' as 'fsub -0.0, X'.
Definition: PatternMatch.h:1146

llvm::PatternMatch::m_Shift
BinOpPred_match< LHS, RHS, is_shift_op > m_Shift(const LHS &L, const RHS &R)
Matches shift operations.
Definition: PatternMatch.h:1480

llvm::PatternMatch::m_PosZeroFP
cstfp_pred_ty< is_pos_zero_fp > m_PosZeroFP()
Match a floating-point positive zero.
Definition: PatternMatch.h:773

llvm::PatternMatch::m_Shl
BinaryOp_match< LHS, RHS, Instruction::Shl > m_Shl(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1224

llvm::PatternMatch::m_VecReverse
m_Intrinsic_Ty< Opnd0 >::Ty m_VecReverse(const Opnd0 &Op0)
Definition: PatternMatch.h:2659

llvm::PatternMatch::m_APFloat
apfloat_match m_APFloat(const APFloat *&Res)
Match a ConstantFP or splatted ConstantVector, binding the specified pointer to the contained APFloat...
Definition: PatternMatch.h:316

llvm::PatternMatch::m_LogicalAnd
auto m_LogicalAnd()
Matches L && R where L and R are arbitrary values.
Definition: PatternMatch.h:2983

llvm::PatternMatch::m_MaxOrMin
match_combine_or< match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, smax_pred_ty >, MaxMin_match< ICmpInst, LHS, RHS, smin_pred_ty > >, match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, umax_pred_ty >, MaxMin_match< ICmpInst, LHS, RHS, umin_pred_ty > > > m_MaxOrMin(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2309

llvm::PatternMatch::m_FShr
m_Intrinsic_Ty< Opnd0, Opnd1, Opnd2 >::Ty m_FShr(const Opnd0 &Op0, const Opnd1 &Op1, const Opnd2 &Op2)
Definition: PatternMatch.h:2643

llvm::PatternMatch::m_SRem
BinaryOp_match< LHS, RHS, Instruction::SRem > m_SRem(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1194

llvm::PatternMatch::m_Undef
auto m_Undef()
Match an arbitrary undef constant.
Definition: PatternMatch.h:152

llvm::PatternMatch::m_Not
BinaryOp_match< cst_pred_ty< is_all_ones >, ValTy, Instruction::Xor, true > m_Not(const ValTy &V)
Matches a 'Not' as 'xor V, -1' or 'xor -1, V'.
Definition: PatternMatch.h:2379

llvm::PatternMatch::m_BSwap
m_Intrinsic_Ty< Opnd0 >::Ty m_BSwap(const Opnd0 &Op0)
Definition: PatternMatch.h:2609

llvm::PatternMatch::m_SExt
CastInst_match< OpTy, SExtInst > m_SExt(const OpTy &Op)
Matches SExt.
Definition: PatternMatch.h:2039

llvm::PatternMatch::m_Zero
is_zero m_Zero()
Match any null constant or a vector with all elements equal to 0.
Definition: PatternMatch.h:612

llvm::PatternMatch::m_c_Or
BinaryOp_match< LHS, RHS, Instruction::Or, true > m_c_Or(const LHS &L, const RHS &R)
Matches an Or with LHS and RHS in either order.
Definition: PatternMatch.h:2718

llvm::PatternMatch::m_NUWAddLike
match_combine_or< OverflowingBinaryOp_match< LHS, RHS, Instruction::Add, OverflowingBinaryOperator::NoUnsignedWrap >, DisjointOr_match< LHS, RHS > > m_NUWAddLike(const LHS &L, const RHS &R)
Match either "add nuw" or "or disjoint".
Definition: PatternMatch.h:1419

llvm::PatternMatch::m_BitwiseLogic
BinOpPred_match< LHS, RHS, is_bitwiselogic_op > m_BitwiseLogic(const LHS &L, const RHS &R)
Matches bitwise logic operations.
Definition: PatternMatch.h:1502

llvm::PatternMatch::m_FAbs
m_Intrinsic_Ty< Opnd0 >::Ty m_FAbs(const Opnd0 &Op0)
Definition: PatternMatch.h:2614

llvm::PatternMatch::m_c_Mul
BinaryOp_match< LHS, RHS, Instruction::Mul, true > m_c_Mul(const LHS &L, const RHS &R)
Matches a Mul with LHS and RHS in either order.
Definition: PatternMatch.h:2704

llvm::PatternMatch::m_CopySign
m_Intrinsic_Ty< Opnd0, Opnd1 >::Ty m_CopySign(const Opnd0 &Op0, const Opnd1 &Op1)
Definition: PatternMatch.h:2653

llvm::PatternMatch::m_PtrToInt
CastOperator_match< OpTy, Instruction::PtrToInt > m_PtrToInt(const OpTy &Op)
Matches PtrToInt.
Definition: PatternMatch.h:1994

llvm::PatternMatch::m_UMin
MaxMin_match< ICmpInst, LHS, RHS, umin_pred_ty > m_UMin(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2298

llvm::PatternMatch::m_CombineOr
match_combine_or< LTy, RTy > m_CombineOr(const LTy &L, const RTy &R)
Combine two pattern matchers matching L || R.
Definition: PatternMatch.h:239

llvm::SyncScope::SingleThread
@ SingleThread
Synchronized with respect to signal handlers executing in the same thread.
Definition: LLVMContext.h:54

llvm::SyncScope::System
@ System
Synchronized with respect to all concurrently executing threads.
Definition: LLVMContext.h:57

llvm::X86::FirstMacroFusionInstKind::AddSub
@ AddSub

llvm::at::getAssignmentMarkers
AssignmentMarkerRange getAssignmentMarkers(DIAssignID *ID)
Return a range of dbg.assign intrinsics which use ID as an operand.
Definition: DebugInfo.cpp:1808

llvm::at::getDVRAssignmentMarkers
SmallVector< DbgVariableRecord * > getDVRAssignmentMarkers(const Instruction *Inst)
Definition: DebugInfo.h:238

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition: CommandLine.h:443

llvm::codeview::EncodedFramePtrReg::BasePtr
@ BasePtr

llvm::dwarf::Index
Index
Definition: Dwarf.h:875

llvm::logicalview::LVAttributeKind::Zero
@ Zero

llvm::numbers::e
constexpr double e
Definition: MathExtras.h:47

llvm::ore::NV
DiagnosticInfoOptimizationBase::Argument NV
Definition: OptimizationRemarkEmitter.h:137

llvm::pdb::PDB_SymType::Caller
@ Caller

llvm::pdb::PDB_SymType::Callee
@ Callee

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::EnableKnowledgeRetention
cl::opt< bool > EnableKnowledgeRetention

llvm::getInverseMinMaxIntrinsic
Intrinsic::ID getInverseMinMaxIntrinsic(Intrinsic::ID MinMaxID)
Definition: ValueTracking.cpp:8776

llvm::Log2_32_Ceil
unsigned Log2_32_Ceil(uint32_t Value)
Return the ceil log base 2 of the specified value, 32 if the value is zero.
Definition: MathExtras.h:353

llvm::Offset
@ Offset
Definition: DWP.cpp:480

llvm::OverflowResult
OverflowResult
Definition: ValueTracking.h:897

llvm::OverflowResult::NeverOverflows
@ NeverOverflows
Never overflows.

llvm::OverflowResult::AlwaysOverflowsHigh
@ AlwaysOverflowsHigh
Always overflows in the direction of signed/unsigned max value.

llvm::OverflowResult::AlwaysOverflowsLow
@ AlwaysOverflowsLow
Always overflows in the direction of signed/unsigned min value.

llvm::OverflowResult::MayOverflow
@ MayOverflow
May or may not overflow.

llvm::for_each
UnaryFunction for_each(R &&Range, UnaryFunction F)
Provide wrappers to std::for_each which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1715

llvm::simplifyFMulInst
Value * simplifyFMulInst(Value *LHS, Value *RHS, FastMathFlags FMF, const SimplifyQuery &Q, fp::ExceptionBehavior ExBehavior=fp::ebIgnore, RoundingMode Rounding=RoundingMode::NearestTiesToEven)
Given operands for an FMul, fold the result or return null.
Definition: InstructionSimplify.cpp:5860

llvm::isValidAssumeForContext
bool isValidAssumeForContext(const Instruction *I, const Instruction *CxtI, const DominatorTree *DT=nullptr, bool AllowEphemerals=false)
Return true if it is valid to use the assumptions provided by an assume intrinsic,...
Definition: ValueTracking.cpp:493

llvm::possiblyDemandedEltsInMask
APInt possiblyDemandedEltsInMask(Value *Mask)
Given a mask vector of the form <Y x i1>, return an APInt (of bitwidth Y) for each lane which may be ...
Definition: VectorUtils.cpp:1101

llvm::simplifyRetainedKnowledge
RetainedKnowledge simplifyRetainedKnowledge(AssumeInst *Assume, RetainedKnowledge RK, AssumptionCache *AC, DominatorTree *DT)
Canonicalize the RetainedKnowledge RK.
Definition: AssumeBundleBuilder.cpp:318

llvm::isRemovableAlloc
bool isRemovableAlloc(const CallBase *V, const TargetLibraryInfo *TLI)
Return true if this is a call to an allocation function that does not have side effects that we are r...
Definition: MemoryBuiltins.cpp:342

llvm::lowerObjectSizeCall
Value * lowerObjectSizeCall(IntrinsicInst *ObjectSize, const DataLayout &DL, const TargetLibraryInfo *TLI, bool MustSucceed)
Try to turn a call to @llvm.objectsize into an integer value of the given Type.
Definition: MemoryBuiltins.cpp:603

llvm::getAllocAlignment
Value * getAllocAlignment(const CallBase *V, const TargetLibraryInfo *TLI)
Gets the alignment argument for an aligned_alloc-like function, using either built-in knowledge based...
Definition: MemoryBuiltins.cpp:353

llvm::maximum
LLVM_READONLY APFloat maximum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 maximum semantics.
Definition: APFloat.h:1508

llvm::getUnderlyingObject
const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=6)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
Definition: ValueTracking.cpp:6535

llvm::simplifyCall
Value * simplifyCall(CallBase *Call, Value *Callee, ArrayRef< Value * > Args, const SimplifyQuery &Q)
Given a callsite, callee, and arguments, fold the result or return null.
Definition: InstructionSimplify.cpp:6969

llvm::ConstantFoldCompareInstOperands
Constant * ConstantFoldCompareInstOperands(unsigned Predicate, Constant *LHS, Constant *RHS, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, const Instruction *I=nullptr)
Attempt to constant fold a compare instruction (icmp/fcmp) with the specified operands.
Definition: ConstantFolding.cpp:1175

llvm::alignDown
constexpr T alignDown(U Value, V Align, W Skew=0)
Returns the largest unsigned integer that is less than or equal to Value and is congruent to Skew modulo Align.
Definition: MathExtras.h:547

llvm::isPowerOf2_64
constexpr bool isPowerOf2_64(uint64_t Value)
Return true if the argument is a power of two > 0 (64 bit edition.)
Definition: MathExtras.h:296

llvm::isAssumeWithEmptyBundle
bool isAssumeWithEmptyBundle(const AssumeInst &Assume)
Return true iff the operand bundles of the provided llvm.assume don't contain any valuable informat...
Definition: AssumeBundleQueries.cpp:128

llvm::getSplatValue
Value * getSplatValue(const Value *V)
Get splat value if the input is a splat vector or return nullptr.
Definition: VectorUtils.cpp:251

llvm::MinAlign
constexpr T MinAlign(U A, V B)
A and B are either alignments or offsets.
Definition: MathExtras.h:366

llvm::getKnowledgeFromBundle
RetainedKnowledge getKnowledgeFromBundle(AssumeInst &Assume, const CallBase::BundleOpInfo &BOI)
This extracts the Knowledge from an element of an operand bundle.
Definition: AssumeBundleQueries.cpp:99

llvm::getKnownAlignment
Align getKnownAlignment(Value *V, const DataLayout &DL, const Instruction *CxtI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr)
Try to infer an alignment for the specified pointer.
Definition: Local.h:242

llvm::isSplatValue
bool isSplatValue(const Value *V, int Index=-1, unsigned Depth=0)
Return true if each element of the vector value V is poisoned or equal to every other non-poisoned el...
Definition: VectorUtils.cpp:266

llvm::maxnum
LLVM_READONLY APFloat maxnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2019 maximumNumber semantics.
Definition: APFloat.h:1469

llvm::fneg
FPClassTest fneg(FPClassTest Mask)
Return the test mask which returns true if the value's sign bit is flipped.
Definition: FloatingPointMode.cpp:14

llvm::SelectPatternFlavor
SelectPatternFlavor
Specific patterns of select instructions we can match.
Definition: ValueTracking.h:1104

llvm::SPF_ABS
@ SPF_ABS
Absolute value.
Definition: ValueTracking.h:1112

llvm::SPF_NABS
@ SPF_NABS
Negated absolute value.
Definition: ValueTracking.h:1113

llvm::isPowerOf2_32
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition: MathExtras.h:291

llvm::isModSet
bool isModSet(const ModRefInfo MRI)
Definition: ModRef.h:48

llvm::ComplexDeinterleavingOperation::Splat
@ Splat

llvm::FPClassTest
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
Definition: FloatingPointMode.h:239

llvm::fcInf
@ fcInf
Definition: FloatingPointMode.h:254

llvm::fcNegSubnormal
@ fcNegSubnormal
Definition: FloatingPointMode.h:246

llvm::fcPosNormal
@ fcPosNormal
Definition: FloatingPointMode.h:250

llvm::fcNegZero
@ fcNegZero
Definition: FloatingPointMode.h:247

llvm::fcNegInf
@ fcNegInf
Definition: FloatingPointMode.h:244

llvm::fcSubnormal
@ fcSubnormal
Definition: FloatingPointMode.h:256

llvm::fcNone
@ fcNone
Definition: FloatingPointMode.h:240

llvm::fcPositive
@ fcPositive
Definition: FloatingPointMode.h:261

llvm::fcPosZero
@ fcPosZero
Definition: FloatingPointMode.h:248

llvm::fcNegNormal
@ fcNegNormal
Definition: FloatingPointMode.h:245

llvm::fcZero
@ fcZero
Definition: FloatingPointMode.h:257

llvm::fcNegative
@ fcNegative
Definition: FloatingPointMode.h:262

llvm::fcAllFlags
@ fcAllFlags
Definition: FloatingPointMode.h:264

llvm::fcPosSubnormal
@ fcPosSubnormal
Definition: FloatingPointMode.h:249

llvm::fcPosInf
@ fcPosInf
Definition: FloatingPointMode.h:251

llvm::fcNan
@ fcNan
Definition: FloatingPointMode.h:253

llvm::None
@ None
Definition: X86MachineFunctionInfo.h:26

llvm::matchSelectPattern
SelectPatternResult matchSelectPattern(Value *V, Value *&LHS, Value *&RHS, Instruction::CastOps *CastOp=nullptr, unsigned Depth=0)
Pattern match integer [SU]MIN, [SU]MAX and ABS idioms, returning the kind and providing the out param...
Definition: ValueTracking.cpp:8698

llvm::NullPointerIsDefined
bool NullPointerIsDefined(const Function *F, unsigned AS=0)
Check whether null pointer dereferencing is considered undefined behavior for a given function or an ...
Definition: Function.cpp:2102

llvm::dbgs
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition: Debug.cpp:163

llvm::none_of
bool none_of(R &&Range, UnaryPredicate P)
Provide wrappers to std::none_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1736

llvm::isAtLeastOrStrongerThan
bool isAtLeastOrStrongerThan(AtomicOrdering AO, AtomicOrdering Other)
Definition: AtomicOrdering.h:106

llvm::buildAssumeFromKnowledge
AssumeInst * buildAssumeFromKnowledge(ArrayRef< RetainedKnowledge > Knowledge, Instruction *CtxI, AssumptionCache *AC=nullptr, DominatorTree *DT=nullptr)
Build and return a new assume created from the provided knowledge if the knowledge in the assume is f...
Definition: AssumeBundleBuilder.cpp:309

llvm::isSafeToSpeculativelyExecute
bool isSafeToSpeculativelyExecute(const Instruction *I, const Instruction *CtxI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr, const TargetLibraryInfo *TLI=nullptr, bool UseVariableInfo=true)
Return true if the instruction does not have any effects besides calculating the result and does not ...
Definition: ValueTracking.cpp:6812

llvm::inverse_fabs
FPClassTest inverse_fabs(FPClassTest Mask)
Return the test mask which returns true after fabs is applied to the value.
Definition: FloatingPointMode.cpp:35

llvm::maskIsAllOneOrUndef
bool maskIsAllOneOrUndef(Value *Mask)
Given a mask vector of i1, return true if all of the elements of this predicate mask are known to be ...
Definition: VectorUtils.cpp:1048

llvm::ConstantFoldBinaryOpOperands
Constant * ConstantFoldBinaryOpOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL)
Attempt to constant fold a binary operation with the specified operands.
Definition: ConstantFolding.cpp:1287

llvm::isKnownNonZero
bool isKnownNonZero(const Value *V, const SimplifyQuery &Q, unsigned Depth=0)
Return true if the given value is known to be non-zero when defined.
Definition: ValueTracking.cpp:3303

llvm::PoisonMaskElem
constexpr int PoisonMaskElem
Definition: Instructions.h:1796

llvm::AtomicOrdering::Unordered
@ Unordered

llvm::ModRefInfo::Mod
@ Mod
The access may modify the value stored in memory.

llvm::simplifyFMAFMul
Value * simplifyFMAFMul(Value *LHS, Value *RHS, FastMathFlags FMF, const SimplifyQuery &Q, fp::ExceptionBehavior ExBehavior=fp::ebIgnore, RoundingMode Rounding=RoundingMode::NearestTiesToEven)
Given operands for the multiplication of a FMA, fold the result or return null.
Definition: InstructionSimplify.cpp:5868

llvm::IRMemLocation::Other
@ Other
Any other memory.

llvm::simplifyConstrainedFPCall
Value * simplifyConstrainedFPCall(CallBase *Call, const SimplifyQuery &Q)
Given a constrained FP intrinsic call, tries to compute its simplified version.
Definition: InstructionSimplify.cpp:6995

llvm::minnum
LLVM_READONLY APFloat minnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2019 minimumNumber semantics.
Definition: APFloat.h:1455

llvm::RecurKind::Add
@ Add
Sum of integers.

llvm::RecurKind::FAdd
@ FAdd
Sum of floats.

llvm::computeConstantRangeIncludingKnownBits
ConstantRange computeConstantRangeIncludingKnownBits(const WithCache< const Value * > &V, bool ForSigned, const SimplifyQuery &SQ)
Combine constant ranges from computeConstantRange() and computeKnownBits().
Definition: ValueTracking.cpp:6958

llvm::computeKnownBits
void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, unsigned Depth=0, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOn...
Definition: ValueTracking.cpp:165

llvm::getFreedOperand
Value * getFreedOperand(const CallBase *CB, const TargetLibraryInfo *TLI)
If this is a call to a free function, return the freed operand.
Definition: MemoryBuiltins.cpp:558

llvm::BitWidth
constexpr unsigned BitWidth
Definition: BitmaskEnum.h:191

llvm::isDereferenceablePointer
bool isDereferenceablePointer(const Value *V, Type *Ty, const DataLayout &DL, const Instruction *CtxI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr, const TargetLibraryInfo *TLI=nullptr)
Return true if this is always a dereferenceable pointer.
Definition: Loads.cpp:221

llvm::is_contained
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
Definition: STLExtras.h:1879

llvm::getAllocSize
std::optional< APInt > getAllocSize(const CallBase *CB, const TargetLibraryInfo *TLI, function_ref< const Value *(const Value *)> Mapper=[](const Value *V) { return V;})
Return the size of the requested allocation.
Definition: MemoryBuiltins.cpp:379

llvm::computeKnownFPSignBit
std::optional< bool > computeKnownFPSignBit(const Value *V, unsigned Depth, const SimplifyQuery &SQ)
Return false if we can prove that the specified FP value's sign bit is 0.
Definition: ValueTracking.h:611

llvm::Log2
unsigned Log2(Align A)
Returns the log2 of the alignment.
Definition: Alignment.h:208

llvm::maskContainsAllOneOrUndef
bool maskContainsAllOneOrUndef(Value *Mask)
Given a mask vector of i1, return true if any of the elements of this predicate mask are known to be ...
Definition: VectorUtils.cpp:1074

llvm::isImpliedByDomCondition
std::optional< bool > isImpliedByDomCondition(const Value *Cond, const Instruction *ContextI, const DataLayout &DL)
Return the boolean condition value in the context of the given instruction if it is known based on do...
Definition: ValueTracking.cpp:9292

llvm::minimum
LLVM_READONLY APFloat minimum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 minimum semantics.
Definition: APFloat.h:1482

llvm::isKnownNegation
bool isKnownNegation(const Value *X, const Value *Y, bool NeedNSW=false, bool AllowPoison=true)
Return true if the two given values are negations of each other.
Definition: ValueTracking.cpp:8344

llvm::Data
@ Data
Definition: SIMachineScheduler.h:55

llvm::isKnownNonNegative
bool isKnownNonNegative(const Value *V, const SimplifyQuery &SQ, unsigned Depth=0)
Returns true if the given value is known to be non-negative.
Definition: ValueTracking.cpp:284

std::swap
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition: BitVector.h:860

raw_ostream.h

NC
#define NC
Definition: regutils.h:42

llvm::AAMDNodes
A collection of metadata nodes that might be associated with a memory access used by the alias-analys...
Definition: Metadata.h:760

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39

llvm::BitTracker
Definition: BitTracker.h:35

llvm::DenormalMode::IEEE
@ IEEE
IEEE-754 denormal numbers preserved.
Definition: FloatingPointMode.h:77

llvm::KnownBits
Definition: KnownBits.h:23

llvm::KnownBits::isNonNegative
bool isNonNegative() const
Returns true if this value is known to be non-negative.
Definition: KnownBits.h:97

llvm::KnownBits::countMinTrailingZeros
unsigned countMinTrailingZeros() const
Returns the minimum number of trailing zero bits.
Definition: KnownBits.h:231

llvm::KnownBits::countMaxTrailingZeros
unsigned countMaxTrailingZeros() const
Returns the maximum number of trailing zero bits possible.
Definition: KnownBits.h:263

llvm::KnownBits::countMaxPopulation
unsigned countMaxPopulation() const
Returns the maximum number of bits that could be one.
Definition: KnownBits.h:278

llvm::KnownBits::getBitWidth
unsigned getBitWidth() const
Get the bit width of this value.
Definition: KnownBits.h:40

llvm::KnownBits::isNonZero
bool isNonZero() const
Returns true if this value is known to be non-zero.
Definition: KnownBits.h:100

llvm::KnownBits::countMinLeadingZeros
unsigned countMinLeadingZeros() const
Returns the minimum number of leading zero bits.
Definition: KnownBits.h:237

llvm::KnownBits::isNegative
bool isNegative() const
Returns true if this value is known to be negative.
Definition: KnownBits.h:94

llvm::KnownBits::countMaxLeadingZeros
unsigned countMaxLeadingZeros() const
Returns the maximum number of leading zero bits possible.
Definition: KnownBits.h:269

llvm::KnownBits::One
APInt One
Definition: KnownBits.h:25

llvm::KnownBits::Zero
APInt Zero
Definition: KnownBits.h:24

llvm::KnownBits::countMinPopulation
unsigned countMinPopulation() const
Returns the number of bits known to be one.
Definition: KnownBits.h:275

llvm::KnownBits::isAllOnes
bool isAllOnes() const
Returns true if value is all one bits.
Definition: KnownBits.h:79

llvm::KnownFPClass
Definition: ValueTracking.h:262

llvm::KnownFPClass::KnownFPClasses
FPClassTest KnownFPClasses
Floating-point classes the value could be one of.
Definition: ValueTracking.h:264

llvm::MaybeAlign
This struct is a compact representation of a valid (power of two) or undefined (0) alignment.
Definition: Alignment.h:117

llvm::MaybeAlign::valueOrOne
Align valueOrOne() const
For convenience, returns a valid alignment or 1 if undefined.
Definition: Alignment.h:141

llvm::MinMax
Definition: AssumeBundleQueries.h:71

llvm::OperandBundleUse
A lightweight accessor for an operand bundle meant to be passed around by value.
Definition: InstrTypes.h:1131

llvm::OperandBundleUse::getTagName
StringRef getTagName() const
Return the tag of this operand bundle as a string.
Definition: InstrTypes.h:1150

llvm::OperandBundleUse::Inputs
ArrayRef< Use > Inputs
Definition: InstrTypes.h:1132

llvm::PatternMatch::m_Mask
Definition: PatternMatch.h:1797

llvm::PatternMatch::m_SpecificMask
Definition: PatternMatch.h:1812

llvm::RetainedKnowledge
Represents one piece of information held inside an operand bundle of an llvm.assume.
Definition: AssumeBundleQueries.h:100

llvm::RetainedKnowledge::AttrKind
Attribute::AttrKind AttrKind
Definition: AssumeBundleQueries.h:101

llvm::RetainedKnowledge::ArgValue
uint64_t ArgValue
Definition: AssumeBundleQueries.h:102

llvm::RetainedKnowledge::WasOn
Value * WasOn
Definition: AssumeBundleQueries.h:103

llvm::SelectPatternResult::Flavor
SelectPatternFlavor Flavor
Definition: ValueTracking.h:1128

llvm::SimplifyQuery
Definition: SimplifyQuery.h:70

llvm::SimplifyQuery::DL
const DataLayout & DL
Definition: SimplifyQuery.h:71

llvm::SimplifyQuery::CxtI
const Instruction * CxtI
Definition: SimplifyQuery.h:75

llvm::SimplifyQuery::getWithInstruction
SimplifyQuery getWithInstruction(const Instruction *I) const
Definition: SimplifyQuery.h:107

llvm::UnderlyingObject
Definition: ScheduleDAGInstrs.h:103

llvm::cl::desc
Definition: CommandLine.h:409