24#ifndef LLVM_TRANSFORMS_VECTORIZE_VPLAN_H
25#define LLVM_TRANSFORMS_VECTORIZE_VPLAN_H
97 const unsigned char SubclassID;
114 VPlan *Plan =
nullptr;
124 assert(Predecessor &&
"Cannot add nullptr predecessor!");
129 void removePredecessor(VPBlockBase *Predecessor) {
130 auto Pos =
find(Predecessors, Predecessor);
131 assert(Pos &&
"Predecessor does not exist");
132 Predecessors.
erase(Pos);
136 void removeSuccessor(VPBlockBase *Successor) {
137 auto Pos =
find(Successors, Successor);
138 assert(Pos &&
"Successor does not exist");
139 Successors.
erase(Pos);
144 void replacePredecessor(VPBlockBase *Old, VPBlockBase *New) {
145 auto I =
find(Predecessors, Old);
147 assert(Old->getParent() ==
New->getParent() &&
148 "replaced predecessor must have the same parent");
154 void replaceSuccessor(VPBlockBase *Old, VPBlockBase *New) {
155 auto I =
find(Successors, Old);
157 assert(Old->getParent() ==
New->getParent() &&
158 "replaced successor must have the same parent");
164 : SubclassID(SC), Name(
N) {}
171 using VPBlockTy =
enum { VPRegionBlockSC, VPBasicBlockSC, VPIRBasicBlockSC };
177 const std::string &
getName()
const {
return Name; }
191 const VPlan *getPlan()
const;
195 void setPlan(
VPlan *ParentPlan);
228 return (Successors.size() == 1 ? *Successors.begin() :
nullptr);
234 return (Predecessors.size() == 1 ? *Predecessors.begin() :
nullptr);
287 assert(Successors.empty() &&
"Setting one successor when others exist.");
289 "connected blocks must have the same parent");
298 assert(Successors.empty() &&
"Setting two successors when others exist.");
299 appendSuccessor(IfTrue);
300 appendSuccessor(IfFalse);
307 assert(Predecessors.empty() &&
"Block predecessors already set.");
308 for (
auto *Pred : NewPreds)
309 appendPredecessor(Pred);
316 assert(Successors.empty() &&
"Block successors already set.");
317 for (
auto *Succ : NewSuccs)
318 appendSuccessor(Succ);
330 assert(Predecessors.size() == 2 &&
"must have 2 predecessors to swap");
331 std::swap(Predecessors[0], Predecessors[1]);
338 assert(Successors.size() == 2 &&
"must have 2 successors to swap");
345 "must have Pred exactly once in Predecessors");
346 return std::distance(Predecessors.begin(),
find(Predecessors, Pred));
352 "must have Succ exactly once in Successors");
353 return std::distance(Successors.begin(),
find(Successors, Succ));
363#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
407 const unsigned char SubclassID;
410 VPBasicBlock *Parent =
nullptr;
434 VPVectorEndPointerSC,
436 VPWidenCanonicalIVSC,
440 VPWidenMemIntrinsicSC,
453 VPCurrentIterationPHISC,
454 VPActiveLaneMaskPHISC,
455 VPFirstOrderRecurrencePHISC,
456 VPWidenIntOrFpInductionSC,
457 VPWidenPointerInductionSC,
461 VPFirstPHISC = VPWidenPHISC,
462 VPFirstHeaderPHISC = VPCurrentIterationPHISC,
463 VPLastHeaderPHISC = VPReductionPHISC,
464 VPLastPHISC = VPReductionPHISC,
469 :
VPDef(),
VPUser(Operands), SubclassID(SC), DL(DL) {}
478 const VPBasicBlock *
getParent()
const {
return Parent; }
544 bool mayReadFromMemory()
const;
547 bool mayWriteToMemory()
const;
560#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
576#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
585#define VP_CLASSOF_IMPL(VPRecipeID) \
586 static inline bool classof(const VPRecipeBase *R) { \
587 return R->getVPRecipeID() == VPRecipeID; \
589 static inline bool classof(const VPValue *V) { \
590 auto *R = V->getDefiningRecipe(); \
591 return R && R->getVPRecipeID() == VPRecipeID; \
593 static inline bool classof(const VPUser *U) { \
594 auto *R = dyn_cast<VPRecipeBase>(U); \
595 return R && R->getVPRecipeID() == VPRecipeID; \
597 static inline bool classof(const VPSingleDefRecipe *R) { \
598 return R->getVPRecipeID() == VPRecipeID; \
624 switch (R->getVPRecipeID()) {
625 case VPRecipeBase::VPDerivedIVSC:
626 case VPRecipeBase::VPExpandSCEVSC:
627 case VPRecipeBase::VPExpressionSC:
628 case VPRecipeBase::VPInstructionSC:
629 case VPRecipeBase::VPReductionEVLSC:
630 case VPRecipeBase::VPReductionSC:
631 case VPRecipeBase::VPReplicateSC:
632 case VPRecipeBase::VPScalarIVStepsSC:
633 case VPRecipeBase::VPVectorPointerSC:
634 case VPRecipeBase::VPVectorEndPointerSC:
635 case VPRecipeBase::VPWidenCallSC:
636 case VPRecipeBase::VPWidenCanonicalIVSC:
637 case VPRecipeBase::VPWidenCastSC:
638 case VPRecipeBase::VPWidenGEPSC:
639 case VPRecipeBase::VPWidenIntrinsicSC:
640 case VPRecipeBase::VPWidenMemIntrinsicSC:
641 case VPRecipeBase::VPWidenSC:
642 case VPRecipeBase::VPBlendSC:
643 case VPRecipeBase::VPPredInstPHISC:
644 case VPRecipeBase::VPCurrentIterationPHISC:
645 case VPRecipeBase::VPActiveLaneMaskPHISC:
646 case VPRecipeBase::VPFirstOrderRecurrencePHISC:
647 case VPRecipeBase::VPWidenPHISC:
648 case VPRecipeBase::VPWidenIntOrFpInductionSC:
649 case VPRecipeBase::VPWidenPointerInductionSC:
650 case VPRecipeBase::VPReductionPHISC:
651 case VPRecipeBase::VPWidenLoadEVLSC:
652 case VPRecipeBase::VPWidenLoadSC:
654 case VPRecipeBase::VPBranchOnMaskSC:
655 case VPRecipeBase::VPInterleaveEVLSC:
656 case VPRecipeBase::VPInterleaveSC:
657 case VPRecipeBase::VPIRInstructionSC:
658 case VPRecipeBase::VPWidenStoreEVLSC:
659 case VPRecipeBase::VPWidenStoreSC:
660 case VPRecipeBase::VPHistogramSC:
667 auto *R = V->getDefiningRecipe();
686#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
695 enum class OperationType :
unsigned char {
735 struct ExactFlagsTy {
737 ExactFlagsTy(
bool Exact) : IsExact(Exact) {}
739 struct FastMathFlagsTy {
740 char AllowReassoc : 1;
743 char NoSignedZeros : 1;
744 char AllowReciprocal : 1;
745 char AllowContract : 1;
753 uint8_t CmpPredStorage;
754 FastMathFlagsTy FMFs;
757 struct ReductionFlagsTy {
760 unsigned char Kind : 6;
762 unsigned char IsOrdered : 1;
763 unsigned char IsInLoop : 1;
764 FastMathFlagsTy FMFs;
766 ReductionFlagsTy(
RecurKind Kind,
bool IsOrdered,
bool IsInLoop,
768 : Kind(static_cast<unsigned char>(Kind)), IsOrdered(IsOrdered),
769 IsInLoop(IsInLoop), FMFs(FMFs) {}
772 OperationType OpType;
793 OpType = OperationType::FCmp;
795 FCmp->getPredicate());
797 FCmpFlags.FMFs = FCmp->getFastMathFlags();
799 OpType = OperationType::Cmp;
804 OpType = OperationType::DisjointOp;
807 OpType = OperationType::OverflowingBinOp;
808 WrapFlags = {
Op->hasNoUnsignedWrap(),
Op->hasNoSignedWrap()};
810 OpType = OperationType::Trunc;
813 OpType = OperationType::PossiblyExactOp;
816 OpType = OperationType::GEPOp;
819 "wrap flags truncated");
821 OpType = OperationType::NonNegOp;
824 OpType = OperationType::FPMathOp;
825 FMFs =
Op->getFastMathFlags();
835 : OpType(OperationType::FCmp),
AllFlags() {
842 : OpType(OperationType::OverflowingBinOp),
AllFlags() {
847 : OpType(OperationType::Trunc),
AllFlags() {
856 : OpType(OperationType::DisjointOp),
AllFlags() {
861 : OpType(OperationType::NonNegOp),
AllFlags() {
866 : OpType(OperationType::PossiblyExactOp),
AllFlags() {
871 : OpType(OperationType::GEPOp),
AllFlags() {
876 : OpType(OperationType::ReductionOp),
AllFlags() {
881 OpType = Other.OpType;
895 case OperationType::OverflowingBinOp:
899 case OperationType::Trunc:
903 case OperationType::DisjointOp:
906 case OperationType::PossiblyExactOp:
909 case OperationType::GEPOp:
912 case OperationType::FPMathOp:
913 case OperationType::FCmp:
914 case OperationType::ReductionOp:
915 getFMFsRef().NoNaNs =
false;
916 getFMFsRef().NoInfs =
false;
918 case OperationType::NonNegOp:
921 case OperationType::Cmp:
922 case OperationType::Other:
930 case OperationType::OverflowingBinOp:
934 case OperationType::Trunc:
938 case OperationType::DisjointOp:
941 case OperationType::PossiblyExactOp:
944 case OperationType::GEPOp:
948 case OperationType::FPMathOp:
949 case OperationType::FCmp: {
950 const FastMathFlagsTy &
F = getFMFsRef();
951 I.setHasAllowReassoc(
F.AllowReassoc);
952 I.setHasNoNaNs(
F.NoNaNs);
953 I.setHasNoInfs(
F.NoInfs);
954 I.setHasNoSignedZeros(
F.NoSignedZeros);
955 I.setHasAllowReciprocal(
F.AllowReciprocal);
956 I.setHasAllowContract(
F.AllowContract);
957 I.setHasApproxFunc(
F.ApproxFunc);
960 case OperationType::NonNegOp:
963 case OperationType::ReductionOp:
965 case OperationType::Cmp:
966 case OperationType::Other:
972 assert((OpType == OperationType::Cmp || OpType == OperationType::FCmp) &&
973 "recipe doesn't have a compare predicate");
980 assert((OpType == OperationType::Cmp || OpType == OperationType::FCmp) &&
981 "recipe doesn't have a compare predicate");
982 if (OpType == OperationType::FCmp)
995 return OpType == OperationType::Cmp || OpType == OperationType::FCmp;
1000 return OpType == OperationType::FPMathOp || OpType == OperationType::FCmp ||
1001 OpType == OperationType::ReductionOp;
1010 assert(OpType == OperationType::NonNegOp &&
1011 "recipe doesn't have a NNEG flag");
1017 case OperationType::OverflowingBinOp:
1019 case OperationType::Trunc:
1028 case OperationType::OverflowingBinOp:
1030 case OperationType::Trunc:
1039 case OperationType::OverflowingBinOp:
1040 case OperationType::Trunc:
1052 assert(OpType == OperationType::DisjointOp &&
1053 "recipe cannot have a disjoing flag");
1058 assert(OpType == OperationType::ReductionOp &&
1059 "recipe doesn't have reduction flags");
1064 assert(OpType == OperationType::ReductionOp &&
1065 "recipe doesn't have reduction flags");
1070 assert(OpType == OperationType::ReductionOp &&
1071 "recipe doesn't have reduction flags");
1077 FastMathFlagsTy &getFMFsRef() {
1078 if (OpType == OperationType::FCmp)
1080 if (OpType == OperationType::ReductionOp)
1084 const FastMathFlagsTy &getFMFsRef()
const {
1085 if (OpType == OperationType::FCmp)
1087 if (OpType == OperationType::ReductionOp)
1106#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
1112static_assert(
sizeof(
VPIRFlags) <= 3,
"VPIRFlags should not grow");
1129 return R->getVPRecipeID() == VPRecipeBase::VPBlendSC ||
1130 R->getVPRecipeID() == VPRecipeBase::VPInstructionSC ||
1131 R->getVPRecipeID() == VPRecipeBase::VPWidenSC ||
1132 R->getVPRecipeID() == VPRecipeBase::VPWidenGEPSC ||
1133 R->getVPRecipeID() == VPRecipeBase::VPWidenCallSC ||
1134 R->getVPRecipeID() == VPRecipeBase::VPWidenCastSC ||
1135 R->getVPRecipeID() == VPRecipeBase::VPWidenIntrinsicSC ||
1136 R->getVPRecipeID() == VPRecipeBase::VPWidenMemIntrinsicSC ||
1137 R->getVPRecipeID() == VPRecipeBase::VPReductionSC ||
1138 R->getVPRecipeID() == VPRecipeBase::VPReductionEVLSC ||
1139 R->getVPRecipeID() == VPRecipeBase::VPReplicateSC ||
1140 R->getVPRecipeID() == VPRecipeBase::VPVectorEndPointerSC ||
1141 R->getVPRecipeID() == VPRecipeBase::VPVectorPointerSC ||
1142 R->getVPRecipeID() == VPRecipeBase::VPWidenCanonicalIVSC;
1151 auto *R = V->getDefiningRecipe();
1192 llvm::find_if(Metadata, [Kind](
const std::pair<unsigned, MDNode *> &
P) {
1193 return P.first == Kind;
1195 if (It != Metadata.end())
1198 Metadata.emplace_back(Kind,
Node);
1208 find_if(Metadata, [Kind](
const auto &
P) {
return P.first == Kind; });
1209 return It != Metadata.end() ? It->second :
nullptr;
1212#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
1230 Instruction::OtherOpsEnd + 1,
1358 bool doesGeneratePerAllLanes()
const;
1363 unsigned getNumOperandsForOpcode()
const;
1366 typedef unsigned char OpcodeTy;
1374 bool canGenerateScalarForFirstLane()
const;
1382 bool alwaysUnmasked()
const {
1388 if (!getUnderlyingValue())
1392 Opcode == Instruction::GetElementPtr;
1396 VPInstruction(
unsigned Opcode, ArrayRef<VPValue *> Operands,
1397 const VPIRFlags &Flags = {},
const VPIRMetadata &MD = {},
1399 Type *ResultTy =
nullptr);
1408 Type *ResultTy =
nullptr) {
1409 auto *New =
new VPInstruction(Opcode, NewOperands, *
this, *
this,
1427#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
1436 case Instruction::Ret:
1437 case Instruction::UncondBr:
1438 case Instruction::CondBr:
1439 case Instruction::Store:
1440 case Instruction::Switch:
1441 case Instruction::IndirectBr:
1442 case Instruction::Resume:
1443 case Instruction::CatchRet:
1444 case Instruction::Unreachable:
1445 case Instruction::Fence:
1446 case Instruction::AtomicRMW:
1460 if (NumOpsForOpcode == -1u)
1474 if (alwaysUnmasked())
1495 bool opcodeMayReadOrWriteFromMemory()
const;
1498 bool usesFirstLaneOnly(
const VPValue *
Op)
const override;
1501 bool usesFirstPartOnly(
const VPValue *
Op)
const override;
1505 bool isVectorToScalar()
const;
1509 bool isSingleScalar()
const;
1518#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
1537 const Twine &Name =
"")
1546 unsigned Opc = VPI->getOpcode();
1553 case Instruction::Load:
1584#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
1632 std::function<
const VPBasicBlock *(size_t)> GetBlock = [
this](
size_t Idx) {
1650#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
1658 const Twine &Name =
"",
Type *ResultTy =
nullptr)
1664 return VPI && VPI->getOpcode() == Instruction::PHI;
1669 return VPI && VPI->getOpcode() == Instruction::PHI;
1674 return VPI && VPI->getOpcode() == Instruction::PHI;
1686#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
1733 "Op must be an operand of the recipe");
1739 "Op must be an operand of the recipe");
1745 "Op must be an operand of the recipe");
1750#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
1780#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
1802 setUnderlyingValue(&
I);
1808 : VPRecipeWithIRFlags(VPRecipeBase::VPWidenSC, Operands,
1811 VPIRMetadata(
Metadata), Opcode(Opcode) {}
1837#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
1846 "Op must be an operand of the recipe");
1847 return Opcode == Instruction::Select &&
Op ==
getOperand(0) &&
1848 Op->isDefinedOutsideLoopRegions();
1868 "Set flags not supported for the provided opcode");
1870 "Opcode requires specific flags to be set");
1894#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
1907 bool MayReadFromMemory;
1910 bool MayWriteToMemory;
1913 bool MayHaveSideEffects;
1923 VectorIntrinsicID(VectorIntrinsicID) {
1924 LLVMContext &Ctx = Ty->getContext();
1927 MayReadFromMemory = !ME.onlyWritesMemory();
1928 MayWriteToMemory = !ME.onlyReadsMemory();
1929 MayHaveSideEffects = MayWriteToMemory ||
1930 !Attrs.hasAttribute(Attribute::NoUnwind) ||
1931 !Attrs.hasAttribute(Attribute::WillReturn);
1945 VPIRMetadata(MD), VectorIntrinsicID(VectorIntrinsicID),
1958 VectorIntrinsicID, CallArguments, Ty, Flags,
1974 return R->getVPRecipeID() == VPRecipeBase::VPWidenIntrinsicSC ||
1975 R->getVPRecipeID() == VPRecipeBase::VPWidenMemIntrinsicSC;
1984 auto *R = V->getDefiningRecipe();
2023#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
2042 VectorIntrinsicID, CallArguments, Ty, {}, MD,
2044 Alignment(Alignment) {
2045 assert(VectorIntrinsicID == Intrinsic::experimental_vp_strided_load &&
2046 "Unexpected intrinsic");
2064 bool IsMasked,
Align Alignment,
2085 : VPRecipeWithIRFlags(VPRecipeBase::VPWidenCallSC, CallArguments,
2089 setUnderlyingValue(UV);
2091 isa<Function>(getOperand(getNumOperands() - 1)->getLiveInIRValue()) &&
2092 "last operand must be the called function");
2093 assert(cast<Function>(CallArguments.
back()->getLiveInIRValue())
2094 ->getReturnType() == getScalarType() &&
2095 "Scalar type must match return type of called scalar function");
2125 bool usesFirstLaneOnly(
const VPValue *
Op)
const override;
2128#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
2175#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
2184 Type *SourceElementTy;
2186 bool isPointerLoopInvariant()
const {
2187 return getOperand(0)->isDefinedOutsideLoopRegions();
2190 bool isIndexLoopInvariant(
unsigned I)
const {
2191 return getOperand(
I + 1)->isDefinedOutsideLoopRegions();
2200 Operands[0]->getScalarType(), Flags,
DL),
2201 SourceElementTy(SourceElementTy) {
2203 setUnderlyingValue(UV);
2236 bool usesFirstLaneOnly(
const VPValue *
Op)
const override;
2239#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
2252 Type *SourceElementTy;
2262 Ptr->getScalarType(), GEPFlags,
DL),
2263 SourceElementTy(SourceElementTy), Stride(Stride) {
2264 assert(Stride < 0 &&
"Stride must be negative");
2285 "Op must be an operand of the recipe");
2299 "Op must be an operand of the recipe");
2309 VEPR->addOperand(
Offset);
2314#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
2326 Type *SourceElementTy;
2333 Ptr->getScalarType(), GEPFlags,
DL),
2334 SourceElementTy(SourceElementTy) {}
2350 "Op must be an operand of the recipe");
2357 "Op must be an operand of the recipe");
2367 Clone->addOperand(VFxPart);
2379#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
2424 return R->getVPRecipeID() >= VPRecipeBase::VPFirstHeaderPHISC &&
2425 R->getVPRecipeID() <= VPRecipeBase::VPLastHeaderPHISC;
2467#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
2495 return R->getVPRecipeID() == VPRecipeBase::VPWidenIntOrFpInductionSC ||
2496 R->getVPRecipeID() == VPRecipeBase::VPWidenPointerInductionSC;
2500 auto *R = V->getDefiningRecipe();
2538 return IndDesc.getNoWrapPredicates();
2545 "VPWidenIntOrFpInductionRecipe generates its own backedge value");
2552 "VPWidenIntOrFpInductionRecipe generates its own backedge value");
2558 "Op must be an operand of the recipe");
2581 Start, Step, IndDesc,
DL),
2591 Start, Step, IndDesc,
2613 "expandVPWidenIntOrFpInductionRecipe");
2648#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
2664 Start, Step, IndDesc,
DL) {
2681 "expandVPWidenPointerInduction");
2688#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
2718 "all incoming values must have the same type");
2737#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
2773 "Op must be an operand of the recipe");
2778#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
2799 unsigned ScaleFactor) {
2800 assert((!Ordered || InLoop) &&
"Ordered implies in-loop");
2821 bool HasUsesOutsideReductionChain;
2828 bool HasUsesOutsideReductionChain =
false)
2830 VPIRFlags(Flags), Kind(Kind), Style(Style),
2831 HasUsesOutsideReductionChain(HasUsesOutsideReductionChain) {
2841 *Start, *BackedgeValue, Style, *
this, HasUsesOutsideReductionChain);
2856 auto *Partial = std::get_if<RdxUnordered>(&Style);
2857 return Partial ? Partial->VFScaleFactor : 1;
2863 assert(ScaleFactor > 1 &&
"must set to scale factor > 1");
2876 bool isOrdered()
const {
return std::holds_alternative<RdxOrdered>(Style); }
2880 return std::holds_alternative<RdxInLoop>(Style) ||
2881 std::holds_alternative<RdxOrdered>(Style);
2889 return HasUsesOutsideReductionChain;
2895 "Op must be an operand of the recipe");
2900#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
2919 assert(Operands.size() >= 2 &&
"Expected at least two operands!");
2921 [
this](
unsigned I) {
2925 "all incoming values must have the same type");
2927 [
this](
unsigned I) {
2928 return getMask(
I)->getScalarType()->isIntegerTy(1);
2930 "masks must be a bool");
2979 bool usesFirstLaneOnly(
const VPValue *
Op)
const override;
2982#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
3000 bool HasMask =
false;
3004 bool NeedsMaskForGaps =
false;
3013 NeedsMaskForGaps(NeedsMaskForGaps) {
3015 assert((!Mask || !IG->isReverse()) &&
3016 "Reversed masked interleave-group not supported.");
3017 if (StoredValues.
empty()) {
3019 assert(!Inst->getType()->isVoidTy() &&
"must have result");
3023 for (
auto *SV : StoredValues)
3036 return R->getVPRecipeID() == VPRecipeBase::VPInterleaveSC ||
3037 R->getVPRecipeID() == VPRecipeBase::VPInterleaveEVLSC;
3097 Mask, NeedsMaskForGaps, MD, DL) {}
3114 "Op must be an operand of the recipe");
3123#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
3138 R.getStoredValues(), Mask, R.needsMaskForGaps(), R,
3140 assert(!getInterleaveGroup()->isReverse() &&
3141 "Reversed interleave-group with tail folding is not supported.");
3142 assert(!needsMaskForGaps() &&
"Interleaved access with gap mask is not "
3143 "supported for scalable vector.");
3163 "Op must be an operand of the recipe");
3173#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
3189 bool IsConditional =
false;
3199 RdxKind(RdxKind), Style(Style) {
3207 "all incoming values must have the same type");
3210 "CondOp must be a bool");
3211 IsConditional =
true;
3222 {ChainOp, VecOp}, CondOp, Style,
DL) {}
3228 {ChainOp, VecOp}, CondOp, Style,
DL) {}
3239 return R->getVPRecipeID() == VPRecipeBase::VPReductionSC ||
3240 R->getVPRecipeID() == VPRecipeBase::VPReductionEVLSC;
3267 bool isOrdered()
const {
return std::holds_alternative<RdxOrdered>(Style); };
3274 return std::holds_alternative<RdxInLoop>(Style) ||
3275 std::holds_alternative<RdxOrdered>(Style);
3288 auto *Partial = std::get_if<RdxUnordered>(&Style);
3289 return Partial ? Partial->VFScaleFactor : 1;
3293#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
3311 {R.getChainOp(), R.getVecOp(), &EVL}, CondOp,
3332 "Op must be an operand of the recipe");
3337#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
3351 bool IsSingleScalar;
3358 bool IsSingleScalar,
VPValue *Mask =
nullptr,
3360 DebugLoc
DL = DebugLoc::getUnknown())
3361 : VPRecipeWithIRFlags(VPRecipeBase::VPReplicateSC, Operands,
3362 computeScalarType(
I, Operands), Flags,
DL),
3363 VPIRMetadata(
Metadata), IsSingleScalar(IsSingleScalar),
3364 IsPredicated(Mask) {
3365 setUnderlyingValue(
I);
3383 Copy->transferFlags(*
this);
3412 "Op must be an operand of the recipe");
3419 "Op must be an operand of the recipe");
3432#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
3459#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
3463 O << Indent <<
"BRANCH-ON-MASK ";
3471 "Op must be an operand of the recipe");
3494 enum class ExpressionTypes {
3501 NegatedExtendedReduction,
3513 ExtNegatedMulAccReduction,
3517 ExpressionTypes ExpressionType;
3525 VPExpressionRecipe(ExpressionTypes ExpressionType,
3530 : VPExpressionRecipe(ExpressionTypes::ExtendedReduction, {Ext, Red}) {}
3533 : VPExpressionRecipe(ExpressionTypes::NegatedExtendedReduction,
3537 "Expected an add reduction");
3538 if (Neg->getOpcode() == Instruction::Sub) {
3540 assert(SubConst && SubConst->isZero() &&
"Expected a negating sub");
3542 assert(Neg->getOpcode() == Instruction::FNeg &&
"Unexpected opcode");
3545 : VPExpressionRecipe(ExpressionTypes::MulAccReduction, {
Mul, Red}) {}
3548 : VPExpressionRecipe(ExpressionTypes::ExtMulAccReduction,
3549 {Ext0, Ext1,
Mul, Red}) {}
3553 : VPExpressionRecipe(ExpressionTypes::ExtNegatedMulAccReduction,
3554 {Ext0, Ext1,
Mul, Neg, Red}) {
3555 assert((
Mul->getOpcode() == Instruction::Mul ||
3556 Mul->getOpcode() == Instruction::FMul) &&
3560 "Expected an add reduction");
3562 if (Neg->getOpcode() == Instruction::Sub) {
3564 assert(SubConst && SubConst->isZero() &&
3565 Neg->getOpcode() == Instruction::Sub &&
"Expected a negating sub");
3567 assert(Neg->getOpcode() == Instruction::FNeg &&
"Unexpected opcode");
3572 for (
auto *R :
reverse(ExpressionRecipes)) {
3573 if (ExpressionRecipesSeen.
insert(R).second)
3576 for (
VPValue *
T : LiveInPlaceholders)
3583 assert(!ExpressionRecipes.empty() &&
"empty expressions should be removed");
3585 for (
auto *R : ExpressionRecipes)
3586 NewExpressiondRecipes.
push_back(R->clone());
3587 for (
auto *New : NewExpressiondRecipes) {
3588 for (
const auto &[Idx, Old] :
enumerate(ExpressionRecipes))
3589 New->replaceUsesOfWith(Old, NewExpressiondRecipes[Idx]);
3592 for (
const auto &[Placeholder, OutsideOp] :
3594 New->replaceUsesOfWith(Placeholder, OutsideOp);
3596 return new VPExpressionRecipe(ExpressionType, NewExpressiondRecipes);
3614 return PR ? PR->getVFScaleFactor() : 1;
3637#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
3676#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
3732 return isMasked() ? R->getOperand(R->getNumOperands() - 1) :
nullptr;
3775 "Op must be an operand of the recipe");
3785#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
3800 L.getIngredient().
getType(), &L.getIngredient(),
3825 "Op must be an operand of the recipe");
3835#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
3877 "Op must be an operand of the recipe");
3887#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
3929 "Op must be an operand of the recipe");
3944#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
3965 llvm_unreachable(
"SCEV expressions must be expanded before final execute");
3978#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
4008#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
4035 "scalar phi recipe");
4048 "Op must be an operand of the recipe");
4053#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
4068 CanonicalIV->
getType(), Flags) {}
4076 WideCanIV->addOperand(Step);
4103#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
4126 Start, CanonicalIV, Step) {}
4132 Start->getScalarType(),
nullptr),
4133 Kind(Kind), FPBinOp(FPBinOp) {}
4164 "Op must be an operand of the recipe");
4169#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
4191 IV->getScalarType(), FMFs,
DL),
4192 InductionOpcode(Opcode) {}
4211 NewR->setStartIndex(StartIndex);
4250 "Op must be an operand of the recipe");
4257#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
4268template <
typename VPMixin,
typename... RecipeTys>
4271 CastInfoMixinImpl<VPMixin, RecipeTys...>> {
4272 static_assert((std::is_base_of_v<VPMixin, RecipeTys> && ...),
4273 "Each type in RecipeTys must derive from VPMixin");
4280 VPMixin *Out =
nullptr;
4282 assert(Out &&
"Illegal recipe for cast");
4303 CastInfo<VPPhiAccessors, VPRecipeBase *>> {};
4333 CastInfo<VPIRMetadata, VPRecipeBase *>> {};
4400 return V->getVPBlockID() == VPBlockBase::VPBasicBlockSC ||
4401 V->getVPBlockID() == VPBlockBase::VPIRBasicBlockSC;
4405 assert(Recipe &&
"No recipe to append.");
4406 assert(!Recipe->Parent &&
"Recipe already in VPlan");
4407 Recipe->Parent =
this;
4408 Recipes.insert(InsertPt, Recipe);
4438#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
4455 bool isExiting()
const;
4465 const VPBasicBlock *getCFGPredecessor(
unsigned Idx)
const;
4481inline const VPBasicBlock *
4491class VPIRBasicBlock :
public VPBasicBlock {
4498 : VPBasicBlock(VPIRBasicBlockSC,
4506 return V->getVPBlockID() == VPBlockBase::VPIRBasicBlockSC;
4523 std::unique_ptr<VPRegionValue> CanIV;
4562 std::unique_ptr<VPCanonicalIVInfo> CanIVInfo;
4567 const std::string &Name =
"")
4568 :
VPBlockBase(VPRegionBlockSC, Name), Entry(Entry), Exiting(Exiting) {
4570 assert(!Entry->hasPredecessors() &&
"Entry block has predecessors.");
4571 assert(Exiting &&
"Must also pass Exiting if Entry is passed.");
4572 assert(!Exiting->hasSuccessors() &&
"Exit block has successors.");
4573 Entry->setParent(
this);
4574 Exiting->setParent(
this);
4578 VPRegionBlock(Type *CanIVTy, DebugLoc
DL, VPBlockBase *Entry,
4579 VPBlockBase *Exiting,
const std::string &Name =
"")
4580 : VPRegionBlock(Entry, Exiting, Name) {
4581 CanIVInfo = std::make_unique<VPCanonicalIVInfo>(CanIVTy,
DL,
this);
4589 return V->getVPBlockID() == VPBlockBase::VPRegionBlockSC;
4599 "Entry block cannot have predecessors.");
4611 "Exit block cannot have successors.");
4612 Exiting = ExitingBlock;
4633#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
4651 void dissolveToCFGLoop();
4661 return CanIVInfo ? CanIVInfo->getRegionValue() :
nullptr;
4664 return CanIVInfo ? CanIVInfo->getRegionValue() :
nullptr;
4669 return CanIVInfo->getRegionValue()->getType();
4679 CanIVInfo->clearNUW();
4757 : Entry(Entry), ScalarHeader(ScalarHeader), VectorTripCount(IdxTy),
4758 VF(IdxTy), UF(IdxTy), VFxUF(IdxTy) {
4759 Entry->setPlan(
this);
4760 assert(ScalarHeader->getNumSuccessors() == 0 &&
4761 "scalar header must be a leaf node");
4774 : VectorTripCount(IdxTy), VF(IdxTy), UF(IdxTy), VFxUF(IdxTy) {
4825 "cannot call the function after vector loop region has been removed");
4856 assert(TripCount &&
"trip count needs to be set before accessing it");
4863 assert(!TripCount && NewTripCount &&
"TripCount should not be set yet.");
4864 TripCount = NewTripCount;
4871 "TripCount must be set when resetting");
4872 TripCount = NewTripCount;
4878 if (!BackedgeTakenCount)
4880 return BackedgeTakenCount;
4908 assert(
hasVF(VF) &&
"Cannot set VF not already in plan");
4915 assert(
hasVF(VF) &&
"tried to remove VF not present in plan");
4933 assert(VFs.size() == 1 &&
"expected plan with single VF");
4938 bool HasScalarVFOnly = VFs.size() == 1 && VFs[0].isScalar();
4940 "Plan with scalar VF should only have a single VF");
4941 return HasScalarVFOnly;
4944 bool hasUF(
unsigned UF)
const {
return UFs.empty() || UFs.contains(UF); }
4948 assert(UFs.size() == 1 &&
"Expected a single UF");
4953 assert(
hasUF(UF) &&
"Cannot set the UF not already in plan");
4970 assert(V &&
"Trying to get or add the VPIRValue of a null Value");
4971 auto [It, Inserted] = LiveIns.try_emplace(V);
4980 "Only VPIRValues should be in mapping");
4984 assert(V &&
"Trying to get or add the VPIRValue of a null VPIRValue");
5010 bool IsSigned =
false) {
5026#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
5050 CreatedBlocks.push_back(VPB);
5059 const std::string &Name =
"",
5063 CreatedBlocks.push_back(VPB);
5071 const std::string &Name =
"") {
5073 CreatedBlocks.push_back(VPB);
5096 (ExitBlocks.size() == 1 && ExitBlocks[0]->getNumPredecessors() > 1);
5112#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
static MCDisassembler::DecodeStatus addOperand(MCInst &Inst, const MCOperand &Opnd)
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static void print(raw_ostream &Out, object::Archive::Kind Kind, T Val)
This file implements methods to test, set and extract typed bits from packed unsigned integers.
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")
#define LLVM_DUMP_METHOD
Mark debug helper function definitions like dump() that should not be stripped from debug builds.
#define LLVM_ABI_FOR_TEST
#define LLVM_PACKED_START
This file defines an InstructionCost class that is used when calculating the cost of an instruction,...
static Value * getOpcode(Value &V, Type &Ty, InstrumentationConfig &IConf, InstrumentorIRBuilderTy &IIRB)
static std::pair< Value *, APInt > getMask(Value *WideMask, unsigned Factor, ElementCount LeafValueEC)
static DebugLoc getDebugLoc(MachineBasicBlock::instr_iterator FirstMI, MachineBasicBlock::instr_iterator LastMI)
Return the first DebugLoc that has line number information, given a range of instructions.
This file implements a map that provides insertion order iteration.
This file provides utility analysis objects describing memory locations.
MachineInstr unsigned OpIdx
static StringRef getName(Value *V)
static bool mayHaveSideEffects(MachineInstr &MI)
This file defines the SmallPtrSet class.
This file defines the SmallVector class.
static SymbolRef::Type getType(const Symbol *Sym)
static const BasicSubtargetSubTypeKV * find(StringRef S, ArrayRef< BasicSubtargetSubTypeKV > A)
Find KV in array using binary search.
This file contains the declarations of the entities induced by Vectorization Plans,...
#define VP_CLASSOF_IMPL(VPRecipeID)
static const uint32_t IV[8]
Class for arbitrary precision integers.
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
Represent a constant reference to an array (0 or more elements consecutively in memory),...
const T & back() const
Get the last element.
bool empty() const
Check if the array is empty.
LLVM Basic Block Representation.
LLVM_ABI const DataLayout & getDataLayout() const
Get the data layout of the module this basic block belongs to.
LLVM_ABI LLVMContext & getContext() const
Get the context in which this basic block lives.
This class represents a function call, abstracting a target machine's calling convention.
This is the base class for all instructions that perform data casts.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
A parsed version of the target data layout string in and methods for querying it.
static DebugLoc getUnknown()
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
static constexpr ElementCount getFixed(ScalarTy MinVal)
Utility class for floating point operations which can have information about relaxed accuracy require...
Convenience struct for specifying and reasoning about fast-math flags.
Represents flags for the getelementptr instruction/expression.
static GEPNoWrapFlags fromRaw(unsigned Flags)
an instruction for type-safe pointer arithmetic to access elements of arrays and structs
Common base class shared among various IRBuilders.
A struct for saving information about induction variables.
InductionKind
This enum represents the kinds of inductions that we support.
InnerLoopVectorizer vectorizes loops which contain only one basic block to a specified vectorization ...
The group of interleaved loads/stores sharing the same stride and close to each other.
This is an important class for using LLVM in a threaded context.
An instruction for reading from memory.
LoopVectorizationCostModel - estimates the expected speedups due to vectorization.
Represents a single loop in the control flow graph.
The RecurrenceDescriptor is used to identify recurrences variables in a loop.
This class represents an assumption made using SCEV expressions which can be checked at run-time.
This class represents an analyzed expression in the program.
This class provides computation of slot numbers for LLVM Assembly writing.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
A SetVector that performs no allocations if smaller than a certain size.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
iterator erase(const_iterator CI)
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
An instruction for storing to memory.
Represent a constant reference to a string, i.e.
std::string str() const
Get the contents as an std::string.
This class represents a truncation of integer types.
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
LLVM_ABI std::string str() const
Return the twine contents as a std::string.
The instances of the Type class are immutable: once they are created, they are never changed.
bool isIntegerTy() const
True if this is an instance of IntegerType.
void execute(VPTransformState &State) override
Generate the active lane mask phi of the vector loop.
VPActiveLaneMaskPHIRecipe * clone() override
Clone the current recipe.
void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
VPActiveLaneMaskPHIRecipe(VPValue *StartMask, DebugLoc DL)
~VPActiveLaneMaskPHIRecipe() override=default
VPBasicBlock serves as the leaf of the Hierarchical Control-Flow Graph.
RecipeListTy::const_iterator const_iterator
void appendRecipe(VPRecipeBase *Recipe)
Augment the existing recipes of a VPBasicBlock with an additional Recipe as the last recipe.
RecipeListTy::const_reverse_iterator const_reverse_iterator
RecipeListTy::iterator iterator
Instruction iterators...
RecipeListTy & getRecipeList()
Returns a reference to the list of recipes.
iplist< VPRecipeBase > RecipeListTy
VPBasicBlock(const unsigned char BlockSC, const Twine &Name="")
iterator begin()
Recipe iterator methods.
RecipeListTy::reverse_iterator reverse_iterator
iterator_range< iterator > phis()
Returns an iterator range over the PHI-like recipes in the block.
const VPBasicBlock * getCFGPredecessor(unsigned Idx) const
Returns the predecessor block at index Idx with the predecessors as per the corresponding plain CFG.
iterator getFirstNonPhi()
Return the position of the first non-phi node recipe in the block.
const_reverse_iterator rbegin() const
RecipeListTy Recipes
The VPRecipes held in the order of output instructions to generate.
const VPRecipeBase & front() const
const_iterator begin() const
const VPRecipeBase & back() const
void insert(VPRecipeBase *Recipe, iterator InsertPt)
const_iterator end() const
static bool classof(const VPBlockBase *V)
Method to support type inquiry through isa, cast, and dyn_cast.
static RecipeListTy VPBasicBlock::* getSublistAccess(VPRecipeBase *)
Returns a pointer to a member of the recipe list.
reverse_iterator rbegin()
const_reverse_iterator rend() const
VPValue * getIncomingValue(unsigned Idx) const
Return incoming value number Idx.
VPValue * getMask(unsigned Idx) const
Return mask number Idx.
VPBlendRecipe(PHINode *Phi, ArrayRef< VPValue * > Operands, const VPIRFlags &Flags, DebugLoc DL)
The blend operation is a User of the incoming values and of their respective masks,...
unsigned getNumIncomingValues() const
Return the number of incoming values, taking into account when normalized the first incoming value wi...
void execute(VPTransformState &State) override
The method which generates the output IR instructions that correspond to this VPRecipe,...
VPBlendRecipe * cloneWithOperands(ArrayRef< VPValue * > NewOperands)
VPBlendRecipe * clone() override
Clone the current recipe.
void setMask(unsigned Idx, VPValue *V)
Set mask number Idx to V.
bool isNormalized() const
A normalized blend is one that has an odd number of operands, whereby the first operand does not have...
VPBlockBase is the building block of the Hierarchical Control-Flow Graph.
void setSuccessors(ArrayRef< VPBlockBase * > NewSuccs)
Set each VPBasicBlock in NewSuccss as successor of this VPBlockBase.
VPRegionBlock * getParent()
VPBlocksTy & getPredecessors()
iterator_range< VPBlockBase ** > predecessors()
LLVM_DUMP_METHOD void dump() const
Dump this VPBlockBase to dbgs().
void setName(const Twine &newName)
size_t getNumSuccessors() const
iterator_range< VPBlockBase ** > successors()
virtual void print(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const =0
Print plain-text dump of this VPBlockBase to O, prefixing all lines with Indent.
bool hasPredecessors() const
Returns true if this block has any predecessors.
void swapSuccessors()
Swap successors of the block. The block must have exactly 2 successors.
void printSuccessors(raw_ostream &O, const Twine &Indent) const
Print the successors of this block to O, prefixing all lines with Indent.
SmallVectorImpl< VPBlockBase * > VPBlocksTy
virtual ~VPBlockBase()=default
const VPBlocksTy & getHierarchicalPredecessors()
unsigned getIndexForSuccessor(const VPBlockBase *Succ) const
Returns the index for Succ in the blocks successor list.
size_t getNumPredecessors() const
void setPredecessors(ArrayRef< VPBlockBase * > NewPreds)
Set each VPBasicBlock in NewPreds as predecessor of this VPBlockBase.
VPBlockBase * getEnclosingBlockWithPredecessors()
unsigned getIndexForPredecessor(const VPBlockBase *Pred) const
Returns the index for Pred in the blocks predecessors list.
bool hasSuccessors() const
Returns true if this block has any successors.
const VPBlocksTy & getPredecessors() const
virtual VPBlockBase * clone()=0
Clone the current block and it's recipes without updating the operands of the cloned recipes,...
enum { VPRegionBlockSC, VPBasicBlockSC, VPIRBasicBlockSC } VPBlockTy
An enumeration for keeping track of the concrete subclass of VPBlockBase that are actually instantiat...
virtual InstructionCost cost(ElementCount VF, VPCostContext &Ctx)=0
Return the cost of the block.
void setPlan(VPlan *ParentPlan)
Sets the pointer of the plan containing the block.
const VPRegionBlock * getParent() const
const std::string & getName() const
void clearSuccessors()
Remove all the successors of this block.
VPBlockBase * getSingleHierarchicalSuccessor()
void setTwoSuccessors(VPBlockBase *IfTrue, VPBlockBase *IfFalse)
Set two given VPBlockBases IfTrue and IfFalse to be the two successors of this VPBlockBase.
VPBlockBase * getSinglePredecessor() const
virtual void execute(VPTransformState *State)=0
The method which generates the output IR that correspond to this VPBlockBase, thereby "executing" the...
const VPBlocksTy & getHierarchicalSuccessors()
void clearPredecessors()
Remove all the predecessor of this block.
friend class VPBlockUtils
unsigned getVPBlockID() const
void printAsOperand(raw_ostream &OS, bool PrintType=false) const
void swapPredecessors()
Swap predecessors of the block.
VPBlockBase(const unsigned char SC, const std::string &N)
VPBlocksTy & getSuccessors()
VPBlockBase * getEnclosingBlockWithSuccessors()
An Enclosing Block of a block B is any block containing B, including B itself.
void setOneSuccessor(VPBlockBase *Successor)
Set a given VPBlockBase Successor as the single successor of this VPBlockBase.
void setParent(VPRegionBlock *P)
VPBlockBase * getSingleHierarchicalPredecessor()
VPBlockBase * getSingleSuccessor() const
const VPBlocksTy & getSuccessors() const
void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
VPBranchOnMaskRecipe * clone() override
Clone the current recipe.
bool usesScalars(const VPValue *Op) const override
Returns true if the recipe uses scalars of operand Op.
VPBranchOnMaskRecipe(VPValue *BlockInMask, DebugLoc DL)
VPlan-based builder utility analogous to IRBuilder.
VPRegionValue * getRegionValue()
VPCanonicalIVInfo(Type *Ty, DebugLoc DL, VPRegionBlock *Region)
const VPRegionValue * getRegionValue() const
VPCurrentIterationPHIRecipe * clone() override
Clone the current recipe.
VPCurrentIterationPHIRecipe(VPValue *StartIV, DebugLoc DL)
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPCurrentIterationPHIRecipe.
LLVM_ABI_FOR_TEST void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
void execute(VPTransformState &State) override
Generate the phi nodes.
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the recipe only uses the first lane of operand Op.
~VPCurrentIterationPHIRecipe() override=default
InductionDescriptor::InductionKind getInductionKind() const
VPValue * getIndex() const
const FPMathOperator * getFPBinOp() const
VPIRValue * getStartValue() const
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPDerivedIVRecipe.
VPValue * getStepValue() const
void execute(VPTransformState &State) override
The method which generates the output IR instructions that correspond to this VPRecipe,...
VPDerivedIVRecipe * clone() override
Clone the current recipe.
VPDerivedIVRecipe(InductionDescriptor::InductionKind Kind, const FPMathOperator *FPBinOp, VPIRValue *Start, VPValue *IV, VPValue *Step)
void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
~VPDerivedIVRecipe() override=default
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the recipe only uses the first lane of operand Op.
VPDerivedIVRecipe(const InductionDescriptor &IndDesc, VPIRValue *Start, VPValue *CanonicalIV, VPValue *Step)
Template specialization of the standard LLVM dominator tree utility for VPBlockBases.
void execute(VPTransformState &State) override
The method which generates the output IR instructions that correspond to this VPRecipe,...
void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPExpandSCEVRecipe.
VPExpandSCEVRecipe(const SCEV *Expr)
const SCEV * getSCEV() const
VPExpandSCEVRecipe * clone() override
Clone the current recipe.
~VPExpandSCEVRecipe() override=default
void execute(VPTransformState &State) override
Method for generating code, must not be called as this recipe is abstract.
bool isVectorToScalar() const
Returns true if this VPExpressionRecipe produces a single scalar.
VPValue * getOperandOfResultType() const
Return the VPValue to use to infer the result type of the recipe.
VPExpressionRecipe(VPWidenCastRecipe *Ext, VPWidenRecipe *Neg, VPReductionRecipe *Red)
VPExpressionRecipe * clone() override
Clone the current recipe.
void decompose()
Insert the recipes of the expression back into the VPlan, directly before the current recipe.
~VPExpressionRecipe() override
VPExpressionRecipe(VPWidenCastRecipe *Ext, VPReductionRecipe *Red)
bool mayHaveSideEffects() const
Returns true if this expression contains recipes that may have side effects.
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Compute the cost of this recipe either using a recipe's specialized implementation or using the legac...
bool mayReadOrWriteMemory() const
Returns true if this expression contains recipes that may read from or write to memory.
VPExpressionRecipe(VPWidenCastRecipe *Ext0, VPWidenCastRecipe *Ext1, VPWidenRecipe *Mul, VPReductionRecipe *Red)
VPExpressionRecipe(VPWidenCastRecipe *Ext0, VPWidenCastRecipe *Ext1, VPWidenRecipe *Mul, VPWidenRecipe *Neg, VPReductionRecipe *Red)
void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
unsigned getVFScaleFactor() const
VPExpressionRecipe(VPWidenRecipe *Mul, VPReductionRecipe *Red)
A recipe representing a sequence of load -> update -> store as part of a histogram operation.
void execute(VPTransformState &State) override
Produce a vectorized histogram operation.
VPHistogramRecipe * clone() override
Clone the current recipe.
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPHistogramRecipe.
void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
VPValue * getMask() const
Return the mask operand if one was provided, or a null pointer if all lanes should be executed uncond...
unsigned getOpcode() const
VP_CLASSOF_IMPL(VPRecipeBase::VPHistogramSC)
~VPHistogramRecipe() override=default
VPHistogramRecipe(unsigned Opcode, ArrayRef< VPValue * > Operands, const VPIRMetadata &Metadata={}, DebugLoc DL=DebugLoc::getUnknown())
A special type of VPBasicBlock that wraps an existing IR basic block.
void execute(VPTransformState *State) override
The method which generates the output IR instructions that correspond to this VPBasicBlock,...
BasicBlock * getIRBasicBlock() const
static bool classof(const VPBlockBase *V)
~VPIRBasicBlock() override=default
VPIRBasicBlock * clone() override
Clone the current block and it's recipes, without updating the operands of the cloned recipes.
Class to record and manage LLVM IR flags.
ReductionFlagsTy ReductionFlags
LLVM_ABI_FOR_TEST bool hasRequiredFlagsForOpcode(unsigned Opcode) const
Returns true if Opcode has its required flags set.
bool hasNoWrapFlags() const
VPIRFlags(RecurKind Kind, bool IsOrdered, bool IsInLoop, FastMathFlags FMFs)
LLVM_ABI_FOR_TEST bool flagsValidForOpcode(unsigned Opcode) const
Returns true if the set flags are valid for Opcode.
static VPIRFlags getDefaultFlags(unsigned Opcode)
Returns default flags for Opcode for opcodes that support it, asserts otherwise.
VPIRFlags(DisjointFlagsTy DisjointFlags)
VPIRFlags(WrapFlagsTy WrapFlags)
void printFlags(raw_ostream &O) const
VPIRFlags(CmpInst::Predicate Pred, FastMathFlags FMFs)
bool hasFastMathFlags() const
Returns true if the recipe has fast-math flags.
LLVM_ABI_FOR_TEST FastMathFlags getFastMathFlags() const
bool isReductionOrdered() const
CmpInst::Predicate getPredicate() const
WrapFlagsTy getNoWrapFlags() const
bool hasNonNegFlag() const
Returns true if the recipe has non-negative flag.
void transferFlags(VPIRFlags &Other)
bool hasNoSignedWrap() const
void intersectFlags(const VPIRFlags &Other)
Only keep flags also present in Other.
VPIRFlags(TruncFlagsTy TruncFlags)
VPIRFlags(FastMathFlags FMFs)
VPIRFlags(NonNegFlagsTy NonNegFlags)
VPIRFlags(CmpInst::Predicate Pred)
VPIRFlags(ExactFlagsTy ExactFlags)
GEPNoWrapFlags getGEPNoWrapFlags() const
bool hasPredicate() const
Returns true if the recipe has a comparison predicate.
DisjointFlagsTy DisjointFlags
void setPredicate(CmpInst::Predicate Pred)
bool hasNoUnsignedWrap() const
NonNegFlagsTy NonNegFlags
bool isReductionInLoop() const
void dropPoisonGeneratingFlags()
Drop all poison-generating flags.
void applyFlags(Instruction &I) const
Apply the IR flags to I.
VPIRFlags(GEPNoWrapFlags GEPFlags)
RecurKind getRecurKind() const
VPIRFlags(Instruction &I)
Instruction & getInstruction() const
bool usesFirstPartOnly(const VPValue *Op) const override
Returns true if the VPUser only uses the first part of operand Op.
~VPIRInstruction() override=default
void execute(VPTransformState &State) override
The method which generates the output IR instructions that correspond to this VPRecipe,...
VPIRInstruction * clone() override
Clone the current recipe.
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the VPUser only uses the first lane of operand Op.
static LLVM_ABI_FOR_TEST VPIRInstruction * create(Instruction &I)
Create a new VPIRPhi for \I , if it is a PHINode, otherwise create a VPIRInstruction.
LLVM_ABI_FOR_TEST InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPIRInstruction.
bool usesScalars(const VPValue *Op) const override
Returns true if the VPUser uses scalars of operand Op.
VPIRInstruction(Instruction &I)
VPIRInstruction::create() should be used to create VPIRInstructions, as subclasses may need to be cre...
void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
VPInstructionWithType(unsigned Opcode, ArrayRef< VPValue * > Operands, Type *ResultTy, const VPIRFlags &Flags={}, const VPIRMetadata &Metadata={}, DebugLoc DL=DebugLoc::getUnknown(), const Twine &Name="")
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPInstruction.
static bool classof(const VPUser *R)
static bool classof(const VPRecipeBase *R)
Type * getResultType() const
VPInstruction * clone() override
Clone the current recipe.
void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
void execute(VPTransformState &State) override
Generate the instruction.
This is a concrete Recipe that models a single VPlan-level instruction.
VPInstruction(unsigned Opcode, ArrayRef< VPValue * > Operands, const VPIRFlags &Flags={}, const VPIRMetadata &MD={}, DebugLoc DL=DebugLoc::getUnknown(), const Twine &Name="", Type *ResultTy=nullptr)
unsigned getNumOperandsWithoutMask() const
Returns the number of operands, excluding the mask if the VPInstruction is masked.
iterator_range< operand_iterator > operandsWithoutMask()
Returns an iterator range over the operands excluding the mask operand if present.
VPInstruction * clone() override
Clone the current recipe.
@ ExtractLastActive
Extracts the last active lane from a set of vectors.
@ ExtractLane
Extracts a single lane (first operand) from a set of vector operands.
@ ExitingIVValue
Compute the exiting value of a wide induction after vectorization, that is the value of the last lane...
@ WideIVStep
Scale the first operand (vector step) by the second operand (scalar-step).
@ ExtractPenultimateElement
@ ResumeForEpilogue
Explicit user for the resume phi of the canonical induction in the main VPlan, used by the epilogue v...
@ Unpack
Extracts all lanes from its (non-scalable) vector operand.
@ FirstOrderRecurrenceSplice
@ ReductionStartVector
Start vector for reductions with 3 operands: the original start value, the identity value for the red...
@ BuildVector
Creates a fixed-width vector containing all operands.
@ BuildStructVector
Given operands of (the same) struct type, creates a struct of fixed- width vectors each containing a ...
@ VScale
Returns the value for vscale.
@ CanonicalIVIncrementForPart
@ ComputeReductionResult
Reduce the operands to the final reduction result using the operation specified via the operation's V...
@ CalculateTripCountMinusVF
iterator_range< const_operand_iterator > operandsWithoutMask() const
void addMask(VPValue *Mask)
Add mask Mask to an unmasked VPInstruction, if it needs masking.
StringRef getName() const
Returns the symbolic name assigned to the VPInstruction.
unsigned getOpcode() const
void setName(StringRef NewName)
Set the symbolic name for the VPInstruction.
VPValue * getMask() const
Returns the mask for the VPInstruction.
VPInstruction * cloneWithOperands(ArrayRef< VPValue * > NewOperands, Type *ResultTy=nullptr)
unsigned getNumOperandsForOpcode() const
Return the number of operands determined by the opcode of the VPInstruction, excluding mask.
bool isMasked() const
Returns true if the VPInstruction has a mask operand.
A common base class for interleaved memory operations.
virtual unsigned getNumStoreOperands() const =0
Returns the number of stored operands of this interleave group.
bool usesFirstLaneOnly(const VPValue *Op) const override=0
Returns true if the recipe only uses the first lane of operand Op.
bool needsMaskForGaps() const
Return true if the access needs a mask because of the gaps.
void execute(VPTransformState &State) override
The method which generates the output IR instructions that correspond to this VPRecipe,...
static bool classof(const VPUser *U)
VPInterleaveBase(const unsigned char SC, const InterleaveGroup< Instruction > *IG, ArrayRef< VPValue * > Operands, ArrayRef< VPValue * > StoredValues, VPValue *Mask, bool NeedsMaskForGaps, const VPIRMetadata &MD, DebugLoc DL)
Instruction * getInsertPos() const
static bool classof(const VPRecipeBase *R)
const InterleaveGroup< Instruction > * getInterleaveGroup() const
VPValue * getMask() const
Return the mask used by this recipe.
ArrayRef< VPValue * > getStoredValues() const
Return the VPValues stored by this interleave group.
VPInterleaveBase * clone() override=0
Clone the current recipe.
VPValue * getAddr() const
Return the address accessed by this recipe.
bool usesFirstLaneOnly(const VPValue *Op) const override
The recipe only uses the first lane of the address, and EVL operand.
VPValue * getEVL() const
The VPValue of the explicit vector length.
~VPInterleaveEVLRecipe() override=default
unsigned getNumStoreOperands() const override
Returns the number of stored operands of this interleave group.
VPInterleaveEVLRecipe * clone() override
Clone the current recipe.
VPInterleaveEVLRecipe(VPInterleaveRecipe &R, VPValue &EVL, VPValue *Mask)
VPInterleaveRecipe is a recipe for transforming an interleave group of load or stores into one wide l...
unsigned getNumStoreOperands() const override
Returns the number of stored operands of this interleave group.
~VPInterleaveRecipe() override=default
VPInterleaveRecipe * clone() override
Clone the current recipe.
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the recipe only uses the first lane of operand Op.
VPInterleaveRecipe(const InterleaveGroup< Instruction > *IG, VPValue *Addr, ArrayRef< VPValue * > StoredValues, VPValue *Mask, bool NeedsMaskForGaps, const VPIRMetadata &MD, DebugLoc DL)
In what follows, the term "input IR" refers to code that is fed into the vectorizer whereas the term ...
A VPRecipeValue defined by a multi-def recipe, stores a pointer to it.
Helper type to provide functions to access incoming values and blocks for phi-like recipes.
virtual const VPRecipeBase * getAsRecipe() const =0
Return a VPRecipeBase* to the current object.
VPValue * getIncomingValueForBlock(const VPBasicBlock *VPBB) const
Returns the incoming value for VPBB. VPBB must be an incoming block.
VPUser::const_operand_range incoming_values() const
Returns an interator range over the incoming values.
virtual unsigned getNumIncoming() const
Returns the number of incoming values, also number of incoming blocks.
void removeIncomingValueFor(VPBlockBase *IncomingBlock) const
Removes the incoming value for IncomingBlock, which must be a predecessor.
const VPBasicBlock * getIncomingBlock(unsigned Idx) const
Returns the incoming block with index Idx.
detail::zippy< llvm::detail::zip_first, VPUser::const_operand_range, const_incoming_blocks_range > incoming_values_and_blocks() const
Returns an iterator range over pairs of incoming values and corresponding incoming blocks.
VPValue * getIncomingValue(unsigned Idx) const
Returns the incoming VPValue with index Idx.
virtual ~VPPhiAccessors()=default
void printPhiOperands(raw_ostream &O, VPSlotTracker &SlotTracker) const
Print the recipe.
void setIncomingValueForBlock(const VPBasicBlock *VPBB, VPValue *V) const
Sets the incoming value for VPBB to V.
iterator_range< mapped_iterator< detail::index_iterator, std::function< const VPBasicBlock *(size_t)> > > const_incoming_blocks_range
const_incoming_blocks_range incoming_blocks() const
Returns an iterator range over the incoming blocks.
~VPPredInstPHIRecipe() override=default
VPPredInstPHIRecipe * clone() override
Clone the current recipe.
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPPredInstPHIRecipe.
VPPredInstPHIRecipe(VPValue *PredV, DebugLoc DL)
Construct a VPPredInstPHIRecipe given PredInst whose value needs a phi nodes after merging back from ...
VPRecipeBase is a base class modeling a sequence of one or more output IR instructions.
bool mayReadFromMemory() const
Returns true if the recipe may read from memory.
bool mayReadOrWriteMemory() const
Returns true if the recipe may read from or write to memory.
virtual void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const =0
Each concrete VPRecipe prints itself, without printing common information, like debug info or metadat...
VPRegionBlock * getRegion()
enum { VPBranchOnMaskSC, VPDerivedIVSC, VPExpandSCEVSC, VPExpressionSC, VPIRInstructionSC, VPInstructionSC, VPInterleaveEVLSC, VPInterleaveSC, VPReductionEVLSC, VPReductionSC, VPReplicateSC, VPScalarIVStepsSC, VPVectorPointerSC, VPVectorEndPointerSC, VPWidenCallSC, VPWidenCanonicalIVSC, VPWidenCastSC, VPWidenGEPSC, VPWidenIntrinsicSC, VPWidenMemIntrinsicSC, VPWidenLoadEVLSC, VPWidenLoadSC, VPWidenStoreEVLSC, VPWidenStoreSC, VPWidenSC, VPBlendSC, VPHistogramSC, VPWidenPHISC, VPPredInstPHISC, VPCurrentIterationPHISC, VPActiveLaneMaskPHISC, VPFirstOrderRecurrencePHISC, VPWidenIntOrFpInductionSC, VPWidenPointerInductionSC, VPReductionPHISC, VPFirstPHISC=VPWidenPHISC, VPFirstHeaderPHISC=VPCurrentIterationPHISC, VPLastHeaderPHISC=VPReductionPHISC, VPLastPHISC=VPReductionPHISC, } VPRecipeTy
An enumeration for keeping track of the concrete subclass of VPRecipeBase that is actually instantiat...
void setDebugLoc(DebugLoc NewDL)
Set the recipe's debug location to NewDL.
bool mayWriteToMemory() const
Returns true if the recipe may write to memory.
~VPRecipeBase() override=default
VPBasicBlock * getParent()
DebugLoc getDebugLoc() const
Returns the debug location of the recipe.
virtual void execute(VPTransformState &State)=0
The method which generates the output IR instructions that correspond to this VPRecipe,...
void moveBefore(VPBasicBlock &BB, iplist< VPRecipeBase >::iterator I)
Unlink this recipe and insert into BB before I.
void insertBefore(VPRecipeBase *InsertPos)
Insert an unlinked recipe into a basic block immediately before the specified recipe.
void insertAfter(VPRecipeBase *InsertPos)
Insert an unlinked Recipe into a basic block immediately after the specified Recipe.
static bool classof(const VPDef *D)
Method to support type inquiry through isa, cast, and dyn_cast.
iplist< VPRecipeBase >::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
virtual VPRecipeBase * clone()=0
Clone the current recipe.
friend class VPBlockUtils
const VPBasicBlock * getParent() const
InstructionCost cost(ElementCount VF, VPCostContext &Ctx)
Return the cost of this recipe, taking into account if the cost computation should be skipped and the...
static bool classof(const VPUser *U)
void removeFromParent()
This method unlinks 'this' from the containing basic block, but does not delete it.
unsigned getVPRecipeID() const
void moveAfter(VPRecipeBase *MovePos)
Unlink this recipe from its current VPBasicBlock and insert it into the VPBasicBlock that MovePos liv...
VPRecipeBase(const unsigned char SC, ArrayRef< VPValue * > Operands, DebugLoc DL=DebugLoc::getUnknown())
Type * getScalarType() const
Returns the scalar type of this VPRecipeValue.
VPValue * getEVL() const
The VPValue of the explicit vector length.
VPReductionEVLRecipe(VPReductionRecipe &R, VPValue &EVL, VPValue *CondOp, DebugLoc DL=DebugLoc::getUnknown())
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the recipe only uses the first lane of operand Op.
VPReductionEVLRecipe * clone() override
Clone the current recipe.
~VPReductionEVLRecipe() override=default
bool isOrdered() const
Returns true, if the phi is part of an ordered reduction.
void setVFScaleFactor(unsigned ScaleFactor)
Set the VFScaleFactor for this reduction phi.
VPReductionPHIRecipe * clone() override
Clone the current recipe.
unsigned getVFScaleFactor() const
Get the factor that the VF of this recipe's output should be scaled by, or 1 if it isn't scaled.
~VPReductionPHIRecipe() override=default
bool hasUsesOutsideReductionChain() const
Returns true, if the phi is part of a multi-use reduction.
unsigned getNumIncoming() const override
Returns the number of incoming values, also number of incoming blocks.
VPReductionPHIRecipe(PHINode *Phi, RecurKind Kind, VPValue &Start, VPValue &BackedgeValue, ReductionStyle Style, const VPIRFlags &Flags, bool HasUsesOutsideReductionChain=false)
Create a new VPReductionPHIRecipe for the reduction Phi.
bool isInLoop() const
Returns true if the phi is part of an in-loop reduction.
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the recipe only uses the first lane of operand Op.
void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
void execute(VPTransformState &State) override
Generate the phi/select nodes.
VPReductionPHIRecipe * cloneWithOperands(VPValue *Start, VPValue *BackedgeValue)
bool isPartialReduction() const
Returns true if the reduction outputs a vector with a scaled down VF.
RecurKind getRecurrenceKind() const
Returns the recurrence kind of the reduction.
A recipe to represent inloop, ordered or partial reduction operations.
VPReductionRecipe(const unsigned char SC, RecurKind RdxKind, FastMathFlags FMFs, Instruction *I, ArrayRef< VPValue * > Operands, VPValue *CondOp, ReductionStyle Style, DebugLoc DL)
bool isConditional() const
Return true if the in-loop reduction is conditional.
static bool classof(const VPRecipeBase *R)
static bool classof(const VPSingleDefRecipe *R)
VPValue * getVecOp() const
The VPValue of the vector value to be reduced.
VPValue * getCondOp() const
The VPValue of the condition for the block.
RecurKind getRecurrenceKind() const
Return the recurrence kind for the in-loop reduction.
VPReductionRecipe(RecurKind RdxKind, FastMathFlags FMFs, Instruction *I, VPValue *ChainOp, VPValue *VecOp, VPValue *CondOp, ReductionStyle Style, DebugLoc DL=DebugLoc::getUnknown())
bool isOrdered() const
Return true if the in-loop reduction is ordered.
VPReductionRecipe(const RecurKind RdxKind, FastMathFlags FMFs, VPValue *ChainOp, VPValue *VecOp, VPValue *CondOp, ReductionStyle Style, DebugLoc DL=DebugLoc::getUnknown())
bool isPartialReduction() const
Returns true if the reduction outputs a vector with a scaled down VF.
~VPReductionRecipe() override=default
VPValue * getChainOp() const
The VPValue of the scalar Chain being accumulated.
bool isInLoop() const
Returns true if the reduction is in-loop.
VPReductionRecipe * clone() override
Clone the current recipe.
static bool classof(const VPUser *U)
static bool classof(const VPValue *VPV)
unsigned getVFScaleFactor() const
Get the factor that the VF of this recipe's output should be scaled by, or 1 if it isn't scaled.
VPRegionBlock represents a collection of VPBasicBlocks and VPRegionBlocks which form a Single-Entry-S...
const VPBlockBase * getEntry() const
bool isReplicator() const
An indicator whether this region is to generate multiple replicated instances of output IR correspond...
~VPRegionBlock() override=default
void setExiting(VPBlockBase *ExitingBlock)
Set ExitingBlock as the exiting VPBlockBase of this VPRegionBlock.
VPBlockBase * getExiting()
const VPRegionValue * getCanonicalIV() const
void setEntry(VPBlockBase *EntryBlock)
Set EntryBlock as the entry VPBlockBase of this VPRegionBlock.
Type * getCanonicalIVType() const
Return the type of the canonical IV for loop regions.
bool hasCanonicalIVNUW() const
Indicates if NUW is set for the canonical IV increment, for loop regions.
void clearCanonicalIVNUW(VPInstruction *Increment)
Unsets NUW for the canonical IV increment Increment, for loop regions.
VPRegionValue * getCanonicalIV()
Return the canonical induction variable of the region, null for replicating regions.
const VPBlockBase * getExiting() const
VPBasicBlock * getPreheaderVPBB()
Returns the pre-header VPBasicBlock of the loop region.
static bool classof(const VPBlockBase *V)
Method to support type inquiry through isa, cast, and dyn_cast.
VPValues defined by a VPRegionBlock, like the canonical IV.
VPReplicateRecipe replicates a given instruction producing multiple scalar copies of the original sca...
bool isSingleScalar() const
VPReplicateRecipe(Instruction *I, ArrayRef< VPValue * > Operands, bool IsSingleScalar, VPValue *Mask=nullptr, const VPIRFlags &Flags={}, VPIRMetadata Metadata={}, DebugLoc DL=DebugLoc::getUnknown())
~VPReplicateRecipe() override=default
static Type * computeScalarType(const Instruction *I, ArrayRef< VPValue * > Operands)
Compute the scalar result type for a VPReplicateRecipe wrapping I with Operands (excluding any predic...
VPReplicateRecipe * cloneWithOperands(ArrayRef< VPValue * > NewOperands)
bool usesScalars(const VPValue *Op) const override
Returns true if the recipe uses scalars of operand Op.
bool isPredicated() const
VPReplicateRecipe * clone() override
Clone the current recipe.
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the recipe only uses the first lane of operand Op.
unsigned getOpcode() const
VPValue * getMask()
Return the mask of a predicated VPReplicateRecipe.
Instruction::BinaryOps getInductionOpcode() const
VPValue * getStepValue() const
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPScalarIVStepsRecipe.
VPScalarIVStepsRecipe(const InductionDescriptor &IndDesc, VPValue *IV, VPValue *Step, VPValue *VF, DebugLoc DL=DebugLoc::getUnknown())
void setStartIndex(VPValue *StartIndex)
Set or add the StartIndex operand.
VPScalarIVStepsRecipe * clone() override
Clone the current recipe.
VPValue * getStartIndex() const
Return the StartIndex, or null if known to be zero, valid only after unrolling.
VPValue * getVFValue() const
Return the number of scalars to produce per unroll part, used to compute StartIndex during unrolling.
VPScalarIVStepsRecipe(VPValue *IV, VPValue *Step, VPValue *VF, Instruction::BinaryOps Opcode, FastMathFlags FMFs, DebugLoc DL)
~VPScalarIVStepsRecipe() override=default
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the recipe only uses the first lane of operand Op.
VPSingleDefRecipe is a base class for recipes that model a sequence of one or more output IR that def...
VPSingleDefRecipe(const unsigned char SC, ArrayRef< VPValue * > Operands, Value *UV, DebugLoc DL=DebugLoc::getUnknown())
static bool classof(const VPValue *V)
Instruction * getUnderlyingInstr()
Returns the underlying instruction.
static bool classof(const VPRecipeBase *R)
const Instruction * getUnderlyingInstr() const
VPSingleDefRecipe(const unsigned char SC, ArrayRef< VPValue * > Operands, Type *ResultTy, Value *UV=nullptr, DebugLoc DL=DebugLoc::getUnknown())
static bool classof(const VPUser *U)
LLVM_ABI_FOR_TEST LLVM_DUMP_METHOD void dump() const
Print this VPSingleDefRecipe to dbgs() (for debugging).
VPSingleDefRecipe * clone() override=0
Clone the current recipe.
VPSingleDefRecipe(const unsigned char SC, ArrayRef< VPValue * > Operands, DebugLoc DL=DebugLoc::getUnknown())
LLVM_ABI_FOR_TEST VPSingleDefValue(VPSingleDefRecipe *Def, Value *UV=nullptr, Type *Ty=nullptr)
Construct a VPSingleDefValue. Must only be used by VPSingleDefRecipe.
This class can be used to assign names to VPValues.
This class augments VPValue with operands which provide the inverse def-use edges from VPValue's user...
void printOperands(raw_ostream &O, VPSlotTracker &SlotTracker) const
Print the operands to O.
void setOperand(unsigned I, VPValue *New)
unsigned getNumOperands() const
operand_iterator op_end()
operand_iterator op_begin()
VPValue * getOperand(unsigned N) const
VPUser(ArrayRef< VPValue * > Operands)
iterator_range< const_operand_iterator > const_operand_range
iterator_range< operand_iterator > operand_range
This is the base class of the VPlan Def/Use graph, used for modeling the data flow into,...
Type * getScalarType() const
Returns the scalar type of this VPValue, dispatching based on the concrete subclass.
Value * getLiveInIRValue() const
Return the underlying IR value for a VPIRValue.
VPRecipeBase * getDefiningRecipe()
Returns the recipe defining this VPValue or nullptr if it is not defined by a recipe,...
Value * getUnderlyingValue() const
Return the underlying Value attached to this VPValue.
void setUnderlyingValue(Value *Val)
unsigned getNumUsers() const
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the VPUser only uses the first lane of operand Op.
VPValue * getVFValue() const
void execute(VPTransformState &State) override
The method which generates the output IR instructions that correspond to this VPRecipe,...
void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
Type * getSourceElementType() const
int64_t getStride() const
VPVectorEndPointerRecipe * clone() override
Clone the current recipe.
VPValue * getOffset() const
bool usesFirstPartOnly(const VPValue *Op) const override
Returns true if the recipe only uses the first part of operand Op.
VPVectorEndPointerRecipe(VPValue *Ptr, VPValue *VF, Type *SourceElementTy, int64_t Stride, GEPNoWrapFlags GEPFlags, DebugLoc DL)
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPVectorPointerRecipe.
VPValue * getPointer() const
void materializeOffset(unsigned Part=0)
Adds the offset operand to the recipe.
VPValue * getStride() const
Type * getSourceElementType() const
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the VPUser only uses the first lane of operand Op.
void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
void execute(VPTransformState &State) override
The method which generates the output IR instructions that correspond to this VPRecipe,...
bool usesFirstPartOnly(const VPValue *Op) const override
Returns true if the recipe only uses the first part of operand Op.
VPVectorPointerRecipe(VPValue *Ptr, Type *SourceElementTy, VPValue *Stride, GEPNoWrapFlags GEPFlags, DebugLoc DL)
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPHeaderPHIRecipe.
VPVectorPointerRecipe * clone() override
Clone the current recipe.
VPValue * getVFxPart() const
A recipe for widening Call instructions using library calls.
VPWidenCallRecipe(Value *UV, Function *Variant, ArrayRef< VPValue * > CallArguments, const VPIRFlags &Flags={}, const VPIRMetadata &Metadata={}, DebugLoc DL={})
const_operand_range args() const
VPWidenCallRecipe * clone() override
Clone the current recipe.
Function * getCalledScalarFunction() const
~VPWidenCallRecipe() override=default
VPWidenCanonicalIVRecipe(VPRegionValue *CanonicalIV, const VPIRFlags::WrapFlagsTy &Flags={false, false})
~VPWidenCanonicalIVRecipe() override=default
VPValue * getStepValue() const
void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPWidenCanonicalIVPHIRecipe.
VPRegionValue * getCanonicalIV() const
Return the canonical IV being widened.
VPWidenCanonicalIVRecipe * clone() override
Clone the current recipe.
void execute(VPTransformState &State) override
The method which generates the output IR instructions that correspond to this VPRecipe,...
VPWidenCastRecipe is a recipe to create vector cast instructions.
Instruction::CastOps getOpcode() const
LLVM_ABI_FOR_TEST void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
LLVM_ABI_FOR_TEST void execute(VPTransformState &State) override
Produce widened copies of the cast.
~VPWidenCastRecipe() override=default
LLVM_ABI_FOR_TEST InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPWidenCastRecipe.
VPWidenCastRecipe(Instruction::CastOps Opcode, VPValue *Op, Type *ResultTy, CastInst *CI=nullptr, const VPIRFlags &Flags={}, const VPIRMetadata &Metadata={}, DebugLoc DL=DebugLoc::getUnknown())
VPWidenCastRecipe * clone() override
Clone the current recipe.
unsigned getOpcode() const
This recipe generates a GEP instruction.
Type * getSourceElementType() const
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPWidenGEPRecipe.
VPWidenGEPRecipe * clone() override
Clone the current recipe.
~VPWidenGEPRecipe() override=default
VPWidenGEPRecipe(Type *SourceElementTy, ArrayRef< VPValue * > Operands, const VPIRFlags &Flags={}, DebugLoc DL=DebugLoc::getUnknown(), GetElementPtrInst *UV=nullptr)
void execute(VPTransformState &State) override=0
Generate the phi nodes.
ArrayRef< const SCEVPredicate * > getNoWrapPredicates() const
Returns the SCEV predicates associated with this induction.
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the recipe only uses the first lane of operand Op.
static bool classof(const VPValue *V)
void setStepValue(VPValue *V)
Update the step value of the recipe.
VPValue * getBackedgeValue() override
Returns the incoming value from the loop backedge.
VPIRValue * getStartValue() const
Returns the start value of the induction.
unsigned getNumIncoming() const override
Returns the number of incoming values, also number of incoming blocks.
PHINode * getPHINode() const
Returns the underlying PHINode if one exists, or null otherwise.
VPWidenInductionRecipe(unsigned char Kind, PHINode *IV, VPValue *Start, VPValue *Step, const InductionDescriptor &IndDesc, DebugLoc DL)
VPValue * getStepValue()
Returns the step value of the induction.
VPWidenInductionRecipe(unsigned char Kind, PHINode *IV, VPValue *Start, VPValue *Step, const InductionDescriptor &IndDesc, Type *ResultTy, DebugLoc DL)
const InductionDescriptor & getInductionDescriptor() const
Returns the induction descriptor for the recipe.
VPRecipeBase & getBackedgeRecipe() override
Returns the backedge value as a recipe.
static bool classof(const VPRecipeBase *R)
const VPValue * getVFValue() const
static bool classof(const VPSingleDefRecipe *R)
const VPValue * getStepValue() const
VPIRValue * getStartValue() const
Returns the start value of the induction.
const TruncInst * getTruncInst() const
void execute(VPTransformState &State) override
Generate the phi nodes.
~VPWidenIntOrFpInductionRecipe() override=default
VPValue * getSplatVFValue() const
If the recipe has been unrolled, return the VPValue for the induction increment, otherwise return nul...
VPWidenIntOrFpInductionRecipe * clone() override
Clone the current recipe.
VPWidenIntOrFpInductionRecipe(PHINode *IV, VPIRValue *Start, VPValue *Step, VPValue *VF, const InductionDescriptor &IndDesc, const VPIRFlags &Flags, DebugLoc DL)
TruncInst * getTruncInst()
Returns the first defined value as TruncInst, if it is one or nullptr otherwise.
VPWidenIntOrFpInductionRecipe(PHINode *IV, VPIRValue *Start, VPValue *Step, VPValue *VF, const InductionDescriptor &IndDesc, TruncInst *Trunc, const VPIRFlags &Flags, DebugLoc DL)
VPValue * getLastUnrolledPartOperand()
Returns the VPValue representing the value of this induction at the last unrolled part,...
unsigned getNumIncoming() const override
Returns the number of incoming values, also number of incoming blocks.
bool isCanonical() const
Returns true if the induction is canonical, i.e.
void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
A recipe for widening vector intrinsics.
VPWidenIntrinsicRecipe(Intrinsic::ID VectorIntrinsicID, ArrayRef< VPValue * > CallArguments, Type *Ty, const VPIRFlags &Flags={}, const VPIRMetadata &Metadata={}, DebugLoc DL=DebugLoc::getUnknown())
CallInst * createVectorCall(VPTransformState &State)
Helper function to produce the widened intrinsic call.
Intrinsic::ID getVectorIntrinsicID() const
Return the ID of the intrinsic.
LLVM_ABI_FOR_TEST void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
bool mayReadFromMemory() const
Returns true if the intrinsic may read from memory.
StringRef getIntrinsicName() const
Return to name of the intrinsic as string.
static InstructionCost computeCallCost(Intrinsic::ID ID, ArrayRef< const VPValue * > Operands, const VPRecipeWithIRFlags &R, ElementCount VF, VPCostContext &Ctx)
Compute the cost of a vector intrinsic with ID and Operands.
VPWidenIntrinsicRecipe(CallInst &CI, Intrinsic::ID VectorIntrinsicID, ArrayRef< VPValue * > CallArguments, Type *Ty, const VPIRFlags &Flags={}, const VPIRMetadata &MD={}, DebugLoc DL=DebugLoc::getUnknown())
bool mayHaveSideEffects() const
Returns true if the intrinsic may have side-effects.
static bool classof(const VPSingleDefRecipe *R)
static bool classof(const VPValue *V)
VPWidenIntrinsicRecipe * clone() override
Clone the current recipe.
VPWidenIntrinsicRecipe(const unsigned char SC, Intrinsic::ID VectorIntrinsicID, ArrayRef< VPValue * > CallArguments, Type *Ty, const VPIRFlags &Flags={}, const VPIRMetadata &MD={}, DebugLoc DL=DebugLoc::getUnknown())
bool mayWriteToMemory() const
Returns true if the intrinsic may write to memory.
~VPWidenIntrinsicRecipe() override=default
static bool classof(const VPRecipeBase *R)
LLVM_ABI_FOR_TEST bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the VPUser only uses the first lane of operand Op.
LLVM_ABI_FOR_TEST void execute(VPTransformState &State) override
Produce a widened version of the vector intrinsic.
LLVM_ABI_FOR_TEST InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this vector intrinsic.
static bool classof(const VPUser *U)
static InstructionCost computeMemIntrinsicCost(Intrinsic::ID IID, Type *Ty, bool IsMasked, Align Alignment, VPCostContext &Ctx)
Helper function for computing the cost of vector memory intrinsic.
void execute(VPTransformState &State) override
Produce a widened version of the vector memory intrinsic.
~VPWidenMemIntrinsicRecipe() override=default
VPWidenMemIntrinsicRecipe * clone() override
Clone the current recipe.
VPWidenMemIntrinsicRecipe(Intrinsic::ID VectorIntrinsicID, ArrayRef< VPValue * > CallArguments, Type *Ty, Align Alignment, const VPIRMetadata &MD={}, DebugLoc DL=DebugLoc::getUnknown())
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this vector memory intrinsic.
A common mixin class for widening memory operations.
bool IsMasked
Whether the memory access is masked.
bool isConsecutive() const
Return whether the loaded-from / stored-to addresses are consecutive.
virtual ~VPWidenMemoryRecipe()=default
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const
Return the cost of this VPWidenMemoryRecipe.
Instruction & getIngredient() const
bool Consecutive
Whether the accessed addresses are consecutive.
virtual const VPRecipeBase * getAsRecipe() const =0
VPValue * getMask() const
Return the mask used by this recipe.
Align Alignment
Alignment information for this memory access.
VPWidenMemoryRecipe(Instruction &I, bool Consecutive, const VPIRMetadata &Metadata)
virtual VPRecipeBase * getAsRecipe()=0
Return a VPRecipeBase* to the current object.
bool isMasked() const
Returns true if the recipe is masked.
void setMask(VPValue *Mask)
Align getAlign() const
Returns the alignment of the memory access.
VPValue * getAddr() const
Return the address accessed by this recipe.
A recipe for widened phis.
const VPRecipeBase * getAsRecipe() const override
Return a VPRecipeBase* to the current object.
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPWidenPHIRecipe.
VPWidenPHIRecipe * clone() override
Clone the current recipe.
void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
~VPWidenPHIRecipe() override=default
VPWidenPHIRecipe(ArrayRef< VPValue * > IncomingValues, DebugLoc DL=DebugLoc::getUnknown(), const Twine &Name="")
Create a new VPWidenPHIRecipe with incoming values IncomingValues, debug location DL and Name.
void execute(VPTransformState &State) override
Generate the phi/select nodes.
VPWidenPointerInductionRecipe * clone() override
Clone the current recipe.
~VPWidenPointerInductionRecipe() override=default
bool onlyScalarsGenerated(bool IsScalable)
Returns true if only scalar values will be generated.
void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
void execute(VPTransformState &State) override
Generate vector values for the pointer induction.
VPWidenPointerInductionRecipe(PHINode *Phi, VPValue *Start, VPValue *Step, VPValue *NumUnrolledElems, const InductionDescriptor &IndDesc, DebugLoc DL)
Create a new VPWidenPointerInductionRecipe for Phi with start value Start and the number of elements ...
VPWidenRecipe is a recipe for producing a widened instruction using the opcode and operands of the re...
VPWidenRecipe * clone() override
Clone the current recipe.
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the recipe only uses the first lane of operand Op.
VPWidenRecipe(Instruction &I, ArrayRef< VPValue * > Operands, const VPIRFlags &Flags={}, const VPIRMetadata &Metadata={}, DebugLoc DL={})
VPWidenRecipe(unsigned Opcode, ArrayRef< VPValue * > Operands, const VPIRFlags &Flags={}, const VPIRMetadata &Metadata={}, DebugLoc DL={})
~VPWidenRecipe() override=default
VPWidenRecipe * cloneWithOperands(ArrayRef< VPValue * > NewOperands)
unsigned getOpcode() const
VPlan models a candidate for vectorization, encoding various decisions take to produce efficient outp...
VPIRValue * getLiveIn(Value *V) const
Return the live-in VPIRValue for V, if there is one or nullptr otherwise.
LLVM_ABI_FOR_TEST void printDOT(raw_ostream &O) const
Print this VPlan in DOT format to O.
friend class VPSlotTracker
std::string getName() const
Return a string with the name of the plan and the applicable VFs and UFs.
bool hasVF(ElementCount VF) const
ElementCount getSingleVF() const
Returns the single VF of the plan, asserting that the plan has exactly one VF.
const DataLayout & getDataLayout() const
LLVMContext & getContext() const
VPBasicBlock * getEntry()
Type * getIndexType() const
The type of the canonical induction variable of the vector loop.
void setName(const Twine &newName)
bool hasScalableVF() const
VPValue * getTripCount() const
The trip count of the original loop.
VPValue * getOrCreateBackedgeTakenCount()
The backedge taken count of the original loop.
iterator_range< SmallSetVector< ElementCount, 2 >::iterator > vectorFactors() const
Returns an iterator range over all VFs of the plan.
VPIRBasicBlock * getExitBlock(BasicBlock *IRBB) const
Return the VPIRBasicBlock corresponding to IRBB.
LLVM_ABI_FOR_TEST ~VPlan()
VPIRValue * getOrAddLiveIn(VPIRValue *V)
bool isExitBlock(VPBlockBase *VPBB)
Returns true if VPBB is an exit block.
const VPBasicBlock * getEntry() const
friend class VPlanPrinter
VPIRValue * getFalse()
Return a VPIRValue wrapping i1 false.
VPIRValue * getConstantInt(const APInt &Val)
Return a VPIRValue wrapping a ConstantInt with the given APInt value.
VPSymbolicValue & getVFxUF()
Returns VF * UF of the vector loop region.
VPIRValue * getAllOnesValue(Type *Ty)
Return a VPIRValue wrapping the AllOnes value of type Ty.
VPRegionBlock * createReplicateRegion(VPBlockBase *Entry, VPBlockBase *Exiting, const std::string &Name="")
Create a new replicate region with Entry, Exiting and Name.
VPIRBasicBlock * createEmptyVPIRBasicBlock(BasicBlock *IRBB)
Create a VPIRBasicBlock wrapping IRBB, but do not create VPIRInstructions wrapping the instructions i...
auto getLiveIns() const
Return the list of live-in VPValues available in the VPlan.
bool hasUF(unsigned UF) const
ArrayRef< VPIRBasicBlock * > getExitBlocks() const
Return an ArrayRef containing VPIRBasicBlocks wrapping the exit blocks of the original scalar loop.
VPlan(BasicBlock *ScalarHeaderBB, Type *IdxTy)
Construct a VPlan with a new VPBasicBlock as entry, a VPIRBasicBlock wrapping ScalarHeaderBB and vect...
VPSymbolicValue & getVectorTripCount()
The vector trip count.
VPValue * getBackedgeTakenCount() const
VPIRValue * getOrAddLiveIn(Value *V)
Gets the live-in VPIRValue for V or adds a new live-in (if none exists yet) for V.
VPRegionBlock * createLoopRegion(Type *CanIVTy, DebugLoc DL, const std::string &Name="", VPBlockBase *Entry=nullptr, VPBlockBase *Exiting=nullptr)
Create a new loop region with a canonical IV using CanIVTy and DL.
VPIRValue * getZero(Type *Ty)
Return a VPIRValue wrapping the null value of type Ty.
void setVF(ElementCount VF)
bool isUnrolled() const
Returns true if the VPlan already has been unrolled, i.e.
LLVM_ABI_FOR_TEST VPRegionBlock * getVectorLoopRegion()
Returns the VPRegionBlock of the vector loop.
bool hasEarlyExit() const
Returns true if the VPlan is based on a loop with an early exit.
InstructionCost cost(ElementCount VF, VPCostContext &Ctx)
Return the cost of this plan.
LLVM_ABI_FOR_TEST bool isOuterLoop() const
Returns true if this VPlan is for an outer loop, i.e., its vector loop region contains a nested loop ...
unsigned getConcreteUF() const
Returns the concrete UF of the plan, after unrolling.
VPIRValue * getConstantInt(unsigned BitWidth, uint64_t Val, bool IsSigned=false)
Return a VPIRValue wrapping a ConstantInt with the given bitwidth and value.
const VPBasicBlock * getMiddleBlock() const
void setTripCount(VPValue *NewTripCount)
Set the trip count assuming it is currently null; if it is not - use resetTripCount().
void resetTripCount(VPValue *NewTripCount)
Resets the trip count for the VPlan.
VPBasicBlock * getMiddleBlock()
Returns the 'middle' block of the plan, that is the block that selects whether to execute the scalar ...
void setEntry(VPBasicBlock *VPBB)
VPBasicBlock * createVPBasicBlock(const Twine &Name, VPRecipeBase *Recipe=nullptr)
Create a new VPBasicBlock with Name and containing Recipe if present.
LLVM_ABI_FOR_TEST VPIRBasicBlock * createVPIRBasicBlock(BasicBlock *IRBB)
Create a VPIRBasicBlock from IRBB containing VPIRInstructions for all instructions in IRBB,...
void removeVF(ElementCount VF)
Remove VF from the plan.
VPIRValue * getTrue()
Return a VPIRValue wrapping i1 true.
VPBasicBlock * getVectorPreheader() const
Returns the preheader of the vector loop region, if one exists, or null otherwise.
LLVM_DUMP_METHOD void dump() const
Dump the plan to stderr (for debugging).
VPSymbolicValue & getUF()
Returns the UF of the vector loop region.
bool hasScalarVFOnly() const
VPBasicBlock * getScalarPreheader() const
Return the VPBasicBlock for the preheader of the scalar loop.
void execute(VPTransformState *State)
Generate the IR code for this VPlan.
LLVM_ABI_FOR_TEST void print(raw_ostream &O) const
Print this VPlan to O.
void addVF(ElementCount VF)
VPIRBasicBlock * getScalarHeader() const
Return the VPIRBasicBlock wrapping the header of the scalar loop.
void printLiveIns(raw_ostream &O) const
Print the live-ins of this VPlan to O.
VPSymbolicValue & getVF()
Returns the VF of the vector loop region.
const VPSymbolicValue & getVF() const
bool hasScalarTail() const
Returns true if the scalar tail may execute after the vector loop, i.e.
LLVM_ABI_FOR_TEST VPlan * duplicate()
Clone the current VPlan, update all VPValues of the new VPlan and cloned recipes to refer to the clon...
VPIRValue * getConstantInt(Type *Ty, uint64_t Val, bool IsSigned=false)
Return a VPIRValue wrapping a ConstantInt with the given type and value.
LLVM Value Representation.
ilist_node_with_parent()=default
Increasing range of size_t indices.
typename base_list_type::const_reverse_iterator const_reverse_iterator
typename base_list_type::reverse_iterator reverse_iterator
typename base_list_type::iterator iterator
typename base_list_type::const_iterator const_iterator
An intrusive list with ownership and callbacks specified/controlled by ilist_traits,...
A range adaptor for a pair of iterators.
This class implements an extremely fast bulk output stream that can only output to a stream.
This file defines classes to implement an intrusive doubly linked list class (i.e.
This file defines the ilist_node class template, which is a convenient base class for creating classe...
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
LLVM_ABI AttributeSet getFnAttributes(LLVMContext &C, ID id)
Return the function attributes for an intrinsic.
std::variant< std::monostate, Loc::Single, Loc::Multi, Loc::MMI, Loc::EntryValue > Variant
Alias for the std::variant specialization base class of DbgVariable.
CastInfo helper for casting from VPRecipeBase to a mixin class that is not part of the VPRecipeBase c...
This is an optimization pass for GlobalISel generic memory operations.
void dump(const SparseBitVector< ElementSize > &LHS, raw_ostream &out)
detail::zippy< detail::zip_shortest, T, U, Args... > zip(T &&t, U &&u, Args &&...args)
zip iterator for two or more iteratable types.
auto cast_if_present(const Y &Val)
cast_if_present<X> - Functionally identical to cast, except that a null value is accepted.
auto find(R &&Range, const T &Val)
Provide wrappers to std::find which take ranges instead of having to pass begin/end explicitly.
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
detail::zippy< detail::zip_first, T, U, Args... > zip_equal(T &&t, U &&u, Args &&...args)
zip iterator that assumes that all iteratees have the same length.
ReductionStyle getReductionStyle(bool InLoop, bool Ordered, unsigned ScaleFactor)
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
Type * toScalarizedTy(Type *Ty)
A helper for converting vectorized types to scalarized (non-vector) types.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
LLVM_ABI void getMetadataToPropagate(Instruction *Inst, SmallVectorImpl< std::pair< unsigned, MDNode * > > &Metadata)
Add metadata from Inst to Metadata, if it can be preserved after vectorization.
iterator_range< T > make_range(T x, T y)
Convenience function for iterating over sub-ranges.
auto cast_or_null(const Y &Val)
Align getLoadStoreAlignment(const Value *I)
A helper function that returns the alignment of load or store instruction.
MemoryEffectsBase< IRMemLocation > MemoryEffects
Summary of how a function affects memory in the program.
LLVM_ABI bool isSafeToSpeculativelyExecute(const Instruction *I, const Instruction *CtxI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr, const TargetLibraryInfo *TLI=nullptr, bool UseVariableInfo=true, bool IgnoreUBImplyingAttrs=true)
Return true if the instruction does not have any effects besides calculating the result and does not ...
auto map_range(ContainerTy &&C, FuncTy F)
Return a range that applies F to the elements of C.
auto dyn_cast_or_null(const Y &Val)
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
auto reverse(ContainerTy &&C)
UncountableExitStyle
Different methods of handling early exits.
@ MaskedHandleExitInScalarLoop
All memory operations other than the load(s) required to determine whether an uncountable exit occurr...
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
LLVM_ABI Type * computeScalarTypeForInstruction(unsigned Opcode, ArrayRef< VPValue * > Operands)
Compute the scalar result type for an IR Opcode given Operands.
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
auto drop_end(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the last N elements excluded.
RecurKind
These are the kinds of recurrences that we support.
@ Mul
Product of integers.
auto count(R &&Range, const E &Element)
Wrapper function around std::count to count the number of times an element Element occurs in the give...
DWARFExpression::Operation Op
raw_ostream & operator<<(raw_ostream &OS, const APFixedPoint &FX)
ArrayRef(const T &OneElt) -> ArrayRef< T >
constexpr unsigned BitWidth
auto count_if(R &&Range, UnaryPredicate P)
Wrapper function around std::count_if to count the number of times an element satisfying a given pred...
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
auto find_if(R &&Range, UnaryPredicate P)
Provide wrappers to std::find_if which take ranges instead of having to pass begin/end explicitly.
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
std::variant< RdxOrdered, RdxInLoop, RdxUnordered > ReductionStyle
auto seq(T Begin, T End)
Iterate over an integral type from Begin up to - but not including - End.
@ Increment
Incrementally increasing token ID.
std::unique_ptr< VPlan > VPlanPtr
Implement std::hash so that hash_code can be used in STL containers.
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
This struct is a compact representation of a valid (non-zero power of two) alignment.
static Bitfield::Type get(StorageType Packed)
Unpacks the field from the Packed value.
static void set(StorageType &Packed, typename Bitfield::Type Value)
Sets the typed value in the provided Packed value.
This struct provides a method for customizing the way a cast is performed.
Provides a cast trait that strips const from types to make it easier to implement a const-version of ...
This cast trait just provides the default implementation of doCastIfPossible to make CastInfo special...
Provides a cast trait that uses a defined pointer to pointer cast as a base for reference-to-referenc...
This reduction is in-loop.
Possible variants of a reduction.
This reduction is unordered with the partial result scaled down by some factor.
A MapVector that performs no allocations if smaller than a certain size.
An overlay on VPIRValue for VPValues that wrap a ConstantInt.
Struct to hold various analysis needed for cost computations.
void execute(VPTransformState &State) override
Generate the phi nodes.
VPFirstOrderRecurrencePHIRecipe * clone() override
Clone the current recipe.
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this first-order recurrence phi recipe.
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the recipe only uses the first lane of operand Op.
void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
VPFirstOrderRecurrencePHIRecipe(PHINode *Phi, VPValue &Start, VPValue &BackedgeValue)
DisjointFlagsTy(bool IsDisjoint)
NonNegFlagsTy(bool IsNonNeg)
TruncFlagsTy(bool HasNUW, bool HasNSW)
WrapFlagsTy(bool HasNUW, bool HasNSW)
An overlay for VPIRInstructions wrapping PHI nodes enabling convenient use cast/dyn_cast/isa and exec...
static bool classof(const VPRecipeBase *U)
static bool classof(const VPUser *U)
const VPRecipeBase * getAsRecipe() const override
Return a VPRecipeBase* to the current object.
A VPValue representing a live-in from the input IR or a constant.
static bool classof(const VPUser *U)
VPPhi * clone() override
Clone the current recipe.
const VPRecipeBase * getAsRecipe() const override
Return a VPRecipeBase* to the current object.
static bool classof(const VPSingleDefRecipe *SDR)
static bool classof(const VPValue *V)
VPPhi(ArrayRef< VPValue * > Operands, const VPIRFlags &Flags, DebugLoc DL, const Twine &Name="", Type *ResultTy=nullptr)
A pure-virtual common base class for recipes defining a single VPValue and using IR flags.
static bool classof(const VPSingleDefRecipe *R)
static bool classof(const VPRecipeBase *R)
InstructionCost getCostForRecipeWithOpcode(unsigned Opcode, ElementCount VF, VPCostContext &Ctx) const
Compute the cost for this recipe for VF, using Opcode and Ctx.
VPRecipeWithIRFlags(const unsigned char SC, ArrayRef< VPValue * > Operands, const VPIRFlags &Flags, DebugLoc DL=DebugLoc::getUnknown())
static bool classof(const VPValue *V)
void execute(VPTransformState &State) override=0
The method which generates the output IR instructions that correspond to this VPRecipe,...
VPRecipeWithIRFlags(const unsigned char SC, ArrayRef< VPValue * > Operands, Type *ResultTy, const VPIRFlags &Flags, DebugLoc DL=DebugLoc::getUnknown())
VPRecipeWithIRFlags * clone() override=0
Clone the current recipe.
static bool classof(const VPUser *U)
A symbolic live-in VPValue, used for values like vector trip count, VF, and VFxUF.
A recipe for widening load operations with vector-predication intrinsics, using the address to load f...
const VPRecipeBase * getAsRecipe() const override
LLVM_ABI_FOR_TEST void execute(VPTransformState &State) override
Generate the wide load or gather.
VPWidenLoadEVLRecipe * clone() override
Clone the current recipe.
LLVM_ABI_FOR_TEST void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
VPRecipeBase * getAsRecipe() override
Return a VPRecipeBase* to the current object.
LLVM_ABI_FOR_TEST InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPWidenLoadEVLRecipe.
VPValue * getEVL() const
Return the EVL operand.
VPWidenLoadEVLRecipe(VPWidenLoadRecipe &L, VPValue *Addr, VPValue &EVL, VPValue *Mask)
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the recipe only uses the first lane of operand Op.
A recipe for widening load operations, using the address to load from and an optional mask.
VPWidenLoadRecipe(LoadInst &Load, VPValue *Addr, VPValue *Mask, bool Consecutive, const VPIRMetadata &Metadata, DebugLoc DL)
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the recipe only uses the first lane of operand Op.
const VPRecipeBase * getAsRecipe() const override
void execute(VPTransformState &State) override
Generate a wide load or gather.
VPWidenLoadRecipe * clone() override
Clone the current recipe.
VP_CLASSOF_IMPL(VPRecipeBase::VPWidenLoadSC)
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPWidenLoadRecipe.
VPRecipeBase * getAsRecipe() override
Return a VPRecipeBase* to the current object.
A recipe for widening store operations with vector-predication intrinsics, using the value to store,...
VPValue * getStoredValue() const
Return the address accessed by this recipe.
LLVM_ABI_FOR_TEST void execute(VPTransformState &State) override
Generate the wide store or scatter.
VPWidenStoreEVLRecipe * clone() override
Clone the current recipe.
const VPRecipeBase * getAsRecipe() const override
VPWidenStoreEVLRecipe(VPWidenStoreRecipe &S, VPValue *Addr, VPValue *StoredVal, VPValue &EVL, VPValue *Mask)
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the recipe only uses the first lane of operand Op.
LLVM_ABI_FOR_TEST void printRecipe(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print the recipe.
LLVM_ABI_FOR_TEST InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPWidenStoreEVLRecipe.
VPRecipeBase * getAsRecipe() override
Return a VPRecipeBase* to the current object.
VPValue * getEVL() const
Return the EVL operand.
A recipe for widening store operations, using the stored value, the address to store to and an option...
VPRecipeBase * getAsRecipe() override
Return a VPRecipeBase* to the current object.
VPWidenStoreRecipe(StoreInst &Store, VPValue *Addr, VPValue *StoredVal, VPValue *Mask, bool Consecutive, const VPIRMetadata &Metadata, DebugLoc DL)
VP_CLASSOF_IMPL(VPRecipeBase::VPWidenStoreSC)
VPValue * getStoredValue() const
Return the value stored by this recipe.
VPWidenStoreRecipe * clone() override
Clone the current recipe.
const VPRecipeBase * getAsRecipe() const override
InstructionCost computeCost(ElementCount VF, VPCostContext &Ctx) const override
Return the cost of this VPWidenStoreRecipe.
bool usesFirstLaneOnly(const VPValue *Op) const override
Returns true if the recipe only uses the first lane of operand Op.
static VPMixin * castFailed()
static bool isPossible(VPRecipeBase *R)
Used by isa.
static VPMixin * doCast(VPRecipeBase *R)
Used by cast.