39#define LV_NAME "loop-vectorize"
40#define DEBUG_TYPE LV_NAME
44 cl::desc(
"Enable if-conversion during vectorization."));
48 cl::desc(
"Enable recognition of non-constant strided "
49 "pointer induction variables."));
53 cl::desc(
"Allow enabling loop hints to reorder "
54 "FP operations during vectorization."));
60 cl::desc(
"Control whether the compiler can use scalable vectors to "
64 "Scalable vectorization is disabled."),
67 "Scalable vectorization is available and favored when the "
68 "cost is inconclusive."),
71 "Scalable vectorization is available and favored when the "
72 "cost is inconclusive."),
75 "Scalable vectorization is available and always favored when "
80 cl::desc(
"Enables autovectorization of some loops containing histograms"));
87bool LoopVectorizeHints::Hint::validate(
unsigned Val) {
98 return (Val == 0 || Val == 1);
104 bool InterleaveOnlyWhenForced,
108 Interleave(
"interleave.count", InterleaveOnlyWhenForced, HK_INTERLEAVE),
110 IsVectorized(
"isvectorized", 0, HK_ISVECTORIZED),
111 Predicate(
"vectorize.predicate.enable",
FK_Undefined, HK_PREDICATE),
112 Scalable(
"vectorize.scalable.enable",
SK_Unspecified, HK_SCALABLE),
113 TheLoop(L), ORE(ORE) {
115 getHintsFromMetadata();
149 if (IsVectorized.Value != 1)
156 <<
"LV: Interleaving disabled by the pass manager\n");
160 TheLoop->addIntLoopAttribute(
"llvm.loop.isvectorized", 1,
161 {
Twine(Prefix(),
"vectorize.").
str(),
162 Twine(Prefix(),
"interleave.").
str()});
165 IsVectorized.Value = 1;
168void LoopVectorizeHints::reportDisallowedVectorization(
171 LLVM_DEBUG(
dbgs() <<
"LV: Not vectorizing: " << DebugMsg <<
".\n");
174 <<
"loop not vectorized: " << RemarkMsg);
181 reportDisallowedVectorization(
"#pragma vectorize disable",
182 "MissedExplicitlyDisabled",
183 "vectorization is explicitly disabled", L);
185 reportDisallowedVectorization(
"loop hasDisableAllTransformsHint",
186 "MissedTransformsDisabled",
187 "loop transformations are disabled", L);
195 reportDisallowedVectorization(
196 "VectorizeOnlyWhenForced is set, and no #pragma vectorize enable",
197 "MissedForceOnly",
"only vectorizing loops that explicitly request it",
203 LLVM_DEBUG(
dbgs() <<
"LV: Not vectorizing: Disabled/already vectorized.\n");
209 L->getStartLoc(), L->getHeader())
210 <<
"loop not vectorized: vectorization and interleaving are "
211 "explicitly disabled, or the loop has already been "
226 TheLoop->getStartLoc(),
227 TheLoop->getHeader())
228 <<
"loop not vectorized: vectorization is explicitly disabled";
231 TheLoop->getHeader());
232 R <<
"loop not vectorized";
234 R <<
" (Force=" << NV(
"Force",
true);
235 if (Width.Value != 0)
236 R <<
", Vector Width=" << NV(
"VectorWidth",
getWidth());
238 R <<
", Interleave Count=" << NV(
"InterleaveCount",
getInterleave());
251 EC.getKnownMinValue() > 1);
254void LoopVectorizeHints::getHintsFromMetadata() {
270 if (!MD || MD->getNumOperands() == 0)
273 for (
unsigned Idx = 1; Idx < MD->getNumOperands(); ++Idx)
274 Args.push_back(MD->getOperand(Idx));
277 assert(Args.size() == 0 &&
"too many arguments for MDString");
285 if (
Args.size() == 1)
286 setHint(Name, Args[0]);
291 if (!
Name.consume_front(Prefix()))
297 unsigned Val =
C->getZExtValue();
299 Hint *Hints[] = {&Width, &Interleave, &Force,
300 &IsVectorized, &Predicate, &Scalable};
301 for (
auto *
H : Hints) {
302 if (Name ==
H->Name) {
303 if (
H->validate(Val))
306 LLVM_DEBUG(
dbgs() <<
"LV: ignoring invalid hint '" << Name <<
"'\n");
362 dbgs() <<
"LV: Loop latch condition is not a compare instruction.\n");
366 Value *CondOp0 = LatchCmp->getOperand(0);
367 Value *CondOp1 = LatchCmp->getOperand(1);
368 Value *IVUpdate =
IV->getIncomingValueForBlock(Latch);
371 LLVM_DEBUG(
dbgs() <<
"LV: Loop latch condition is not uniform.\n");
385 for (
Loop *SubLp : *Lp)
393 assert(Ty->isIntOrPtrTy() &&
"Expected integer or pointer type");
395 if (Ty->isPointerTy())
396 return DL.getIntPtrType(Ty->getContext(), Ty->getPointerAddressSpace());
400 if (Ty->getScalarSizeInBits() < 32)
421 Value *APtr =
A->getPointerOperand();
422 Value *BPtr =
B->getPointerOperand();
431 if (!AllowRuntimeSCEVChecks || !TheLoop->isInnermost())
448 const auto &Strides = LAI && AllowRuntimeSCEVChecks
449 ? LAI->getSymbolicStrides()
451 int Stride =
getPtrStride(PSE, AccessTy, Ptr, TheLoop, *DT, Strides,
452 AllowRuntimeSCEVChecks,
false)
454 if (Stride == 1 || Stride == -1)
460 return LAI->isInvariant(V);
470class SCEVAddRecForUniformityRewriter
473 unsigned StepMultiplier;
482 bool CannotAnalyze =
false;
484 bool canAnalyze()
const {
return !CannotAnalyze; }
487 SCEVAddRecForUniformityRewriter(
ScalarEvolution &SE,
unsigned StepMultiplier,
492 const SCEV *visitAddRecExpr(
const SCEVAddRecExpr *Expr) {
494 "addrec outside of TheLoop must be invariant and should have been "
500 if (!SE.isLoopInvariant(Step, TheLoop)) {
501 CannotAnalyze =
true;
504 const SCEV *NewStep =
505 SE.getMulExpr(Step, SE.getConstant(Ty, StepMultiplier));
506 const SCEV *ScaledOffset = SE.getMulExpr(Step, SE.getConstant(Ty, Offset));
507 const SCEV *NewStart =
512 const SCEV *
visit(
const SCEV *S) {
513 if (CannotAnalyze || SE.isLoopInvariant(S, TheLoop))
518 const SCEV *visitUnknown(
const SCEVUnknown *S) {
519 if (SE.isLoopInvariant(S, TheLoop))
522 CannotAnalyze =
true;
526 const SCEV *visitCouldNotCompute(
const SCEVCouldNotCompute *S) {
528 CannotAnalyze =
true;
532 static const SCEV *rewrite(
const SCEV *S, ScalarEvolution &SE,
533 unsigned StepMultiplier,
unsigned Offset,
543 SCEVAddRecForUniformityRewriter
Rewriter(SE, StepMultiplier, Offset,
556 Value *V, std::optional<ElementCount> VF)
const {
559 if (!VF || VF->isScalable())
566 auto *SE = PSE.getSE();
573 unsigned FixedVF = VF->getKnownMinValue();
574 const SCEV *FirstLaneExpr =
575 SCEVAddRecForUniformityRewriter::rewrite(S, *SE, FixedVF, 0, TheLoop);
583 const SCEV *IthLaneExpr =
584 SCEVAddRecForUniformityRewriter::rewrite(S, *SE, FixedVF,
I, TheLoop);
585 return FirstLaneExpr == IthLaneExpr;
601bool LoopVectorizationLegality::canVectorizeOuterLoop() {
614 "Unsupported basic block terminator",
615 "loop control flow is not understood by vectorizer",
616 "CFGNotUnderstood", ORE, TheLoop);
634 "Unsupported conditional branch",
635 "loop control flow is not understood by vectorizer",
636 "CFGNotUnderstood", ORE, TheLoop);
649 "Outer loop contains divergent loops",
650 "loop control flow is not understood by vectorizer",
"CFGNotUnderstood",
659 if (!setupOuterLoopInductions()) {
661 "UnsupportedPhi", ORE, TheLoop);
671void LoopVectorizationLegality::addInductionPhi(
PHINode *Phi,
673 Inductions[
Phi] =
ID;
681 InductionCastsToIgnore.insert(*Casts.
begin());
684 const DataLayout &
DL =
Phi->getDataLayout();
687 "Expected int, ptr, or FP induction phi type");
699 ID.getConstIntStepValue() &&
ID.getConstIntStepValue()->isOne() &&
707 if (!PrimaryInduction || PhiTy == WidestIndTy)
708 PrimaryInduction =
Phi;
714bool LoopVectorizationLegality::setupOuterLoopInductions() {
718 auto IsSupportedPhi = [&](PHINode &
Phi) ->
bool {
719 InductionDescriptor
ID;
722 addInductionPhi(&Phi,
ID);
728 dbgs() <<
"LV: Found unsupported PHI for outer loop vectorization.\n");
751 TLI.
getWidestVF(ScalarName, WidestFixedVF, WidestScalableVF);
759 "Caller may decide to scalarize a variant using a scalable VF");
764bool LoopVectorizationLegality::canVectorizeInstrs() {
772 Result &= canVectorizeInstr(
I);
773 if (!DoExtraAnalysis && !Result)
778 if (!PrimaryInduction) {
779 if (Inductions.empty()) {
781 "Did not find one integer induction var",
782 "loop induction variable could not be identified",
783 "NoInductionVariable", ORE, TheLoop);
788 "Did not find one integer induction var",
789 "integer loop induction variable could not be identified",
790 "NoIntegerInductionVariable", ORE, TheLoop);
793 LLVM_DEBUG(
dbgs() <<
"LV: Did not find one integer induction var.\n");
799 if (PrimaryInduction && WidestIndTy != PrimaryInduction->getType())
800 PrimaryInduction =
nullptr;
805bool LoopVectorizationLegality::canVectorizeInstr(
Instruction &
I) {
815 "Found a non-int non-pointer PHI",
816 "loop control flow is not understood by vectorizer",
817 "CFGNotUnderstood", ORE, TheLoop);
832 if (
Phi->getNumIncomingValues() != 2) {
834 "Found an invalid PHI",
835 "loop control flow is not understood by vectorizer",
836 "CFGNotUnderstood", ORE, TheLoop, Phi);
840 RecurrenceDescriptor RedDes;
844 Reductions[
Phi] = std::move(RedDes);
848 "Only min/max recurrences are allowed to have multiple uses "
857 auto IsDisallowedStridedPointerInduction =
858 [](
const InductionDescriptor &
ID) {
862 ID.getConstIntStepValue() ==
nullptr;
865 InductionDescriptor
ID;
867 !IsDisallowedStridedPointerInduction(
ID)) {
868 addInductionPhi(Phi,
ID);
869 Requirements->addExactFPMathInst(
ID.getExactFPMathInst());
874 FixedOrderRecurrences.insert(Phi);
881 !IsDisallowedStridedPointerInduction(
ID)) {
882 addInductionPhi(Phi,
ID);
887 "value that could not be identified as "
888 "reduction is used outside the loop",
889 "NonReductionValueUsedOutsideLoop", ORE, TheLoop,
900 !(CI->getCalledFunction() && TLI &&
906 TLI && CI->getCalledFunction() && CI->getType()->isFloatingPointTy() &&
907 TLI->getLibFunc(CI->getCalledFunction()->getName(), Func) &&
908 TLI->hasOptimizedCodeGen(Func);
916 "Found a non-intrinsic callsite",
917 "library call cannot be vectorized. "
918 "Try compiling with -fno-math-errno, -ffast-math, "
920 "CantVectorizeLibcall", ORE, TheLoop, CI);
923 "call instruction cannot be vectorized",
924 "CantVectorizeLibcall", ORE, TheLoop, CI);
932 auto *SE = PSE.getSE();
934 for (
unsigned Idx = 0; Idx < CI->arg_size(); ++Idx)
938 "Found unvectorizable intrinsic",
939 "intrinsic instruction cannot be vectorized",
940 "CantVectorizeIntrinsic", ORE, TheLoop, CI);
949 VecCallVariantsFound =
true;
951 auto CanWidenInstructionTy = [](
Instruction const &Inst) {
952 Type *InstTy = Inst.getType();
966 if (!CanWidenInstructionTy(
I) ||
971 "instruction return type cannot be vectorized",
972 "CantVectorizeInstructionReturnType", ORE,
979 Type *
T =
ST->getValueOperand()->getType();
982 "CantVectorizeStore", ORE, TheLoop, ST);
988 if (
ST->getMetadata(LLVMContext::MD_nontemporal)) {
991 assert(VecTy &&
"did not find vectorized version of stored type");
992 if (!TTI->isLegalNTStore(VecTy,
ST->getAlign())) {
994 "nontemporal store instruction cannot be vectorized",
995 "CantVectorizeNontemporalStore", ORE, TheLoop, ST);
1001 if (
LD->getMetadata(LLVMContext::MD_nontemporal)) {
1005 assert(VecTy &&
"did not find vectorized version of load type");
1006 if (!TTI->isLegalNTLoad(VecTy,
LD->getAlign())) {
1008 "nontemporal load instruction cannot be vectorized",
1009 "CantVectorizeNontemporalLoad", ORE, TheLoop, LD);
1019 }
else if (
I.getType()->isFloatingPointTy() && (CI ||
I.isBinaryOp()) &&
1022 Hints->setPotentiallyUnsafe();
1055 Value *HIncVal =
nullptr;
1070 Value *HIdx =
nullptr;
1071 for (
Value *Index :
GEP->indices()) {
1094 if (!AR || AR->getLoop() != TheLoop)
1104 LLVM_DEBUG(
dbgs() <<
"LV: Found histogram for: " << *HSt <<
"\n");
1111bool LoopVectorizationLegality::canVectorizeIndirectUnsafeDependences() {
1151 LLVM_DEBUG(
dbgs() <<
"LV: Checking for a histogram on: " << *SI <<
"\n");
1152 return findHistogram(LI, SI, TheLoop, LAI->getPSE(), Histograms);
1155bool LoopVectorizationLegality::canVectorizeMemory() {
1156 LAI = &LAIs.getInfo(*TheLoop);
1157 const OptimizationRemarkAnalysis *LAR = LAI->getReport();
1160 return OptimizationRemarkAnalysis(
LV_NAME,
"loop not vectorized: ", *LAR);
1164 if (!LAI->canVectorizeMemory()) {
1167 "Cannot vectorize unsafe dependencies in uncountable exit loop with "
1169 "CantVectorizeUnsafeDependencyForEELoopWithSideEffects", ORE,
1174 return canVectorizeIndirectUnsafeDependences();
1177 if (LAI->hasLoadStoreDependenceInvolvingLoopInvariantAddress()) {
1179 "write to a loop invariant address could not "
1181 "CantVectorizeStoreToLoopInvariantAddress", ORE,
1190 if (!LAI->getStoresToInvariantAddresses().empty()) {
1193 for (StoreInst *SI : LAI->getStoresToInvariantAddresses()) {
1199 "We don't allow storing to uniform addresses",
1200 "write of conditional recurring variant value to a loop "
1201 "invariant address could not be vectorized",
1202 "CantVectorizeStoreToLoopInvariantAddress", ORE, TheLoop);
1210 if (TheLoop->contains(Ptr)) {
1212 "Invariant address is calculated inside the loop",
1213 "write to a loop invariant address could not "
1215 "CantVectorizeStoreToLoopInvariantAddress", ORE, TheLoop);
1221 if (LAI->hasStoreStoreDependenceInvolvingLoopInvariantAddress()) {
1227 ScalarEvolution *SE = PSE.getSE();
1229 for (StoreInst *SI : LAI->getStoresToInvariantAddresses()) {
1241 erase_if(UnhandledStores, [SE, SI](StoreInst *
I) {
1243 I->getValueOperand()->getType() ==
1244 SI->getValueOperand()->getType();
1251 bool IsOK = UnhandledStores.
empty();
1255 "We don't allow storing to uniform addresses",
1256 "write to a loop invariant address could not "
1258 "CantVectorizeStoreToLoopInvariantAddress", ORE, TheLoop);
1264 PSE.addPredicate(LAI->getPSE().getPredicate());
1269 bool EnableStrictReductions) {
1272 if (!Requirements->getExactFPInst() || Hints->allowReordering())
1278 if (!EnableStrictReductions ||
1309 return V == InvariantAddress ||
1320 return Inductions.count(PN);
1345 const Value *V)
const {
1347 return (Inst && InductionCastsToIgnore.count(Inst));
1356 return FixedOrderRecurrences.count(Phi);
1371bool LoopVectorizationLegality::blockCanBePredicated(
1400 if (!SafePtrs.
count(LI->getPointerOperand()))
1415 if (
I.mayReadFromMemory() ||
I.mayWriteToMemory() ||
I.mayThrow())
1422bool LoopVectorizationLegality::canVectorizeWithIfConvert() {
1425 "IfConversionDisabled", ORE, TheLoop);
1429 assert(TheLoop->getNumBlocks() > 1 &&
"Single block loops are vectorizable");
1436 SmallPtrSet<Value *, 8> SafePointers;
1439 for (BasicBlock *BB : TheLoop->blocks()) {
1441 for (Instruction &
I : *BB)
1443 SafePointers.
insert(Ptr);
1452 ScalarEvolution &SE = *PSE.getSE();
1454 for (Instruction &
I : *BB) {
1464 auto CanSpeculatePointerOp = [
this](
Value *Ptr) {
1466 SmallPtrSet<Value *, 4> Visited;
1467 while (!Worklist.
empty()) {
1469 if (!Visited.
insert(CurrV).second)
1473 if (!CurrI || !TheLoop->contains(CurrI)) {
1477 TheLoop->getLoopPredecessor()
1501 CanSpeculatePointerOp(LI->getPointerOperand()) &&
1504 SafePointers.
insert(LI->getPointerOperand());
1510 for (BasicBlock *BB : TheLoop->blocks()) {
1514 if (TheLoop->isLoopExiting(BB)) {
1516 "LoopContainsUnsupportedSwitch", ORE,
1517 TheLoop, BB->getTerminator());
1522 "LoopContainsUnsupportedTerminator", ORE,
1523 TheLoop, BB->getTerminator());
1529 !blockCanBePredicated(BB, SafePointers, ConditionallyExecutedOps)) {
1531 "Control flow cannot be substituted for a select",
"NoCFGForSelect",
1532 ORE, TheLoop, BB->getTerminator());
1542bool LoopVectorizationLegality::canVectorizeLoopCFG(
Loop *Lp,
1543 bool UseVPlanNativePath) {
1545 "VPlan-native path is not enabled.");
1555 bool DoExtraAnalysis = ORE->allowExtraAnalysis(
DEBUG_TYPE);
1561 "Loop doesn't have a legal pre-header",
1562 "loop control flow is not understood by vectorizer",
"CFGNotUnderstood",
1564 if (DoExtraAnalysis)
1573 "The loop must have a single backedge",
1574 "loop control flow is not understood by vectorizer",
"CFGNotUnderstood",
1576 if (DoExtraAnalysis)
1586 "The loop latch terminator is not a UncondBrInst/CondBrInst",
1587 "loop control flow is not understood by vectorizer",
"CFGNotUnderstood",
1589 if (DoExtraAnalysis)
1598bool LoopVectorizationLegality::canVectorizeLoopNestCFG(
1599 Loop *Lp,
bool UseVPlanNativePath) {
1603 bool DoExtraAnalysis = ORE->allowExtraAnalysis(
DEBUG_TYPE);
1604 if (!canVectorizeLoopCFG(Lp, UseVPlanNativePath)) {
1605 if (DoExtraAnalysis)
1613 for (Loop *SubLp : *Lp)
1614 if (!canVectorizeLoopNestCFG(SubLp, UseVPlanNativePath)) {
1615 if (DoExtraAnalysis)
1624bool LoopVectorizationLegality::isVectorizableEarlyExitLoop() {
1625 BasicBlock *LatchBB = TheLoop->getLoopLatch();
1628 "Cannot vectorize early exit loop",
1629 "NoLatchEarlyExit", ORE, TheLoop);
1633 if (Reductions.size() || FixedOrderRecurrences.size()) {
1635 "Found reductions or recurrences in early-exit loop",
1636 "Cannot vectorize early exit loop with reductions or recurrences",
1637 "RecurrencesInEarlyExitLoop", ORE, TheLoop);
1641 SmallVector<BasicBlock *, 8> ExitingBlocks;
1642 TheLoop->getExitingBlocks(ExitingBlocks);
1647 for (BasicBlock *BB : ExitingBlocks) {
1649 PSE.getSE()->getPredicatedExitCount(TheLoop, BB, &Predicates);
1653 "Early exiting block does not have exactly two successors",
1654 "Incorrect number of successors from early exiting block",
1655 "EarlyExitTooManySuccessors", ORE, TheLoop);
1661 CountableExitingBlocks.push_back(BB);
1669 if (UncountableExitingBlocks.
empty()) {
1670 LLVM_DEBUG(
dbgs() <<
"LV: Could not find any uncountable exits");
1676 PSE.getSE()->getPredicatedExitCount(TheLoop, LatchBB, &Predicates))) {
1678 "Cannot determine exact exit count for latch block",
1679 "Cannot vectorize early exit loop",
1680 "UnknownLatchExitCountEarlyExitLoop", ORE, TheLoop);
1684 "Latch block not found in list of countable exits!");
1689 switch (
I->getOpcode()) {
1690 case Instruction::Load:
1691 case Instruction::Store:
1692 case Instruction::PHI:
1693 case Instruction::UncondBr:
1694 case Instruction::CondBr:
1702 bool HasSideEffects =
false;
1703 for (
auto *BB : TheLoop->blocks())
1704 for (
auto &
I : *BB) {
1705 if (
I.mayWriteToMemory()) {
1707 HasSideEffects =
true;
1713 "Complex writes to memory unsupported in early exit loops",
1714 "Cannot vectorize early exit loop with complex writes to memory",
1715 "WritesInEarlyExitLoop", ORE, TheLoop);
1719 if (!IsSafeOperation(&
I)) {
1721 "cannot be speculatively executed",
1722 "UnsafeOperationsEarlyExitLoop", ORE,
1730 if (!HasSideEffects) {
1736 "Loop may fault",
"Cannot vectorize non-read-only early exit loop",
1737 "NonReadOnlyEarlyExitLoop", ORE, TheLoop);
1742 for (BasicBlock *ExitingBB : UncountableExitingBlocks) {
1743 if (!canUncountableExitConditionLoadBeMoved(ExitingBB))
1749 for (LoadInst *LI : NonDerefLoads) {
1754 "Loop contains potentially faulting strided load",
1755 "Cannot vectorize early exit loop with "
1756 "strided fault-only-first load",
1757 "EarlyExitLoopWithStridedFaultOnlyFirstLoad", ORE, TheLoop);
1762 [[maybe_unused]]
const SCEV *SymbolicMaxBTC =
1763 PSE.getSymbolicMaxBackedgeTakenCount();
1767 "Failed to get symbolic expression for backedge taken count");
1768 LLVM_DEBUG(
dbgs() <<
"LV: Found an early exit loop with symbolic max "
1769 "backedge taken count: "
1770 << *SymbolicMaxBTC <<
'\n');
1776bool LoopVectorizationLegality::canUncountableExitConditionLoadBeMoved(
1787 using namespace llvm::PatternMatch;
1789 Value *Ptr =
nullptr;
1791 if (!
match(Br->getCondition(),
1795 "Early exit loop with store but no supported condition load",
1796 "NoConditionLoadForEarlyExitLoop", ORE, TheLoop);
1801 if (!TheLoop->isLoopInvariant(R)) {
1803 "Early exit loop with store but no supported condition load",
1804 "NoConditionLoadForEarlyExitLoop", ORE, TheLoop);
1811 if (!AR || AR->getLoop() != TheLoop || !AR->isAffine()) {
1813 "Uncountable exit condition depends on load with an address that is "
1814 "not an add recurrence in the loop",
1815 "EarlyExitLoadInvariantAddress", ORE, TheLoop);
1819 ICFLoopSafetyInfo SafetyInfo;
1826 "Load for uncountable exit not guaranteed to execute",
1827 "ConditionalUncountableExitLoad", ORE, TheLoop);
1834 for (
auto *BB : TheLoop->blocks()) {
1835 for (
auto &
I : *BB) {
1839 if (
I.mayWriteToMemory()) {
1841 AliasResult AR = AA->alias(Ptr,
SI->getPointerOperand());
1847 "Cannot determine whether critical uncountable exit load address "
1848 "does not alias with a memory write",
1849 "CantVectorizeAliasWithCriticalUncountableExitLoad", ORE, TheLoop);
1863 bool DoExtraAnalysis = ORE->allowExtraAnalysis(
DEBUG_TYPE);
1866 if (!canVectorizeLoopNestCFG(TheLoop, UseVPlanNativePath)) {
1867 if (DoExtraAnalysis) {
1876 LLVM_DEBUG(
dbgs() <<
"LV: Found a loop: " << TheLoop->getHeader()->getName()
1881 if (!TheLoop->isInnermost()) {
1882 assert(UseVPlanNativePath &&
"VPlan-native path is not enabled.");
1884 if (!canVectorizeOuterLoop()) {
1886 "UnsupportedOuterLoop", ORE, TheLoop);
1896 assert(TheLoop->isInnermost() &&
"Inner loop expected.");
1898 unsigned NumBlocks = TheLoop->getNumBlocks();
1899 if (NumBlocks != 1 && !canVectorizeWithIfConvert()) {
1901 if (DoExtraAnalysis)
1908 if (!canVectorizeInstrs()) {
1909 LLVM_DEBUG(
dbgs() <<
"LV: Can't vectorize the instructions or CFG\n");
1910 if (DoExtraAnalysis)
1917 if (TheLoop->getExitingBlock()) {
1919 "UnsupportedUncountableLoop", ORE, TheLoop);
1920 if (DoExtraAnalysis)
1925 if (!isVectorizableEarlyExitLoop()) {
1927 "Must be false without vectorizable early-exit loop");
1928 if (DoExtraAnalysis)
1937 if (!canVectorizeMemory()) {
1938 LLVM_DEBUG(
dbgs() <<
"LV: Can't vectorize due to memory conflicts\n");
1939 if (DoExtraAnalysis)
1948 "Writes to memory unsupported in early exit loops",
1949 "Cannot vectorize early exit loop with writes to memory",
1950 "WritesInEarlyExitLoop", ORE, TheLoop);
1956 << (LAI->getRuntimePointerChecking()->Need
1957 ?
" (with a runtime bound check)"
1974 if (TheLoop->getExitingBlock() != TheLoop->getLoopLatch()) {
1977 <<
"LV: Cannot fold tail by masking. Requires a singe latch exit\n");
1981 LLVM_DEBUG(
dbgs() <<
"LV: checking if tail can be folded by masking.\n");
1990 if (!blockCanBePredicated(BB, SafePointers, TmpMaskedOp)) {
2009 [[maybe_unused]]
bool R =
2010 blockCanBePredicated(BB, SafePointers, TailFoldedMaskedOp);
2011 assert(R &&
"Must be able to predicate block when tail-folding.");
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
#define clEnumValN(ENUMVAL, FLAGNAME, DESC)
static cl::opt< bool > HintsAllowReordering("hints-allow-reordering", cl::init(true), cl::Hidden, cl::desc("Allow enabling loop hints to reorder " "FP operations during vectorization."))
static const unsigned MaxInterleaveFactor
Maximum vectorization interleave count.
static cl::opt< bool > AllowStridedPointerIVs("lv-strided-pointer-ivs", cl::init(false), cl::Hidden, cl::desc("Enable recognition of non-constant strided " "pointer induction variables."))
static cl::opt< LoopVectorizeHints::ScalableForceKind > ForceScalableVectorization("scalable-vectorization", cl::init(LoopVectorizeHints::SK_Unspecified), cl::Hidden, cl::desc("Control whether the compiler can use scalable vectors to " "vectorize a loop"), cl::values(clEnumValN(LoopVectorizeHints::SK_FixedWidthOnly, "off", "Scalable vectorization is disabled."), clEnumValN(LoopVectorizeHints::SK_PreferScalable, "preferred", "Scalable vectorization is available and favored when the " "cost is inconclusive."), clEnumValN(LoopVectorizeHints::SK_PreferScalable, "on", "Scalable vectorization is available and favored when the " "cost is inconclusive."), clEnumValN(LoopVectorizeHints::SK_AlwaysScalable, "always", "Scalable vectorization is available and always favored when " "feasible")))
static cl::opt< bool > EnableHistogramVectorization("enable-histogram-loop-vectorization", cl::init(false), cl::Hidden, cl::desc("Enables autovectorization of some loops containing histograms"))
static cl::opt< bool > EnableIfConversion("enable-if-conversion", cl::init(true), cl::Hidden, cl::desc("Enable if-conversion during vectorization."))
This file defines the LoopVectorizationLegality class.
This file provides a LoopVectorizationPlanner class.
Contains a collection of routines for determining if a given instruction is guaranteed to execute if ...
static bool isSimple(Instruction *I)
static void visit(BasicBlock &Start, std::function< bool(BasicBlock *)> op)
Virtual Register Rewriter
static const uint32_t IV[8]
@ NoAlias
The two locations do not alias at all.
bool empty() const
Check if the array is empty.
LLVM Basic Block Representation.
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction; assumes that the block is well-formed.
Function * getCalledFunction() const
Returns the function called, or null if this is an indirect function invocation or the function signa...
This class represents a function call, abstracting a target machine's calling convention.
A parsed version of the target data layout string in and methods for querying it.
static constexpr ElementCount getScalable(ScalarTy MinVal)
static constexpr ElementCount getFixed(ScalarTy MinVal)
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
an instruction for type-safe pointer arithmetic to access elements of arrays and structs
bool isGuaranteedToExecute(const Instruction &Inst, const DominatorTree *DT, const Loop *CurLoop) const override
Returns true if the instruction in a loop is guaranteed to execute at least once (under the assumptio...
void computeLoopSafetyInfo(const Loop *CurLoop) override
Computes safety information for a loop checks loop body & header for the possibility of may throw exc...
A struct for saving information about induction variables.
static LLVM_ABI bool isInductionPHI(PHINode *Phi, const Loop *L, ScalarEvolution *SE, InductionDescriptor &D, ArrayRef< const SCEVPredicate * > NoWrapPreds={}, const SCEV *Expr=nullptr, SmallVectorImpl< Instruction * > *CastsToIgnore=nullptr)
Returns true if Phi is an induction in the loop L.
@ IK_FpInduction
Floating point induction variable.
@ IK_PtrInduction
Pointer induction var. Step = C.
@ IK_IntInduction
Integer induction variable. Step = C.
Instruction * getExactFPMathInst()
Returns floating-point induction operator that does not allow reassociation (transforming the inducti...
Class to represent integer types.
An instruction for reading from memory.
const MemoryDepChecker & getDepChecker() const
the Memory Dependence Checker which can determine the loop-independent and loop-carried dependences b...
static LLVM_ABI bool blockNeedsPredication(const BasicBlock *BB, const Loop *TheLoop, const DominatorTree *DT)
Return true if the block BB needs to be predicated in order for the loop to be vectorized.
bool contains(const LoopT *L) const
Return true if the specified loop is contained within in this loop.
BlockT * getLoopLatch() const
If there is a single latch block for this loop, return it.
bool isInnermost() const
Return true if the loop does not contain any (natural) loops.
unsigned getNumBackEdges() const
Calculate the number of back edges to the loop header.
iterator_range< block_iterator > blocks() const
BlockT * getLoopPreheader() const
If there is a preheader for this loop, return it.
bool isLoopHeader(const BlockT *BB) const
LLVM_ABI bool isInvariantStoreOfReduction(StoreInst *SI)
Returns True if given store is a final invariant store of one of the reductions found in the loop.
void collectUnitStridePredicates() const
Add unit stride predicates for memory accesses to PSE, if runtime checks are allowed and an inner loo...
LLVM_ABI bool isInvariantAddressOfReduction(Value *V)
Returns True if given address is invariant and is used to store recurrent expression.
LLVM_ABI bool canVectorize(bool UseVPlanNativePath)
Returns true if it is legal to vectorize this loop.
LLVM_ABI bool blockNeedsPredication(const BasicBlock *BB) const
Return true if the block BB needs to be predicated in order for the loop to be vectorized.
LLVM_ABI int isConsecutivePtr(Type *AccessTy, Value *Ptr) const
Check if this pointer is consecutive when vectorizing.
bool hasUncountableExitWithSideEffects() const
Returns true if this is an early exit loop with state-changing or potentially-faulting operations and...
LLVM_ABI bool canVectorizeFPMath(bool EnableStrictReductions)
Returns true if it is legal to vectorize the FP math operations in this loop.
LLVM_ABI bool isFixedOrderRecurrence(const PHINode *Phi) const
Returns True if Phi is a fixed-order recurrence in this loop.
LLVM_ABI const InductionDescriptor * getPointerInductionDescriptor(PHINode *Phi) const
Returns a pointer to the induction descriptor, if Phi is pointer induction.
LLVM_ABI const InductionDescriptor * getIntOrFpInductionDescriptor(PHINode *Phi) const
Returns a pointer to the induction descriptor, if Phi is an integer or floating point induction.
LLVM_ABI bool isInductionPhi(const Value *V) const
Returns True if V is a Phi node of an induction variable in this loop.
const InductionList & getInductionVars() const
Returns the induction variables found in the loop.
LLVM_ABI bool isInvariant(Value *V) const
Returns true if V is invariant across all loop iterations according to SCEV.
const ReductionList & getReductionVars() const
Returns the reduction variables found in the loop.
LLVM_ABI bool canFoldTailByMasking() const
Return true if we can vectorize this loop while folding its tail by masking.
LLVM_ABI void prepareToFoldTailByMasking()
Mark all respective loads/stores for masking.
bool hasUncountableEarlyExit() const
Returns true if the loop has uncountable early exits, i.e.
LLVM_ABI bool isUniformMemOp(Instruction &I, std::optional< ElementCount > VF) const
A uniform memory op is a load or store which accesses the same memory location on all VF lanes,...
LLVM_ABI bool isUniform(Value *V, std::optional< ElementCount > VF) const
Returns true if value V is uniform across VF lanes, when VF is provided, and otherwise if V is invari...
LLVM_ABI bool isInductionVariable(const Value *V) const
Returns True if V can be considered as an induction variable in this loop.
LLVM_ABI bool isCastedInductionVariable(const Value *V) const
Returns True if V is a cast that is part of an induction def-use chain, and had been proven to be red...
@ SK_PreferScalable
Vectorize loops using scalable vectors or fixed-width vectors, but favor scalable vectors when the co...
@ SK_AlwaysScalable
Always vectorize loops using scalable vectors if feasible (i.e.
@ SK_Unspecified
Not selected.
@ SK_FixedWidthOnly
Disables vectorization with scalable vectors.
enum ForceKind getForce() const
LLVM_ABI bool allowVectorization(Function *F, Loop *L, bool VectorizeOnlyWhenForced) const
LLVM_ABI bool allowReordering() const
When enabling loop hints are provided we allow the vectorizer to change the order of operations that ...
LLVM_ABI void emitRemarkWithHints() const
Dumps all the hint information.
ElementCount getWidth() const
@ FK_Enabled
Forcing enabled.
@ FK_Undefined
Not selected.
@ FK_Disabled
Forcing disabled.
LLVM_ABI void setAlreadyVectorized()
Mark the loop L as already vectorized by setting the width to 1.
LLVM_ABI LoopVectorizeHints(const Loop *L, bool InterleaveOnlyWhenForced, OptimizationRemarkEmitter &ORE, const TargetTransformInfo *TTI=nullptr)
unsigned getInterleave() const
unsigned getIsVectorized() const
Represents a single loop in the control flow graph.
bool isLoopInvariant(const Value *V) const
Return true if the specified value is loop invariant.
PHINode * getCanonicalInductionVariable() const
Check to see if the loop has a canonical induction variable: an integer recurrence that starts at 0 a...
MDNode * getLoopID() const
Return the llvm.loop loop id metadata node for this loop if it is present.
const MDOperand & getOperand(unsigned I) const
ArrayRef< MDOperand > operands() const
unsigned getNumOperands() const
Return number of MDNode operands.
Tracking metadata reference owned by Metadata.
LLVM_ABI StringRef getString() const
iterator find(const KeyT &Key)
Checks memory dependences among accesses to the same underlying object to determine whether there vec...
const SmallVectorImpl< Dependence > * getDependences() const
Returns the memory dependences.
An interface layer with SCEV used to manage how we see SCEV expressions for values in the context of ...
ScalarEvolution * getSE() const
Returns the ScalarEvolution analysis used.
The RecurrenceDescriptor is used to identify recurrences variables in a loop.
Instruction * getExactFPMathInst() const
Returns 1st non-reassociative FP instruction in the PHI node's use-chain.
static LLVM_ABI bool isFixedOrderRecurrence(PHINode *Phi, Loop *TheLoop, DominatorTree *DT)
Returns true if Phi is a fixed-order recurrence.
bool hasExactFPMath() const
Returns true if the recurrence has floating-point math that requires precise (ordered) operations.
static LLVM_ABI bool isReductionPHI(PHINode *Phi, Loop *TheLoop, RecurrenceDescriptor &RedDes, DemandedBits *DB=nullptr, AssumptionCache *AC=nullptr, DominatorTree *DT=nullptr, ScalarEvolution *SE=nullptr)
Returns true if Phi is a reduction in TheLoop.
bool hasUsesOutsideReductionChain() const
Returns true if the reduction PHI has any uses outside the reduction chain.
RecurKind getRecurrenceKind() const
bool isOrdered() const
Expose an ordered FP reduction to the instance users.
StoreInst * IntermediateStore
Reductions may store temporary or final result to an invariant address.
static bool isMinMaxRecurrenceKind(RecurKind Kind)
Returns true if the recurrence kind is any min/max kind.
const Loop * getLoop() const
SCEVUse getStepRecurrence(ScalarEvolution &SE) const
Constructs and returns the recurrence indicating how much this expression steps by.
This visitor recursively visits a SCEV expression and re-writes it.
const SCEV * visit(const SCEV *S)
This class represents an analyzed expression in the program.
static constexpr auto FlagAnyWrap
The main scalar evolution driver.
LLVM_ABI const SCEV * getSCEV(Value *V)
Return a SCEV expression for the full generality of the specified expression.
LLVM_ABI bool isLoopInvariant(const SCEV *S, const Loop *L)
Return true if the value of the given SCEV is unchanging in the specified loop.
LLVM_ABI bool isSCEVable(Type *Ty) const
Test if values of the given type are analyzable within the SCEV framework.
LLVM_ABI const SCEV * getCouldNotCompute()
A templated base class for SmallPtrSet which provides the typesafe interface that is common across al...
size_type count(ConstPtrType Ptr) const
count - Return 1 if the specified pointer is in the set, 0 otherwise.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
reference emplace_back(ArgTypes &&... Args)
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
An instruction for storing to memory.
Value * getPointerOperand()
Represent a constant reference to a string, i.e.
Provides information about what library functions are available for the current target.
void getWidestVF(StringRef ScalarF, ElementCount &FixedVF, ElementCount &ScalableVF) const
Returns the largest vectorization factor used in the list of vector functions.
bool isFunctionVectorizable(StringRef F, const ElementCount &VF) const
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
LLVM_ABI std::string str() const
Return the twine contents as a std::string.
The instances of the Type class are immutable: once they are created, they are never changed.
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
bool isPointerTy() const
True if this is an instance of PointerType.
LLVM_ABI unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.
bool isFloatingPointTy() const
Return true if this is one of the floating-point types.
bool isIntOrPtrTy() const
Return true if this is an integer type or a pointer type.
bool isIntegerTy() const
True if this is an instance of IntegerType.
Value * getOperand(unsigned i) const
static bool hasMaskedVariant(const CallInst &CI, std::optional< ElementCount > VF=std::nullopt)
static SmallVector< VFInfo, 8 > getMappings(const CallInst &CI)
Retrieve all the VFInfo instances associated to the CallInst CI.
LLVM Value Representation.
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
static LLVM_ABI bool isValidElementType(Type *ElemTy)
Return true if the specified type is valid as a element type.
static constexpr bool isKnownLE(const FixedOrScalableQuantity &LHS, const FixedOrScalableQuantity &RHS)
constexpr bool isZero() const
const ParentTy * getParent() const
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
@ C
The default llvm calling convention, compatible with C.
@ BasicBlock
Various leaf nodes.
void reportVectorizationFailure(const StringRef DebugMsg, const StringRef OREMsg, const StringRef ORETag, OptimizationRemarkEmitter *ORE, const Loop *TheLoop, Instruction *I=nullptr)
Reports a vectorization failure: print DebugMsg for debugging purposes along with the corresponding o...
OneUse_match< SubPat > m_OneUse(const SubPat &SP)
TwoOps_match< ValueOpTy, PointerOpTy, Instruction::Store > m_Store(const ValueOpTy &ValueOp, const PointerOpTy &PointerOp)
Matches StoreInst.
BinaryOp_match< LHS, RHS, Instruction::Add > m_Add(const LHS &L, const RHS &R)
bool match(Val *V, const Pattern &P)
match_bind< Instruction > m_Instruction(Instruction *&I)
Match an instruction, capturing it if we match.
specificval_ty m_Specific(const Value *V)
Match if we have a specific specified value.
IntrinsicID_match m_Intrinsic()
Match intrinsic calls like this: m_Intrinsic<Intrinsic::fabs>(m_Value(X))
auto m_BinOp()
Match an arbitrary binary operation and ignore it.
auto m_Value()
Match an arbitrary value and ignore it.
match_combine_or< match_combine_or< CastInst_match< OpTy, ZExtInst >, CastInst_match< OpTy, SExtInst > >, OpTy > m_ZExtOrSExtOrSelf(const OpTy &Op)
OneOps_match< OpTy, Instruction::Load > m_Load(const OpTy &Op)
Matches LoadInst.
CmpClass_match< LHS, RHS, ICmpInst > m_ICmp(CmpPredicate &Pred, const LHS &L, const RHS &R)
BinaryOp_match< LHS, RHS, Instruction::Sub > m_Sub(const LHS &L, const RHS &R)
ValuesClass values(OptsTy... Options)
Helper to build a ValuesClass by forwarding a variable number of arguments as an initializer list to ...
initializer< Ty > init(const Ty &Val)
std::enable_if_t< detail::IsValidPointer< X, Y >::value, X * > dyn_extract(Y &&MD)
Extract a Value from Metadata, if any.
Add a small namespace to avoid name clashes with the classes used in the streaming interface.
NodeAddr< PhiNode * > Phi
NodeAddr< FuncNode * > Func
friend class Instruction
Iterator for Instructions in a `BasicBlock.
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
FunctionAddr VTableAddr Value
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
auto size(R &&Range, std::enable_if_t< std::is_base_of< std::random_access_iterator_tag, typename std::iterator_traits< decltype(Range.begin())>::iterator_category >::value, void > *=nullptr)
Get the size of a range.
LLVM_ABI Intrinsic::ID getVectorIntrinsicIDForCall(const CallInst *CI, const TargetLibraryInfo *TLI)
Returns intrinsic ID for call.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
auto successors(const MachineBasicBlock *BB)
const Value * getLoadStorePointerOperand(const Value *V)
A helper function that returns the pointer operand of a load or store instruction.
static bool isUniformLoopNest(Loop *Lp, Loop *OuterLp)
void append_range(Container &C, Range &&R)
Wrapper function to append range R to container C.
static bool isUniformLoop(Loop *Lp, Loop *OuterLp)
LLVM_ABI bool mustSuppressSpeculation(const LoadInst &LI)
Return true if speculation of the given load must be suppressed to avoid ordering or interfering with...
LLVM_ABI bool isSafeToSpeculativelyExecute(const Instruction *I, const Instruction *CtxI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr, const TargetLibraryInfo *TLI=nullptr, bool UseVariableInfo=true, bool IgnoreUBImplyingAttrs=true)
Return true if the instruction does not have any effects besides calculating the result and does not ...
auto dyn_cast_or_null(const Y &Val)
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
auto reverse(ContainerTy &&C)
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
static IntegerType * getWiderInductionTy(const DataLayout &DL, Type *Ty0, Type *Ty1)
static IntegerType * getInductionIntegerTy(const DataLayout &DL, Type *Ty)
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
LLVM_ABI bool hasDisableAllTransformsHint(const Loop *L)
Look for the loop attribute that disables all transformation heuristic.
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
static bool storeToSameAddress(ScalarEvolution *SE, StoreInst *A, StoreInst *B)
Returns true if A and B have same pointer operands or same SCEVs addresses.
bool canVectorizeTy(Type *Ty)
Returns true if Ty is a valid vector element type, void, or an unpacked literal struct where all elem...
LLVM_ABI bool isVectorIntrinsicWithScalarOpAtArg(Intrinsic::ID ID, unsigned ScalarOpdIdx, const TargetTransformInfo *TTI)
Identifies if the vector form of the intrinsic has a scalar operand.
ArrayRef(const T &OneElt) -> ArrayRef< T >
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
LLVM_ABI bool isReadOnlyLoop(Loop *L, ScalarEvolution *SE, DominatorTree *DT, AssumptionCache *AC, SmallVectorImpl< LoadInst * > &NonDereferenceableAndAlignedLoads, SmallVectorImpl< const SCEVPredicate * > *Predicates=nullptr)
Returns true if the loop contains read-only memory accesses and doesn't throw.
void erase_if(Container &C, UnaryPredicate P)
Provide a container algorithm similar to C++ Library Fundamentals v2's erase_if which is equivalent t...
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
Type * getLoadStoreType(const Value *I)
A helper function that returns the type of a load or store instruction.
auto seq(T Begin, T End)
Iterate over an integral type from Begin up to - but not including - End.
static bool findHistogram(LoadInst *LI, StoreInst *HSt, Loop *TheLoop, const PredicatedScalarEvolution &PSE, SmallVectorImpl< HistogramInfo > &Histograms)
Find histogram operations that match high-level code in loops:
LLVM_ABI bool isGuaranteedNotToBePoison(const Value *V, AssumptionCache *AC=nullptr, const Instruction *CtxI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Returns true if V cannot be poison, but may be undef.
static bool isTLIScalarize(const TargetLibraryInfo &TLI, const CallInst &CI)
Checks if a function is scalarizable according to the TLI, in the sense that it should be vectorized ...
LLVM_ABI bool isDereferenceableAndAlignedInLoop(LoadInst *LI, Loop *L, ScalarEvolution &SE, DominatorTree &DT, AssumptionCache *AC=nullptr, SmallVectorImpl< const SCEVPredicate * > *Predicates=nullptr)
Return true if we can prove that the given load (which is assumed to be within the specified loop) wo...
constexpr detail::IsaCheckPredicate< Types... > IsaPred
Function object wrapper for the llvm::isa type check.
LLVM_ABI std::optional< int64_t > getPtrStride(PredicatedScalarEvolution &PSE, Type *AccessTy, Value *Ptr, const Loop *Lp, const DominatorTree &DT, const DenseMap< Value *, const SCEV * > &StridesMap=DenseMap< Value *, const SCEV * >(), bool Assume=false, bool ShouldCheckWrap=true)
If the pointer has a constant stride return it in units of the access type size.
SCEVUseT< const SCEV * > SCEVUse
bool SCEVExprContains(const SCEV *Root, PredTy Pred)
Return true if any node in Root satisfies the predicate Pred.
Dependece between memory access instructions.
Instruction * getDestination(const MemoryDepChecker &DepChecker) const
Return the destination instruction of the dependence.
Instruction * getSource(const MemoryDepChecker &DepChecker) const
Return the source instruction of the dependence.
static LLVM_ABI VectorizationSafetyStatus isSafeForVectorization(DepType Type)
Dependence types that don't prevent vectorization.
TODO: The following VectorizationFactor was pulled out of LoopVectorizationCostModel class.
Collection of parameters shared beetween the Loop Vectorizer and the Loop Access Analysis.
static LLVM_ABI const unsigned MaxVectorWidth
Maximum SIMD width.
static LLVM_ABI bool isInterleaveForced()
True if force-vector-interleave was specified by the user.
static LLVM_ABI unsigned VectorizationInterleave
Interleave factor as overridden by the user.