LLVM 22.0.0git
InferAlignment.cpp
Go to the documentation of this file.
1//===- InferAlignment.cpp -------------------------------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// Infer alignment for loads, stores and other memory operations based on
10// trailing zero known bits information.
11//
12//===----------------------------------------------------------------------===//
13
22
23using namespace llvm;
24
26 const DataLayout &DL, Instruction *I,
27 function_ref<Align(Value *PtrOp, Align OldAlign, Align PrefAlign)> Fn) {
28
29 if (auto *PtrOp = getLoadStorePointerOperand(I)) {
30 Align OldAlign = getLoadStoreAlignment(I);
31 Align PrefAlign = DL.getPrefTypeAlign(getLoadStoreType(I));
32
33 Align NewAlign = Fn(PtrOp, OldAlign, PrefAlign);
34 if (NewAlign > OldAlign) {
35 setLoadStoreAlignment(I, NewAlign);
36 return true;
37 }
38 }
39
41 if (!II)
42 return false;
43
44 // TODO: Handle more memory intrinsics.
45 switch (II->getIntrinsicID()) {
46 case Intrinsic::masked_load:
47 case Intrinsic::masked_store: {
48 unsigned PtrOpIdx = II->getIntrinsicID() == Intrinsic::masked_load ? 0 : 1;
49 Value *PtrOp = II->getArgOperand(PtrOpIdx);
50 Type *Type = II->getIntrinsicID() == Intrinsic::masked_load
51 ? II->getType()
52 : II->getArgOperand(0)->getType();
53
54 Align OldAlign = II->getParamAlign(PtrOpIdx).valueOrOne();
55 Align PrefAlign = DL.getPrefTypeAlign(Type);
56 Align NewAlign = Fn(PtrOp, OldAlign, PrefAlign);
57 if (NewAlign <= OldAlign)
58 return false;
59
60 II->addParamAttr(PtrOpIdx,
61 Attribute::getWithAlignment(II->getContext(), NewAlign));
62 return true;
63 }
64 default:
65 return false;
66 }
67}
68
70 const DataLayout &DL = F.getDataLayout();
71 bool Changed = false;
72
73 // Enforce preferred type alignment if possible. We do this as a separate
74 // pass first, because it may improve the alignments we infer below.
75 for (BasicBlock &BB : F) {
76 for (Instruction &I : BB) {
78 DL, &I, [&](Value *PtrOp, Align OldAlign, Align PrefAlign) {
79 if (PrefAlign > OldAlign)
80 return std::max(OldAlign,
81 tryEnforceAlignment(PtrOp, PrefAlign, DL));
82 return OldAlign;
83 });
84 }
85 }
86
87 // Compute alignment from known bits.
88 auto InferFromKnownBits = [&](Instruction &I, Value *PtrOp) {
89 KnownBits Known = computeKnownBits(PtrOp, DL, &AC, &I, &DT);
90 unsigned TrailZ =
92 return Align(1ull << std::min(Known.getBitWidth() - 1, TrailZ));
93 };
94
95 // Propagate alignment between loads and stores that originate from the
96 // same base pointer.
97 DenseMap<Value *, Align> BestBasePointerAligns;
98 auto InferFromBasePointer = [&](Value *PtrOp, Align LoadStoreAlign) {
99 APInt OffsetFromBase(DL.getIndexTypeSizeInBits(PtrOp->getType()), 0);
100 PtrOp = PtrOp->stripAndAccumulateConstantOffsets(DL, OffsetFromBase, true);
101 // Derive the base pointer alignment from the load/store alignment
102 // and the offset from the base pointer.
103 Align BasePointerAlign =
104 commonAlignment(LoadStoreAlign, OffsetFromBase.getLimitedValue());
105
106 auto [It, Inserted] =
107 BestBasePointerAligns.try_emplace(PtrOp, BasePointerAlign);
108 if (!Inserted) {
109 // If the stored base pointer alignment is better than the
110 // base pointer alignment we derived, we may be able to use it
111 // to improve the load/store alignment. If not, store the
112 // improved base pointer alignment for future iterations.
113 if (It->second > BasePointerAlign) {
114 Align BetterLoadStoreAlign =
115 commonAlignment(It->second, OffsetFromBase.getLimitedValue());
116 return BetterLoadStoreAlign;
117 }
118 It->second = BasePointerAlign;
119 }
120 return LoadStoreAlign;
121 };
122
123 for (BasicBlock &BB : F) {
124 // We need to reset the map for each block because alignment information
125 // can only be propagated from instruction A to B if A dominates B.
126 // This is because control flow (and exception throwing) could be dependent
127 // on the address (and its alignment) at runtime. Some sort of dominator
128 // tree approach could be better, but doing a simple forward pass through a
129 // single basic block is correct too.
130 BestBasePointerAligns.clear();
131
132 for (Instruction &I : BB) {
134 DL, &I, [&](Value *PtrOp, Align OldAlign, Align PrefAlign) {
135 return std::max(InferFromKnownBits(I, PtrOp),
136 InferFromBasePointer(PtrOp, OldAlign));
137 });
138 }
139 }
140
141 return Changed;
142}
143
148 inferAlignment(F, AC, DT);
149 // Changes to alignment shouldn't invalidate analyses.
150 return PreservedAnalyses::all();
151}
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static bool tryToImproveAlign(const DataLayout &DL, Instruction *I, function_ref< Align(Value *PtrOp, Align OldAlign, Align PrefAlign)> Fn)
bool inferAlignment(Function &F, AssumptionCache &AC, DominatorTree &DT)
#define F(x, y, z)
Definition MD5.cpp:55
#define I(x, y, z)
Definition MD5.cpp:58
uint64_t IntrinsicInst * II
Class for arbitrary precision integers.
Definition APInt.h:78
uint64_t getLimitedValue(uint64_t Limit=UINT64_MAX) const
If this value is smaller than the specified limit, return it, otherwise return the limit value.
Definition APInt.h:475
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
A function analysis which provides an AssumptionCache.
A cache of @llvm.assume calls within a function.
static LLVM_ABI Attribute getWithAlignment(LLVMContext &Context, Align Alignment)
Return a uniquified Attribute object that has the specific alignment set.
LLVM Basic Block Representation.
Definition BasicBlock.h:62
A parsed version of the target data layout string, and methods for querying it.
Definition DataLayout.h:63
std::pair< iterator, bool > try_emplace(KeyT &&Key, Ts &&...Args)
Definition DenseMap.h:248
Analysis pass which computes a DominatorTree.
Definition Dominators.h:284
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition Dominators.h:165
A wrapper class for inspecting calls to intrinsic functions.
A set of analyses that are preserved following a run of a transformation pass.
Definition Analysis.h:112
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition Analysis.h:118
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45
LLVM Value Representation.
Definition Value.h:75
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:256
LLVM_ABI const Value * stripAndAccumulateConstantOffsets(const DataLayout &DL, APInt &Offset, bool AllowNonInbounds, bool AllowInvariantGroup=false, function_ref< bool(Value &Value, APInt &Offset)> ExternalAnalysis=nullptr, bool LookThroughIntToPtr=false) const
Accumulate the constant offset this value has compared to a base pointer.
static constexpr unsigned MaxAlignmentExponent
The maximum alignment for instructions.
Definition Value.h:829
An efficient, type-erasing, non-owning reference to a callable.
Changed
This is an optimization pass for GlobalISel generic memory operations.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
const Value * getLoadStorePointerOperand(const Value *V)
A helper function that returns the pointer operand of a load or store instruction.
Align getLoadStoreAlignment(const Value *I)
A helper function that returns the alignment of a load or store instruction.
LLVM_ABI void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOne bit sets.
LLVM_ABI Align tryEnforceAlignment(Value *V, Align PrefAlign, const DataLayout &DL)
If the specified pointer points to an object that we control, try to modify the object's alignment to PrefAlign.
Definition Local.cpp:1517
Align commonAlignment(Align A, uint64_t Offset)
Returns the alignment that satisfies both alignments.
Definition Alignment.h:201
Type * getLoadStoreType(const Value *I)
A helper function that returns the type of a load or store instruction.
void setLoadStoreAlignment(Value *I, Align NewAlign)
A helper function that sets the alignment of a load or store instruction.
AnalysisManager< Function > FunctionAnalysisManager
Convenience typedef for the Function analysis manager.
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM)
unsigned countMinTrailingZeros() const
Returns the minimum number of trailing zero bits.
Definition KnownBits.h:242
unsigned getBitWidth() const
Get the bit width of this value.
Definition KnownBits.h:44