LLVM 23.0.0git
InferAlignment.cpp
Go to the documentation of this file.
1//===- InferAlignment.cpp -------------------------------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// Infer alignment for load, stores and other memory operations based on
10// trailing zero known bits information.
11//
12//===----------------------------------------------------------------------===//
13
15#include "llvm/ADT/APInt.h"
20#include "llvm/IR/Instruction.h"
27
28using namespace llvm;
29using namespace llvm::PatternMatch;
30
32 const DataLayout &DL, Instruction *I,
33 function_ref<Align(Value *PtrOp, Align OldAlign, Align PrefAlign)> Fn) {
34
35 if (auto *PtrOp = getLoadStorePointerOperand(I)) {
36 Align OldAlign = getLoadStoreAlignment(I);
37 Align PrefAlign = DL.getPrefTypeAlign(getLoadStoreType(I));
38
39 Align NewAlign = Fn(PtrOp, OldAlign, PrefAlign);
40 if (NewAlign > OldAlign) {
41 setLoadStoreAlignment(I, NewAlign);
42 return true;
43 }
44 }
45
46 Value *PtrOp;
47 const APInt *Const;
48 if (match(I, m_And(m_PtrToIntOrAddr(m_Value(PtrOp)), m_APInt(Const)))) {
49 Align ActualAlign = Fn(PtrOp, Align(1), Align(1));
50 if (Const->ult(ActualAlign.value())) {
51 I->replaceAllUsesWith(Constant::getNullValue(I->getType()));
52 return true;
53 }
54 if (Const->uge(
55 APInt::getBitsSetFrom(Const->getBitWidth(), Log2(ActualAlign)))) {
56 I->replaceAllUsesWith(I->getOperand(0));
57 return true;
58 }
59 }
60 if (match(I, m_Trunc(m_PtrToIntOrAddr(m_Value(PtrOp))))) {
61 Align ActualAlign = Fn(PtrOp, Align(1), Align(1));
62 if (Log2(ActualAlign) >= I->getType()->getScalarSizeInBits()) {
63 I->replaceAllUsesWith(Constant::getNullValue(I->getType()));
64 return true;
65 }
66 }
67
69 if (!II)
70 return false;
71
72 // TODO: Handle more memory intrinsics.
73 switch (II->getIntrinsicID()) {
74 case Intrinsic::masked_load:
75 case Intrinsic::masked_store: {
76 unsigned PtrOpIdx = II->getIntrinsicID() == Intrinsic::masked_load ? 0 : 1;
77 Value *PtrOp = II->getArgOperand(PtrOpIdx);
78 Type *Type = II->getIntrinsicID() == Intrinsic::masked_load
79 ? II->getType()
80 : II->getArgOperand(0)->getType();
81
82 Align OldAlign = II->getParamAlign(PtrOpIdx).valueOrOne();
83 Align PrefAlign = DL.getPrefTypeAlign(Type);
84 Align NewAlign = Fn(PtrOp, OldAlign, PrefAlign);
85 if (NewAlign <= OldAlign)
86 return false;
87
88 II->addParamAttr(PtrOpIdx,
89 Attribute::getWithAlignment(II->getContext(), NewAlign));
90 return true;
91 }
92 default:
93 return false;
94 }
95}
96
97using ScopedHT =
100 // If BB is nullptr, the BB is processed.
102 DomTreeNode::const_iterator Iter;
103 DomTreeNode::const_iterator End;
105
107 : BB(N->getBlock()), Iter(N->begin()), End(N->end()), Scope(Table) {}
108};
109
111 const DataLayout &DL = F.getDataLayout();
112 bool Changed = false;
113
114 // Enforce preferred type alignment if possible. We do this as a separate
115 // pass first, because it may improve the alignments we infer below.
116 for (BasicBlock &BB : F) {
117 for (Instruction &I : BB) {
119 DL, &I, [&](Value *PtrOp, Align OldAlign, Align PrefAlign) {
120 if (PrefAlign > OldAlign)
121 return std::max(OldAlign,
122 tryEnforceAlignment(PtrOp, PrefAlign, DL));
123 return OldAlign;
124 });
125 }
126 }
127
128 // Compute alignment from known bits.
129 auto InferFromKnownBits = [&](Instruction &I, Value *PtrOp) {
130 KnownBits Known = computeKnownBits(PtrOp, DL, &AC, &I, &DT);
131 unsigned TrailZ =
133 return Align(1ull << std::min(Known.getBitWidth() - 1, TrailZ));
134 };
135
136 // Propagate alignment between loads and stores that originate from the
137 // same base pointer.
138 ScopedHT BestBasePointerAligns;
139 auto InferFromBasePointer = [&](Value *PtrOp, Align LoadStoreAlign) {
140 APInt OffsetFromBase(DL.getIndexTypeSizeInBits(PtrOp->getType()), 0);
141 PtrOp = PtrOp->stripAndAccumulateConstantOffsets(DL, OffsetFromBase, true);
142 // Derive the base pointer alignment from the load/store alignment
143 // and the offset from the base pointer.
144 Align BasePointerAlign =
145 commonAlignment(LoadStoreAlign, OffsetFromBase.getLimitedValue());
146
147 if (auto BestAlign = BestBasePointerAligns.lookup(PtrOp);
148 BestAlign != Align()) {
149 // If the stored base pointer alignment is better than the
150 // base pointer alignment we derived, we may be able to use it
151 // to improve the load/store alignment. If not, store the
152 // improved base pointer alignment for future iterations.
153 if (BestAlign > BasePointerAlign) {
154 Align BetterLoadStoreAlign =
155 commonAlignment(BestAlign, OffsetFromBase.getLimitedValue());
156 return BetterLoadStoreAlign;
157 }
158 }
159
160 BestBasePointerAligns.insert(PtrOp, BasePointerAlign);
161 return LoadStoreAlign;
162 };
163
164 // AlignmentScope is unmovable.
165 std::list<AlignmentScope> Stack;
166 Stack.emplace_back(DT.getRootNode(), BestBasePointerAligns);
167 while (!Stack.empty()) {
168 AlignmentScope &Top = Stack.back();
169 if (Top.BB) {
170 for (Instruction &I : *Top.BB) {
172 DL, &I, [&](Value *PtrOp, Align OldAlign, Align PrefAlign) {
173 return std::max(InferFromKnownBits(I, PtrOp),
174 InferFromBasePointer(PtrOp, OldAlign));
175 });
176 }
177 Top.BB = nullptr;
178 }
179
180 if (Top.Iter != Top.End)
181 Stack.emplace_back(*Top.Iter++, BestBasePointerAligns);
182 else
183 Stack.pop_back();
184 }
185
186 return Changed;
187}
188
193 inferAlignment(F, AC, DT);
194 // Changes to alignment shouldn't invalidated analyses.
195 return PreservedAnalyses::all();
196}
This file implements a class to represent arbitrary precision integral constant values and operations...
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static bool tryToImproveAlign(const DataLayout &DL, Instruction *I, function_ref< Align(Value *PtrOp, Align OldAlign, Align PrefAlign)> Fn)
bool inferAlignment(Function &F, AssumptionCache &AC, DominatorTree &DT)
ScopedHashTable< Value *, Align, DenseMapInfo< Value * >, BumpPtrAllocator > ScopedHT
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
uint64_t IntrinsicInst * II
Class for arbitrary precision integers.
Definition APInt.h:78
uint64_t getLimitedValue(uint64_t Limit=UINT64_MAX) const
If this value is smaller than the specified limit, return it, otherwise return the limit value.
Definition APInt.h:476
static APInt getBitsSetFrom(unsigned numBits, unsigned loBit)
Constructs an APInt value that has a contiguous range of bits set.
Definition APInt.h:287
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
A function analysis which provides an AssumptionCache.
A cache of @llvm.assume calls within a function.
static LLVM_ABI Attribute getWithAlignment(LLVMContext &Context, Align Alignment)
Return a uniquified Attribute object that has the specific alignment set.
LLVM Basic Block Representation.
Definition BasicBlock.h:62
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:64
Analysis pass which computes a DominatorTree.
Definition Dominators.h:278
DomTreeNodeBase< NodeT > * getRootNode()
getRootNode - This returns the entry node for the CFG of the function.
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition Dominators.h:159
A wrapper class for inspecting calls to intrinsic functions.
A set of analyses that are preserved following a run of a transformation pass.
Definition Analysis.h:112
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition Analysis.h:118
void insert(const K &Key, const V &Val)
V lookup(const K &Key) const
ScopedHashTableScope< Value *, Align, DenseMapInfo< Value * >, BumpPtrAllocator > ScopeTy
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:46
LLVM Value Representation.
Definition Value.h:75
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:255
LLVM_ABI const Value * stripAndAccumulateConstantOffsets(const DataLayout &DL, APInt &Offset, bool AllowNonInbounds, bool AllowInvariantGroup=false, function_ref< bool(Value &Value, APInt &Offset)> ExternalAnalysis=nullptr, bool LookThroughIntToPtr=false) const
Accumulate the constant offset this value has compared to a base pointer.
static constexpr unsigned MaxAlignmentExponent
The maximum alignment for instructions.
Definition Value.h:797
An efficient, type-erasing, non-owning reference to a callable.
Changed
BinaryOp_match< LHS, RHS, Instruction::And > m_And(const LHS &L, const RHS &R)
auto m_PtrToIntOrAddr(const OpTy &Op)
Matches PtrToInt or PtrToAddr.
ap_match< APInt > m_APInt(const APInt *&Res)
Match a ConstantInt or splatted ConstantVector, binding the specified pointer to the contained APInt.
CastInst_match< OpTy, TruncInst > m_Trunc(const OpTy &Op)
Matches Trunc.
bool match(Val *V, const Pattern &P)
auto m_Value()
Match an arbitrary value and ignore it.
This is an optimization pass for GlobalISel generic memory operations.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
const Value * getLoadStorePointerOperand(const Value *V)
A helper function that returns the pointer operand of a load or store instruction.
Align getLoadStoreAlignment(const Value *I)
A helper function that returns the alignment of load or store instruction.
DomTreeNodeBase< BasicBlock > DomTreeNode
Definition Dominators.h:94
LLVM_ABI void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOn...
LLVM_ABI Align tryEnforceAlignment(Value *V, Align PrefAlign, const DataLayout &DL)
If the specified pointer points to an object that we control, try to modify the object's alignment to...
Definition Local.cpp:1532
Align commonAlignment(Align A, uint64_t Offset)
Returns the alignment that satisfies both alignments.
Definition Alignment.h:201
Type * getLoadStoreType(const Value *I)
A helper function that returns the type of a load or store instruction.
void setLoadStoreAlignment(Value *I, Align NewAlign)
A helper function that set the alignment of load or store instruction.
unsigned Log2(Align A)
Returns the log2 of the alignment.
Definition Alignment.h:197
AnalysisManager< Function > FunctionAnalysisManager
Convenience typedef for the Function analysis manager.
BumpPtrAllocatorImpl<> BumpPtrAllocator
The standard BumpPtrAllocator which just uses the default template parameters.
Definition Allocator.h:383
#define N
ScopedHT::ScopeTy Scope
DomTreeNode::const_iterator End
AlignmentScope(DomTreeNode *N, ScopedHT &Table)
DomTreeNode::const_iterator Iter
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
constexpr uint64_t value() const
This is a hole in the type system and should not be abused.
Definition Alignment.h:77
LLVM_ABI PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM)
unsigned countMinTrailingZeros() const
Returns the minimum number of trailing zero bits.
Definition KnownBits.h:256
unsigned getBitWidth() const
Get the bit width of this value.
Definition KnownBits.h:44