LLVM 22.0.0git
InferAlignment.cpp
Go to the documentation of this file.
1//===- InferAlignment.cpp -------------------------------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// Infer alignment for loads, stores and other memory operations based on
10// trailing zero known bits information.
11//
12//===----------------------------------------------------------------------===//
13
22
23using namespace llvm;
24
// Attempts to raise the alignment recorded on instruction I. Fn receives the
// pointer operand, the current alignment and the preferred alignment of the
// accessed type, and returns a candidate alignment. The instruction is only
// rewritten (and true returned) when the candidate is strictly larger than
// the current alignment; otherwise false is returned.
// NOTE(review): the opening line of this definition and the statement that
// defines II (original lines 25 and 40) are absent from this listing.
26 const DataLayout &DL, Instruction *I,
27 function_ref<Align(Value *PtrOp, Align OldAlign, Align PrefAlign)> Fn) {
28
// Load/store case: the alignment is read from and written back to the
// instruction itself via the load/store helper functions.
29 if (auto *PtrOp = getLoadStorePointerOperand(I)) {
30 Align OldAlign = getLoadStoreAlignment(I);
31 Align PrefAlign = DL.getPrefTypeAlign(getLoadStoreType(I));
32
33 Align NewAlign = Fn(PtrOp, OldAlign, PrefAlign);
34 if (NewAlign > OldAlign) {
35 setLoadStoreAlignment(I, NewAlign);
36 return true;
37 }
// No improvement found: control falls through to the intrinsic check below.
38 }
39
// Anything that is not an intrinsic call is left untouched.
// NOTE(review): II is presumably the result of casting I to IntrinsicInst;
// the defining statement is not visible here -- confirm.
41 if (!II)
42 return false;
43
44 // TODO: Handle more memory intrinsics.
45 switch (II->getIntrinsicID()) {
46 case Intrinsic::masked_load:
47 case Intrinsic::masked_store: {
// Operand layout used below:
//   masked_load:  pointer = argument 0, alignment = argument 1,
//                 accessed type = the call's result type.
//   masked_store: pointer = argument 1, alignment = argument 2,
//                 accessed type = the type of argument 0.
48 int AlignOpIdx = II->getIntrinsicID() == Intrinsic::masked_load ? 1 : 2;
49 Value *PtrOp = II->getIntrinsicID() == Intrinsic::masked_load
50 ? II->getArgOperand(0)
51 : II->getArgOperand(1);
52 Type *Type = II->getIntrinsicID() == Intrinsic::masked_load
53 ? II->getType()
54 : II->getArgOperand(0)->getType();
55
// The current alignment is stored as a constant integer operand of the call.
56 Align OldAlign =
57 cast<ConstantInt>(II->getArgOperand(AlignOpIdx))->getAlignValue();
58 Align PrefAlign = DL.getPrefTypeAlign(Type);
59 Align NewAlign = Fn(PtrOp, OldAlign, PrefAlign);
// Bail out if nothing improved, or if the new alignment would not fit in the
// 32-bit integer constant that is written back below.
60 if (NewAlign <= OldAlign ||
61 NewAlign.value() > std::numeric_limits<uint32_t>().max())
62 return false;
63
// Replace the alignment operand with a new i32 constant holding NewAlign.
// The local variable named Type shadows the class name; the qualified
// Type::getInt32Ty below still refers to the class.
64 Value *V =
65 ConstantInt::get(Type::getInt32Ty(II->getContext()), NewAlign.value());
66 II->setOperand(AlignOpIdx, V);
67 return true;
68 }
69 default:
70 return false;
71 }
72}
73
// Makes two sweeps over every instruction of F. The first tries to enforce
// the preferred type alignment; the second infers alignment from known bits
// and from other accesses that share the same base pointer. Returns Changed.
// NOTE(review): the opening line of this definition and original lines 82, 96
// and 138 are absent from this listing. Lines 82 and 138 presumably hold the
// tryToImproveAlign calls that accumulate into Changed -- confirm against the
// full file.
75 const DataLayout &DL = F.getDataLayout();
76 bool Changed = false;
77
78 // Enforce preferred type alignment if possible. We do this as a separate
79 // pass first, because it may improve the alignments we infer below.
80 for (BasicBlock &BB : F) {
81 for (Instruction &I : BB) {
// Callback: only calls tryEnforceAlignment when the preferred alignment
// exceeds the current one, and never returns less than OldAlign.
83 DL, &I, [&](Value *PtrOp, Align OldAlign, Align PrefAlign) {
84 if (PrefAlign > OldAlign)
85 return std::max(OldAlign,
86 tryEnforceAlignment(PtrOp, PrefAlign, DL));
87 return OldAlign;
88 });
89 }
90 }
91
92 // Compute alignment from known bits.
93 auto InferFromKnownBits = [&](Instruction &I, Value *PtrOp) {
94 KnownBits Known = computeKnownBits(PtrOp, DL, &AC, &I, &DT);
// NOTE(review): the initializer of TrailZ (original line 96) is missing from
// this listing.
95 unsigned TrailZ =
// The shift amount is capped at bit width - 1 so that the shift stays within
// the width of the known-bits value.
97 return Align(1ull << std::min(Known.getBitWidth() - 1, TrailZ));
98 };
99
100 // Propagate alignment between loads and stores that originate from the
101 // same base pointer.
102 DenseMap<Value *, Align> BestBasePointerAligns;
// Returns the alignment to use for an access through PtrOp: either one
// derived from a better base alignment recorded earlier, or LoadStoreAlign
// unchanged. Records or updates the base pointer's alignment as a side effect.
103 auto InferFromBasePointer = [&](Value *PtrOp, Align LoadStoreAlign) {
104 APInt OffsetFromBase(DL.getIndexTypeSizeInBits(PtrOp->getType()), 0);
// Strip constant offsets to reach the base pointer; the `true` argument is
// AllowNonInbounds.
105 PtrOp = PtrOp->stripAndAccumulateConstantOffsets(DL, OffsetFromBase, true);
106 // Derive the base pointer alignment from the load/store alignment
107 // and the offset from the base pointer.
108 Align BasePointerAlign =
109 commonAlignment(LoadStoreAlign, OffsetFromBase.getLimitedValue());
110
// try_emplace only inserts when the base pointer has no entry yet; Inserted
// tells the two cases apart.
111 auto [It, Inserted] =
112 BestBasePointerAligns.try_emplace(PtrOp, BasePointerAlign);
113 if (!Inserted) {
114 // If the stored base pointer alignment is better than the
115 // base pointer alignment we derived, we may be able to use it
116 // to improve the load/store alignment. If not, store the
117 // improved base pointer alignment for future iterations.
118 if (It->second > BasePointerAlign) {
119 Align BetterLoadStoreAlign =
120 commonAlignment(It->second, OffsetFromBase.getLimitedValue());
121 return BetterLoadStoreAlign;
122 }
123 It->second = BasePointerAlign;
124 }
125 return LoadStoreAlign;
126 };
127
128 for (BasicBlock &BB : F) {
129 // We need to reset the map for each block because alignment information
130 // can only be propagated from instruction A to B if A dominates B.
131 // This is because control flow (and exception throwing) could be dependent
132 // on the address (and its alignment) at runtime. Some sort of dominator
133 // tree approach could be better, but doing a simple forward pass through a
134 // single basic block is correct too.
135 BestBasePointerAligns.clear();
136
137 for (Instruction &I : BB) {
// Callback: takes the larger of the two inferred alignments. PrefAlign is
// not used in this sweep.
139 DL, &I, [&](Value *PtrOp, Align OldAlign, Align PrefAlign) {
140 return std::max(InferFromKnownBits(I, PtrOp),
141 InferFromBasePointer(PtrOp, OldAlign));
142 });
143 }
144 }
145
146 return Changed;
147}
148
// Runs inferAlignment on F. Its boolean result is discarded and every
// analysis is reported as preserved, whether or not any alignment changed.
// NOTE(review): the lines that open this definition and presumably obtain AC
// and DT (original lines 149-152) are absent from this listing.
153 inferAlignment(F, AC, DT);
154 // Changes to alignment shouldn't invalidate analyses.
155 return PreservedAnalyses::all();
156}
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static bool tryToImproveAlign(const DataLayout &DL, Instruction *I, function_ref< Align(Value *PtrOp, Align OldAlign, Align PrefAlign)> Fn)
bool inferAlignment(Function &F, AssumptionCache &AC, DominatorTree &DT)
#define F(x, y, z)
Definition MD5.cpp:55
#define I(x, y, z)
Definition MD5.cpp:58
uint64_t IntrinsicInst * II
Class for arbitrary precision integers.
Definition APInt.h:78
uint64_t getLimitedValue(uint64_t Limit=UINT64_MAX) const
If this value is smaller than the specified limit, return it, otherwise return the limit value.
Definition APInt.h:475
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
A function analysis which provides an AssumptionCache.
A cache of @llvm.assume calls within a function.
LLVM Basic Block Representation.
Definition BasicBlock.h:62
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:63
std::pair< iterator, bool > try_emplace(KeyT &&Key, Ts &&...Args)
Definition DenseMap.h:229
Analysis pass which computes a DominatorTree.
Definition Dominators.h:284
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition Dominators.h:165
A wrapper class for inspecting calls to intrinsic functions.
A set of analyses that are preserved following a run of a transformation pass.
Definition Analysis.h:112
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition Analysis.h:118
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
Definition Type.cpp:297
LLVM Value Representation.
Definition Value.h:75
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:256
LLVM_ABI const Value * stripAndAccumulateConstantOffsets(const DataLayout &DL, APInt &Offset, bool AllowNonInbounds, bool AllowInvariantGroup=false, function_ref< bool(Value &Value, APInt &Offset)> ExternalAnalysis=nullptr, bool LookThroughIntToPtr=false) const
Accumulate the constant offset this value has compared to a base pointer.
static constexpr unsigned MaxAlignmentExponent
The maximum alignment for instructions.
Definition Value.h:829
An efficient, type-erasing, non-owning reference to a callable.
Changed
This is an optimization pass for GlobalISel generic memory operations.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:649
const Value * getLoadStorePointerOperand(const Value *V)
A helper function that returns the pointer operand of a load or store instruction.
Align getLoadStoreAlignment(const Value *I)
A helper function that returns the alignment of load or store instruction.
LLVM_ABI void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOn...
LLVM_ABI Align tryEnforceAlignment(Value *V, Align PrefAlign, const DataLayout &DL)
If the specified pointer points to an object that we control, try to modify the object's alignment to...
Definition Local.cpp:1517
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:565
Align commonAlignment(Align A, uint64_t Offset)
Returns the alignment that satisfies both alignments.
Definition Alignment.h:212
Type * getLoadStoreType(const Value *I)
A helper function that returns the type of a load or store instruction.
void setLoadStoreAlignment(Value *I, Align NewAlign)
A helper function that set the alignment of load or store instruction.
AnalysisManager< Function > FunctionAnalysisManager
Convenience typedef for the Function analysis manager.
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
uint64_t value() const
This is a hole in the type system and should not be abused.
Definition Alignment.h:85
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM)
unsigned countMinTrailingZeros() const
Returns the minimum number of trailing zero bits.
Definition KnownBits.h:242
unsigned getBitWidth() const
Get the bit width of this value.
Definition KnownBits.h:44