LLVM 22.0.0git
InferAlignment.cpp
Go to the documentation of this file.
1//===- InferAlignment.cpp -------------------------------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// Infer alignment for loads, stores and other memory operations based on
10// trailing zero known bits information.
11//
12//===----------------------------------------------------------------------===//
13
22
23using namespace llvm;
24
// Parameter list and body of the per-instruction helper. The line that opens
// this definition (listing line 25) is missing from this extract; the
// cross-reference list further down gives it as
// `static bool tryToImproveAlign(`.
//
// For a load/store, or a masked_load/masked_store intrinsic call, this asks
// Fn for an alignment given the pointer operand, the alignment currently
// recorded on the instruction, and the preferred alignment of the accessed
// type. If Fn's answer is strictly greater than the recorded alignment, the
// instruction is updated in place and true is returned; otherwise false.
26 const DataLayout &DL, Instruction *I,
27 function_ref<Align(Value *PtrOp, Align OldAlign, Align PrefAlign)> Fn) {
28
// Case 1: I is something getLoadStorePointerOperand() yields a pointer for.
29 if (auto *PtrOp = getLoadStorePointerOperand(I)) {
30 Align OldAlign = getLoadStoreAlignment(I);
31 Align PrefAlign = DL.getPrefTypeAlign(getLoadStoreType(I));
32
33 Align NewAlign = Fn(PtrOp, OldAlign, PrefAlign);
// Only ever raise the alignment. When there is no improvement, control
// falls out of this `if` and continues with the intrinsic check below.
34 if (NewAlign > OldAlign) {
35 setLoadStoreAlignment(I, NewAlign);
36 return true;
37 }
38 }
39
// NOTE(review): the declaration of II (listing line 40) is missing from this
// extract -- presumably a dyn_cast<IntrinsicInst> of I; confirm against the
// real file.
41 if (!II)
42 return false;
43
44 // TODO: Handle more memory intrinsics.
45 switch (II->getIntrinsicID()) {
46 case Intrinsic::masked_load:
47 case Intrinsic::masked_store: {
// Operand positions as used below:
//   masked_load : pointer = arg 0, alignment = arg 1, accessed type = result
//   masked_store: value   = arg 0, pointer = arg 1, alignment = arg 2
48 int AlignOpIdx = II->getIntrinsicID() == Intrinsic::masked_load ? 1 : 2;
49 Value *PtrOp = II->getIntrinsicID() == Intrinsic::masked_load
50 ? II->getArgOperand(0)
51 : II->getArgOperand(1);
52 Type *Type = II->getIntrinsicID() == Intrinsic::masked_load
53 ? II->getType()
54 : II->getArgOperand(0)->getType();
55
// The current alignment is read from the constant-integer alignment operand
// (cast<> asserts that it is a ConstantInt).
56 Align OldAlign =
57 cast<ConstantInt>(II->getArgOperand(AlignOpIdx))->getAlignValue();
58 Align PrefAlign = DL.getPrefTypeAlign(Type);
59 Align NewAlign = Fn(PtrOp, OldAlign, PrefAlign);
60 if (NewAlign <= OldAlign)
61 return false;
62
// Write the improved alignment back as an i32 constant operand. The local
// variable `Type` hides the class name here, but lookup of the name before
// `::` ignores variables, so `Type::getInt32Ty` still names the class member.
63 Value *V =
64 ConstantInt::get(Type::getInt32Ty(II->getContext()), NewAlign.value());
65 II->setOperand(AlignOpIdx, V);
66 return true;
67 }
68 default:
69 return false;
70 }
71}
72
// Body of the function-level driver. The signature (listing line 73) is
// missing from this extract; the cross-reference list further down gives it
// as `bool inferAlignment(Function &F, AssumptionCache &AC, DominatorTree &DT)`.
//
// Two sweeps over every instruction of F:
//   1. try to enforce the preferred type alignment on the pointed-to object;
//   2. infer alignment from known bits and from other accesses to the same
//      base pointer within the same basic block.
// Returns Changed.
74 const DataLayout &DL = F.getDataLayout();
75 bool Changed = false;
76
77 // Enforce preferred type alignment if possible. We do this as a separate
78 // pass first, because it may improve the alignments we infer below.
79 for (BasicBlock &BB : F) {
80 for (Instruction &I : BB) {
// NOTE(review): the head of this call (listing line 81) is missing from this
// extract -- presumably `Changed |= tryToImproveAlign(`; confirm against the
// real file. The lambda only calls tryEnforceAlignment() when the preferred
// alignment exceeds the current one, and never returns less than OldAlign.
82 DL, &I, [&](Value *PtrOp, Align OldAlign, Align PrefAlign) {
83 if (PrefAlign > OldAlign)
84 return std::max(OldAlign,
85 tryEnforceAlignment(PtrOp, PrefAlign, DL));
86 return OldAlign;
87 });
88 }
89 }
90
91 // Compute alignment from known bits.
// NOTE(review): the initializer of TrailZ (listing line 95) is missing from
// this extract; the cross-reference list mentions countMinTrailingZeros() and
// Value::MaxAlignmentExponent, which it presumably combines -- confirm.
// The returned alignment is 2^min(BitWidth - 1, TrailZ), so the shift amount
// never reaches the known-bits width.
92 auto InferFromKnownBits = [&](Instruction &I, Value *PtrOp) {
93 KnownBits Known = computeKnownBits(PtrOp, DL, &AC, &I, &DT);
94 unsigned TrailZ =
96 return Align(1ull << std::min(Known.getBitWidth() - 1, TrailZ));
97 };
98
99 // Propagate alignment between loads and stores that originate from the
100 // same base pointer.
// BestBasePointerAligns maps a base pointer (PtrOp with constant offsets
// stripped) to the best alignment derived for it so far.
101 DenseMap<Value *, Align> BestBasePointerAligns;
102 auto InferFromBasePointer = [&](Value *PtrOp, Align LoadStoreAlign) {
// OffsetFromBase is sized to the index type of the pointer and receives the
// accumulated constant offset; PtrOp is rebound to the stripped base.
103 APInt OffsetFromBase(DL.getIndexTypeSizeInBits(PtrOp->getType()), 0);
104 PtrOp = PtrOp->stripAndAccumulateConstantOffsets(DL, OffsetFromBase, true);
105 // Derive the base pointer alignment from the load/store alignment
106 // and the offset from the base pointer.
107 Align BasePointerAlign =
108 commonAlignment(LoadStoreAlign, OffsetFromBase.getLimitedValue());
109
// try_emplace only inserts when the base has not been seen yet; in that case
// there is nothing to learn from the map and LoadStoreAlign is returned as is.
110 auto [It, Inserted] =
111 BestBasePointerAligns.try_emplace(PtrOp, BasePointerAlign);
112 if (!Inserted) {
113 // If the stored base pointer alignment is better than the
114 // base pointer alignment we derived, we may be able to use it
115 // to improve the load/store alignment. If not, store the
116 // improved base pointer alignment for future iterations.
117 if (It->second > BasePointerAlign) {
118 Align BetterLoadStoreAlign =
119 commonAlignment(It->second, OffsetFromBase.getLimitedValue());
120 return BetterLoadStoreAlign;
121 }
122 It->second = BasePointerAlign;
123 }
124 return LoadStoreAlign;
125 };
126
127 for (BasicBlock &BB : F) {
128 // We need to reset the map for each block because alignment information
129 // can only be propagated from instruction A to B if A dominates B.
130 // This is because control flow (and exception throwing) could be dependent
131 // on the address (and its alignment) at runtime. Some sort of dominator
132 // tree approach could be better, but doing a simple forward pass through a
133 // single basic block is correct too.
134 BestBasePointerAligns.clear();
135
136 for (Instruction &I : BB) {
// NOTE(review): the head of this call (listing line 137) is missing from this
// extract -- presumably `Changed |= tryToImproveAlign(`; confirm against the
// real file. The lambda takes the larger of the two inferred alignments;
// PrefAlign is unused in this sweep.
138 DL, &I, [&](Value *PtrOp, Align OldAlign, Align PrefAlign) {
139 return std::max(InferFromKnownBits(I, PtrOp),
140 InferFromBasePointer(PtrOp, OldAlign));
141 });
142 }
143 }
144
145 return Changed;
146}
147
// Tail of the pass entry point. Listing lines 148-151 (the signature and
// whatever defines AC and DT) are missing from this extract; the
// cross-reference list further down gives the signature as
// `PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM)`.
// The bool returned by inferAlignment() is not inspected here: all analyses
// are reported as preserved whether or not anything changed.
152 inferAlignment(F, AC, DT);
153 // Changes to alignment shouldn't invalidate analyses.
154 return PreservedAnalyses::all();
155}
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static bool tryToImproveAlign(const DataLayout &DL, Instruction *I, function_ref< Align(Value *PtrOp, Align OldAlign, Align PrefAlign)> Fn)
bool inferAlignment(Function &F, AssumptionCache &AC, DominatorTree &DT)
#define F(x, y, z)
Definition MD5.cpp:55
#define I(x, y, z)
Definition MD5.cpp:58
uint64_t IntrinsicInst * II
Class for arbitrary precision integers.
Definition APInt.h:78
uint64_t getLimitedValue(uint64_t Limit=UINT64_MAX) const
If this value is smaller than the specified limit, return it, otherwise return the limit value.
Definition APInt.h:475
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
A function analysis which provides an AssumptionCache.
A cache of @llvm.assume calls within a function.
LLVM Basic Block Representation.
Definition BasicBlock.h:62
A parsed version of the target data layout string, and methods for querying it.
Definition DataLayout.h:63
std::pair< iterator, bool > try_emplace(KeyT &&Key, Ts &&...Args)
Definition DenseMap.h:229
Analysis pass which computes a DominatorTree.
Definition Dominators.h:284
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition Dominators.h:165
A wrapper class for inspecting calls to intrinsic functions.
A set of analyses that are preserved following a run of a transformation pass.
Definition Analysis.h:112
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition Analysis.h:118
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
Definition Type.cpp:297
LLVM Value Representation.
Definition Value.h:75
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:256
LLVM_ABI const Value * stripAndAccumulateConstantOffsets(const DataLayout &DL, APInt &Offset, bool AllowNonInbounds, bool AllowInvariantGroup=false, function_ref< bool(Value &Value, APInt &Offset)> ExternalAnalysis=nullptr, bool LookThroughIntToPtr=false) const
Accumulate the constant offset this value has compared to a base pointer.
static constexpr unsigned MaxAlignmentExponent
The maximum alignment for instructions.
Definition Value.h:829
An efficient, type-erasing, non-owning reference to a callable.
Changed
This is an optimization pass for GlobalISel generic memory operations.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:649
const Value * getLoadStorePointerOperand(const Value *V)
A helper function that returns the pointer operand of a load or store instruction.
Align getLoadStoreAlignment(const Value *I)
A helper function that returns the alignment of a load or store instruction.
LLVM_ABI void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOne bit sets.
LLVM_ABI Align tryEnforceAlignment(Value *V, Align PrefAlign, const DataLayout &DL)
If the specified pointer points to an object that we control, try to modify the object's alignment to PrefAlign.
Definition Local.cpp:1517
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:565
Align commonAlignment(Align A, uint64_t Offset)
Returns the alignment that satisfies both alignments.
Definition Alignment.h:212
Type * getLoadStoreType(const Value *I)
A helper function that returns the type of a load or store instruction.
void setLoadStoreAlignment(Value *I, Align NewAlign)
A helper function that sets the alignment of a load or store instruction.
AnalysisManager< Function > FunctionAnalysisManager
Convenience typedef for the Function analysis manager.
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
uint64_t value() const
This is a hole in the type system and should not be abused.
Definition Alignment.h:85
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM)
unsigned countMinTrailingZeros() const
Returns the minimum number of trailing zero bits.
Definition KnownBits.h:235
unsigned getBitWidth() const
Get the bit width of this value.
Definition KnownBits.h:44