LLVM 20.0.0git
VPRecipeBuilder.h
Go to the documentation of this file.
1//===- VPRecipeBuilder.h - Helper class to build recipes --------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
9#ifndef LLVM_TRANSFORMS_VECTORIZE_VPRECIPEBUILDER_H
10#define LLVM_TRANSFORMS_VECTORIZE_VPRECIPEBUILDER_H
11
13#include "VPlan.h"
14#include "llvm/ADT/DenseMap.h"
17#include "llvm/IR/IRBuilder.h"
18
19namespace llvm {
20
21class LoopVectorizationLegality;
22class LoopVectorizationCostModel;
23class TargetLibraryInfo;
24class TargetTransformInfo;
25struct HistogramInfo;
26
27/// A chain of instructions that form a partial reduction.
28/// Designed to match: reduction_bin_op (bin_op (extend (A), (extend (B))),
29/// accumulator).
34 }
35 /// The top-level binary operation that forms the reduction to a scalar
36 /// after the loop body.
38 /// The extension of each of the inner binary operation's operands.
41
42 /// The binary operation using the extends that is then reduced.
44};
45
46/// Helper class to create VPRecipies from IR instructions.
48 /// The VPlan new recipes are added to.
49 VPlan &Plan;
50
51 /// The loop that we evaluate.
52 Loop *OrigLoop;
53
54 /// Target Library Info.
55 const TargetLibraryInfo *TLI;
56
57 // Target Transform Info.
59
60 /// The legality analysis.
62
63 /// The profitablity analysis.
65
67
68 VPBuilder &Builder;
69
70 /// When we if-convert we need to create edge masks. We have to cache values
71 /// so that we don't end up with exponential recursion/IR. Note that
72 /// if-conversion currently takes place during VPlan-construction, so these
73 /// caches are only used at that stage.
74 using EdgeMaskCacheTy =
77 EdgeMaskCacheTy EdgeMaskCache;
78 BlockMaskCacheTy BlockMaskCache;
79
80 // VPlan construction support: Hold a mapping from ingredients to
81 // their recipe.
83
84 /// Cross-iteration reduction & first-order recurrence phis for which we need
85 /// to add the incoming value from the backedge after all recipes have been
86 /// created.
88
89 /// A mapping of partial reduction exit instructions to their scaling factor.
91
92 /// Check if \p I can be widened at the start of \p Range and possibly
93 /// decrease the range such that the returned value holds for the entire \p
94 /// Range. The function should not be called for memory instructions or calls.
95 bool shouldWiden(Instruction *I, VFRange &Range) const;
96
97 /// Check if the load or store instruction \p I should widened for \p
98 /// Range.Start and potentially masked. Such instructions are handled by a
99 /// recipe that takes an additional VPInstruction for the mask.
100 VPWidenMemoryRecipe *tryToWidenMemory(Instruction *I,
102 VFRange &Range);
103
104 /// Check if an induction recipe should be constructed for \p Phi. If so build
105 /// and return it. If not, return null.
106 VPHeaderPHIRecipe *tryToOptimizeInductionPHI(PHINode *Phi,
108 VFRange &Range);
109
110 /// Optimize the special case where the operand of \p I is a constant integer
111 /// induction variable.
113 tryToOptimizeInductionTruncate(TruncInst *I, ArrayRef<VPValue *> Operands,
114 VFRange &Range);
115
116 /// Handle non-loop phi nodes. Return a new VPBlendRecipe otherwise. Currently
117 /// all such phi nodes are turned into a sequence of select instructions as
118 /// the vectorizer currently performs full if-conversion.
120
121 /// Handle call instructions. If \p CI can be widened for \p Range.Start,
122 /// return a new VPWidenCallRecipe or VPWidenIntrinsicRecipe. Range.End may be
123 /// decreased to ensure same decision from \p Range.Start to \p Range.End.
125 VFRange &Range);
126
127 /// Check if \p I has an opcode that can be widened and return a VPWidenRecipe
128 /// if it can. The function should only be called if the cost-model indicates
129 /// that widening should be performed.
131 VPBasicBlock *VPBB);
132
133 /// Makes Histogram count operations safe for vectorization, by emitting a
134 /// llvm.experimental.vector.histogram.add intrinsic in place of the
135 /// Load + Add|Sub + Store operations that perform the histogram in the
136 /// original scalar loop.
137 VPHistogramRecipe *tryToWidenHistogram(const HistogramInfo *HI,
139
140 /// Examines reduction operations to see if the target can use a cheaper
141 /// operation with a wider per-iteration input VF and narrower PHI VF.
142 /// Returns null if no scaled reduction was found, otherwise a pair with a
143 /// struct containing reduction information and the scaling factor between the
144 /// number of elements in the input and output.
145 std::optional<std::pair<PartialReductionChain, unsigned>>
146 getScaledReduction(PHINode *PHI, const RecurrenceDescriptor &Rdx,
147 VFRange &Range);
148
149public:
150 VPRecipeBuilder(VPlan &Plan, Loop *OrigLoop, const TargetLibraryInfo *TLI,
155 : Plan(Plan), OrigLoop(OrigLoop), TLI(TLI), TTI(TTI), Legal(Legal),
156 CM(CM), PSE(PSE), Builder(Builder) {}
157
158 std::optional<unsigned> getScalingForReduction(const Instruction *ExitInst) {
159 auto It = ScaledReductionMap.find(ExitInst);
160 return It == ScaledReductionMap.end() ? std::nullopt
161 : std::make_optional(It->second);
162 }
163
164 /// Find all possible partial reductions in the loop and track all of those
165 /// that are valid so recipes can be formed later.
167
168 /// Create and return a widened recipe for \p I if one can be created within
169 /// the given VF \p Range.
172 VFRange &Range, VPBasicBlock *VPBB);
173
174 /// Create and return a partial reduction recipe for a reduction instruction
175 /// along with binary operation and reduction phi operands.
178
179 /// Set the recipe created for given ingredient.
181 assert(!Ingredient2Recipe.contains(I) &&
182 "Cannot reset recipe for instruction.");
183 Ingredient2Recipe[I] = R;
184 }
185
186 /// Create the mask for the vector loop header block.
187 void createHeaderMask();
188
189 /// A helper function that computes the predicate of the block BB, assuming
190 /// that the header block of the loop is set to True or the loop mask when
191 /// tail folding.
193
194 /// Returns the *entry* mask for the block \p BB.
196
197 /// Create an edge mask for every destination of cases and/or default.
199
200 /// A helper function that computes the predicate of the edge between SRC
201 /// and DST.
203
204 /// A helper that returns the previously computed predicate of the edge
205 /// between SRC and DST.
206 VPValue *getEdgeMask(BasicBlock *Src, BasicBlock *Dst) const;
207
208 /// Return the recipe created for given ingredient.
210 assert(Ingredient2Recipe.count(I) &&
211 "Recording this ingredients recipe was not requested");
212 assert(Ingredient2Recipe[I] != nullptr &&
213 "Ingredient doesn't have a recipe");
214 return Ingredient2Recipe[I];
215 }
216
217 /// Build a VPReplicationRecipe for \p I. If it is predicated, add the mask as
218 /// last operand. Range.End may be decreased to ensure same recipe behavior
219 /// from \p Range.Start to \p Range.End.
221
222 /// Add the incoming values from the backedge to reduction & first-order
223 /// recurrence cross-iteration phis.
224 void fixHeaderPhis();
225
226 /// Returns a range mapping the values of the range \p Operands to their
227 /// corresponding VPValues.
228 iterator_range<mapped_iterator<Use *, std::function<VPValue *(Value *)>>>
230
232 if (auto *I = dyn_cast<Instruction>(V)) {
233 if (auto *R = Ingredient2Recipe.lookup(I))
234 return R->getVPSingleValue();
235 }
236 return Plan.getOrAddLiveIn(V);
237 }
238};
239} // end namespace llvm
240
241#endif // LLVM_TRANSFORMS_VECTORIZE_VPRECIPEBUILDER_H
Rewrite undef for PHI
This file defines the DenseMap class.
This file provides a LoopVectorizationPlanner class.
#define I(x, y, z)
Definition: MD5.cpp:58
mir Rename Register Operands
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))
This file defines the PointerUnion class, which is a discriminated union of pointer types.
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
This file contains the declarations of the Vectorization Plan base classes:
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41
LLVM Basic Block Representation.
Definition: BasicBlock.h:61
This class represents a function call, abstracting a target machine's calling convention.
ValueT lookup(const_arg_type_t< KeyT > Val) const
lookup - Return the entry for the specified key, or a default constructed value if no such entry exis...
Definition: DenseMap.h:194
iterator find(const_arg_type_t< KeyT > Val)
Definition: DenseMap.h:156
size_type count(const_arg_type_t< KeyT > Val) const
Return 1 if the specified key is in the map, 0 otherwise.
Definition: DenseMap.h:152
iterator end()
Definition: DenseMap.h:84
bool contains(const_arg_type_t< KeyT > Val) const
Return true if the specified key is in the map, false otherwise.
Definition: DenseMap.h:147
LoopVectorizationCostModel - estimates the expected speedups due to vectorization.
LoopVectorizationLegality checks if it is legal to vectorize a loop, and to what vectorization factor...
Represents a single loop in the control flow graph.
Definition: LoopInfo.h:39
An interface layer with SCEV used to manage how we see SCEV expressions for values in the context of ...
The RecurrenceDescriptor is used to identify recurrences variables in a loop.
Definition: IVDescriptors.h:77
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1196
Multiway switch.
Provides information about what library functions are available for the current target.
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
This class represents a truncation of integer types.
A Use represents the edge between a Value definition and its users.
Definition: Use.h:43
VPBasicBlock serves as the leaf of the Hierarchical Control-Flow Graph.
Definition: VPlan.h:3536
A recipe for vectorizing a phi-node as a sequence of mask-based select instructions.
Definition: VPlan.h:2494
VPlan-based builder utility analogous to IRBuilder.
A pure virtual base class for all recipes modeling header phis, including phis for first order recurr...
Definition: VPlan.h:2033
A recipe representing a sequence of load -> update -> store as part of a histogram operation.
Definition: VPlan.h:1783
VPRecipeBase is a base class modeling a sequence of one or more output IR instructions.
Definition: VPlan.h:716
Helper class to create VPRecipies from IR instructions.
VPRecipeBase * tryToCreatePartialReduction(Instruction *Reduction, ArrayRef< VPValue * > Operands)
Create and return a partial reduction recipe for a reduction instruction along with binary operation ...
VPValue * createEdgeMask(BasicBlock *Src, BasicBlock *Dst)
A helper function that computes the predicate of the edge between SRC and DST.
VPReplicateRecipe * handleReplication(Instruction *I, VFRange &Range)
Build a VPReplicationRecipe for I.
void createSwitchEdgeMasks(SwitchInst *SI)
Create an edge mask for every destination of cases and/or default.
VPValue * getBlockInMask(BasicBlock *BB) const
Returns the entry mask for the block BB.
VPValue * getEdgeMask(BasicBlock *Src, BasicBlock *Dst) const
A helper that returns the previously computed predicate of the edge between SRC and DST.
iterator_range< mapped_iterator< Use *, std::function< VPValue *(Value *)> > > mapToVPValues(User::op_range Operands)
Returns a range mapping the values of the range Operands to their corresponding VPValues.
void fixHeaderPhis()
Add the incoming values from the backedge to reduction & first-order recurrence cross-iteration phis.
VPRecipeBase * tryToCreateWidenRecipe(Instruction *Instr, ArrayRef< VPValue * > Operands, VFRange &Range, VPBasicBlock *VPBB)
Create and return a widened recipe for I if one can be created within the given VF Range.
VPValue * getVPValueOrAddLiveIn(Value *V)
void createHeaderMask()
Create the mask for the vector loop header block.
std::optional< unsigned > getScalingForReduction(const Instruction *ExitInst)
void createBlockInMask(BasicBlock *BB)
A helper function that computes the predicate of the block BB, assuming that the header block of the ...
void collectScaledReductions(VFRange &Range)
Find all possible partial reductions in the loop and track all of those that are valid so recipes can...
void setRecipe(Instruction *I, VPRecipeBase *R)
Set the recipe created for given ingredient.
VPRecipeBase * getRecipe(Instruction *I)
Return the recipe created for given ingredient.
VPRecipeBuilder(VPlan &Plan, Loop *OrigLoop, const TargetLibraryInfo *TLI, const TargetTransformInfo *TTI, LoopVectorizationLegality *Legal, LoopVectorizationCostModel &CM, PredicatedScalarEvolution &PSE, VPBuilder &Builder)
VPReplicateRecipe replicates a given instruction producing multiple scalar copies of the original sca...
Definition: VPlan.h:2777
VPSingleDef is a base class for recipes for modeling a sequence of one or more output IR that define ...
Definition: VPlan.h:843
A recipe for handling phi nodes of integer and floating-point inductions, producing their vector valu...
Definition: VPlan.h:2148
A common base class for widening memory operations.
Definition: VPlan.h:2950
VPWidenRecipe is a recipe for producing a widened instruction using the opcode and operands of the re...
Definition: VPlan.h:1437
VPlan models a candidate for vectorization, encoding various decisions take to produce efficient outp...
Definition: VPlan.h:3812
VPValue * getOrAddLiveIn(Value *V)
Gets the live-in VPValue for V or adds a new live-in (if none exists yet) for V.
Definition: VPlan.h:4036
LLVM Value Representation.
Definition: Value.h:74
A range adaptor for a pair of iterators.
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
This holds details about a histogram operation – a load -> update -> store sequence where each lane i...
A chain of instructions that form a partial reduction.
Instruction * BinOp
The binary operation using the extends that is then reduced.
PartialReductionChain(Instruction *Reduction, Instruction *ExtendA, Instruction *ExtendB, Instruction *BinOp)
Instruction * Reduction
The top-level binary operation that forms the reduction to a scalar after the loop body.
Instruction * ExtendA
The extension of each of the inner binary operation's operands.
A range of powers-of-2 vectorization factors with fixed start and adjustable end.
Definition: VPlan.h:97