13#ifndef LLVM_TRANSFORMS_VECTORIZE_VPLANTRANSFORMS_H
14#define LLVM_TRANSFORMS_VECTORIZE_VPLANTRANSFORMS_H
44#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
56 template <
bool EnableVerify =
true,
typename PassTy,
typename... ArgsTy>
59#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
60 auto PrintPlan = [&](
StringRef BeforeOrAfterStr) {
62 <<
"VPlan for loop in '"
64 <<
"' " << BeforeOrAfterStr <<
" " <<
PassName <<
'\n';
68 dbgs() << Plan <<
'\n';
72 return (ListOpt.getNumOccurrences() > 0 &&
83#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
95 return std::forward<PassTy>(
Pass)(Plan, std::forward<ArgsTy>(Args)...);
97#define RUN_VPLAN_PASS(PASS, ...) \
98 llvm::VPlanTransforms::runPass(#PASS, PASS, __VA_ARGS__)
99#define RUN_VPLAN_PASS_NO_VERIFY(PASS, ...) \
100 llvm::VPlanTransforms::runPass<false>(#PASS, PASS, __VA_ARGS__)
144 buildVPlan0(Loop *TheLoop, LoopInfo &LI, Type *InductionTy,
145 PredicatedScalarEvolution &PSE, LoopVersioning *LVer =
nullptr);
155 VPlan &Plan, PredicatedScalarEvolution &PSE, Loop &OrigLoop,
156 const VPDominatorTree &VPDT,
157 const MapVector<PHINode *, InductionDescriptor> &Inductions,
158 const MapVector<PHINode *, RecurrenceDescriptor> &
Reductions,
159 const SmallPtrSetImpl<const PHINode *> &FixedOrderRecurrences,
160 const SmallPtrSetImpl<PHINode *> &InLoopReductions,
bool AllowReordering);
169 bool OptForSize,
unsigned SCEVCheckThreshold,
170 OptimizationRemarkEmitter *ORE, Loop *TheLoop);
183 PredicatedScalarEvolution &PSE, DominatorTree &DT,
184 AssumptionCache *AC);
193 VPlan &Plan, ElementCount VF,
unsigned UF,
194 ElementCount MinProfitableTripCount,
bool RequiresScalarEpilogue,
196 DebugLoc DL, PredicatedScalarEvolution &PSE, VPBasicBlock *CheckBlock);
202 bool RequiresScalarEpilogue, Loop *OrigLoop,
209 VPlan &Plan, Value *VectorTripCount,
bool RequiresScalarEpilogue,
210 ElementCount EpilogueVF,
unsigned EpilogueUF,
unsigned MainLoopStep,
211 unsigned EpilogueLoopStep, ScalarEvolution &SE);
223 VPBasicBlock *CheckBlock,
224 bool AddBranchWeights);
226 bool AddBranchWeights);
233 const TargetLibraryInfo &TLI);
240 OptimizationRemarkEmitter *ORE,
260 static void unrollByUF(VPlan &Plan,
unsigned UF);
273 PredicatedScalarEvolution &PSE);
278 PredicatedScalarEvolution &PSE);
300 bool UseActiveLaneMaskForControlFlow);
306 const MapVector<Instruction *, uint64_t> &MinBWs);
312 const DenseMap<Value *, const SCEV *> &StridesMap,
313 const VPDominatorTree &VPDT);
330 const std::optional<unsigned> &MaxEVLSafeElements);
346 const SmallPtrSetImpl<
const InterleaveGroup<Instruction> *>
348 const bool &EpilogueAllowed);
354 PredicatedScalarEvolution &PSE, Loop &L,
355 VPCostContext &Ctx, VFRange &
Range);
365 VPlan &Plan, VPBasicBlock *HeaderVPBB, VPBasicBlock *LatchVPBB,
366 VPBasicBlock *MiddleVPBB, Loop *TheLoop, PredicatedScalarEvolution &PSE,
414 static void cse(VPlan &Plan);
420 PredicatedScalarEvolution &PSE,
444 PredicatedScalarEvolution &PSE);
451 VPlan &Plan, VPBasicBlock *VectorPHVPBB,
bool TailByMasking,
452 bool RequiresScalarEpilogue, VPValue *Step,
453 std::optional<uint64_t> MaxRuntimeStep = std::nullopt);
458 VPBasicBlock *VectorPH);
476 VPBasicBlock *AliasCheckVPBB,
494 static DenseMap<const SCEV *, Value *>
expandSCEVs(VPlan &Plan,
495 ScalarEvolution &SE);
509 static std::unique_ptr<VPlan>
555 VPlan &Plan, ScalarEvolution &SE,
const TargetTransformInfo &
TTI,
557 unsigned UF,
const SmallPtrSetImpl<const Value *> &ValuesToIgnore);
563 std::optional<unsigned> VScaleForTuning);
576 PredicatedScalarEvolution &PSE, Loop &L);
587 VPRecipeBuilder &RecipeBuilder);
597 VPRecipeBuilder &RecipeBuilder,
598 VPCostContext &CostCtx);
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
#define LLVM_ABI_FOR_TEST
static cl::opt< OutputCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(OutputCostKind::RecipThroughput), cl::values(clEnumValN(OutputCostKind::RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(OutputCostKind::Latency, "latency", "Instruction latency"), clEnumValN(OutputCostKind::CodeSize, "code-size", "Code size"), clEnumValN(OutputCostKind::SizeAndLatency, "size-latency", "Code size and latency"), clEnumValN(OutputCostKind::All, "all", "Print all cost kinds")))
static constexpr uint32_t MinItersBypassWeights[]
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))
const SmallVectorImpl< MachineOperand > & Cond
This file defines the make_scope_exit function, which executes user-defined cleanup logic at scope ex...
This file declares the class VPlanVerifier, which contains utility functions to check the consistency...
This file contains the declarations of the Vectorization Plan base classes:
static const char PassName[]
const Function * getParent() const
Return the enclosing method, or null if none.
A struct for saving information about induction variables.
This class emits a version of the loop where run-time checks ensure that may-alias pointers can't ove...
Represents a single loop in the control flow graph.
Pass interface - Implemented by all 'passes'.
An interface layer with SCEV used to manage how we see SCEV expressions for values in the context of ...
LLVM_ABI bool match(StringRef String, SmallVectorImpl< StringRef > *Matches=nullptr, std::string *Error=nullptr) const
matches - Match the regex against a given String.
The main scalar evolution driver.
Represent a constant reference to a string, i.e.
Provides information about what library functions are available for the current target.
VPlan-based builder utility analogous to IRBuilder.
BasicBlock * getIRBasicBlock() const
Helper class to create VPRecipies from IR instructions.
void print(raw_ostream &O, const Twine &Indent, VPSlotTracker &SlotTracker) const override
Print this VPRegionBlock to O (recursively), prefixing all lines with Indent.
VPlan models a candidate for vectorization, encoding various decisions take to produce efficient outp...
LLVM_ABI_FOR_TEST VPRegionBlock * getVectorLoopRegion()
Returns the VPRegionBlock of the vector loop.
VPIRBasicBlock * getScalarHeader() const
Return the VPIRBasicBlock wrapping the header of the scalar loop.
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
This is an optimization pass for GlobalISel generic memory operations.
LLVM_ABI_FOR_TEST cl::opt< bool > VerifyEachVPlan
LLVM_ABI_FOR_TEST cl::opt< bool > VPlanPrintAfterAll
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI_FOR_TEST cl::opt< bool > EnableWideActiveLaneMask
UncountableExitStyle
Different methods of handling early exits.
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
LLVM_ABI_FOR_TEST cl::list< std::string > VPlanPrintAfterPasses
LLVM_ABI_FOR_TEST cl::list< std::string > VPlanPrintBeforePasses
ArrayRef(const T &OneElt) -> ArrayRef< T >
LLVM_ABI_FOR_TEST cl::opt< bool > VPlanPrintBeforeAll
LLVM_ABI_FOR_TEST bool verifyVPlanIsValid(const VPlan &Plan)
Verify invariants for general VPlans.
LLVM_ABI_FOR_TEST cl::opt< bool > VPlanPrintVectorRegionScope
A range of powers-of-2 vectorization factors with fixed start and adjustable end.