| //===- VPlanTransforms.h - Utility VPlan to VPlan transforms --------------===// |
| // |
| // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| // See https://llvm.org/LICENSE.txt for license information. |
| // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| // |
| //===----------------------------------------------------------------------===// |
| /// |
| /// \file |
| /// This file provides utility VPlan to VPlan transformations. |
| //===----------------------------------------------------------------------===// |
| |
| #ifndef LLVM_TRANSFORMS_VECTORIZE_VPLANTRANSFORMS_H |
| #define LLVM_TRANSFORMS_VECTORIZE_VPLANTRANSFORMS_H |
| |
| #include "VPlan.h" |
| #include "VPlanVerifier.h" |
| #include "llvm/ADT/STLFunctionalExtras.h" |
| #include "llvm/Support/CommandLine.h" |
| |
| namespace llvm { |
| |
| class InductionDescriptor; |
| class Instruction; |
| class PHINode; |
| class ScalarEvolution; |
| class PredicatedScalarEvolution; |
| class TargetLibraryInfo; |
| class VPBuilder; |
| class VPRecipeBuilder; |
| struct VFRange; |
| |
| extern cl::opt<bool> VerifyEachVPlan; |
| |
| struct VPlanTransforms { |
| /// Helper to run a VPlan transform \p Transform on \p VPlan, forwarding extra |
| /// arguments to the transform. Returns the boolean returned by the transform. |
| template <typename... ArgsTy> |
| static bool runPass(bool (*Transform)(VPlan &, ArgsTy...), VPlan &Plan, |
| typename std::remove_reference<ArgsTy>::type &...Args) { |
| bool Res = Transform(Plan, Args...); |
| if (VerifyEachVPlan) |
| verifyVPlanIsValid(Plan); |
| return Res; |
| } |
| /// Helper to run a VPlan transform \p Transform on \p VPlan, forwarding extra |
| /// arguments to the transform. |
| template <typename... ArgsTy> |
| static void runPass(void (*Fn)(VPlan &, ArgsTy...), VPlan &Plan, |
| typename std::remove_reference<ArgsTy>::type &...Args) { |
| Fn(Plan, Args...); |
| if (VerifyEachVPlan) |
| verifyVPlanIsValid(Plan); |
| } |
| |
| static std::unique_ptr<VPlan> |
| buildPlainCFG(Loop *TheLoop, LoopInfo &LI, |
| DenseMap<VPBlockBase *, BasicBlock *> &VPB2IRBB); |
| |
| /// Prepare the plan for vectorization. It will introduce a dedicated |
| /// VPBasicBlock for the vector pre-header as well as a VPBasicBlock as exit |
| /// block of the main vector loop (middle.block). If a check is needed to |
| /// guard executing the scalar epilogue loop, it will be added to the middle |
| /// block, together with VPBasicBlocks for the scalar preheader and exit |
| /// blocks. \p InductionTy is the type of the canonical induction and used for |
| /// related values, like the trip count expression. It also creates a VPValue |
| /// expression for the original trip count. |
| static void prepareForVectorization(VPlan &Plan, Type *InductionTy, |
| PredicatedScalarEvolution &PSE, |
| bool RequiresScalarEpilogueCheck, |
| bool TailFolded, Loop *TheLoop, |
| DebugLoc IVDL); |
| |
| /// Replace loops in \p Plan's flat CFG with VPRegionBlocks, turning \p Plan's |
| /// flat CFG into a hierarchical CFG. |
| static void createLoopRegions(VPlan &Plan); |
| |
| /// Replaces the VPInstructions in \p Plan with corresponding |
| /// widen recipes. Returns false if any VPInstructions could not be converted |
| /// to a wide recipe if needed. |
| static bool tryToConvertVPInstructionsToVPRecipes( |
| VPlanPtr &Plan, |
| function_ref<const InductionDescriptor *(PHINode *)> |
| GetIntOrFpInductionDescriptor, |
| ScalarEvolution &SE, const TargetLibraryInfo &TLI); |
| |
| /// Try to have all users of fixed-order recurrences appear after the recipe |
| /// defining their previous value, by either sinking users or hoisting recipes |
| /// defining their previous value (and its operands). Then introduce |
| /// FirstOrderRecurrenceSplice VPInstructions to combine the value from the |
| /// recurrence phis and previous values. |
| /// \returns true if all users of fixed-order recurrences could be re-arranged |
| /// as needed or false if it is not possible. In the latter case, \p Plan is |
| /// not valid. |
| static bool adjustFixedOrderRecurrences(VPlan &Plan, VPBuilder &Builder); |
| |
| /// Clear NSW/NUW flags from reduction instructions if necessary. |
| static void clearReductionWrapFlags(VPlan &Plan); |
| |
| /// Explicitly unroll \p Plan by \p UF. |
| static void unrollByUF(VPlan &Plan, unsigned UF, LLVMContext &Ctx); |
| |
| /// Optimize \p Plan based on \p BestVF and \p BestUF. This may restrict the |
| /// resulting plan to \p BestVF and \p BestUF. |
| static void optimizeForVFAndUF(VPlan &Plan, ElementCount BestVF, |
| unsigned BestUF, |
| PredicatedScalarEvolution &PSE); |
| |
| /// Apply VPlan-to-VPlan optimizations to \p Plan, including induction recipe |
| /// optimizations, dead recipe removal, replicate region optimizations and |
| /// block merging. |
| static void optimize(VPlan &Plan); |
| |
| /// Wrap predicated VPReplicateRecipes with a mask operand in an if-then |
| /// region block and remove the mask operand. Optimize the created regions by |
| /// iteratively sinking scalar operands into the region, followed by merging |
| /// regions until no improvements are remaining. |
| static void createAndOptimizeReplicateRegions(VPlan &Plan); |
| |
| /// Replace (ICMP_ULE, wide canonical IV, backedge-taken-count) checks with an |
| /// (active-lane-mask recipe, wide canonical IV, trip-count). If \p |
| /// UseActiveLaneMaskForControlFlow is true, introduce an |
| /// VPActiveLaneMaskPHIRecipe. If \p DataAndControlFlowWithoutRuntimeCheck is |
| /// true, no minimum-iteration runtime check will be created (during skeleton |
| /// creation) and instead it is handled using active-lane-mask. \p |
| /// DataAndControlFlowWithoutRuntimeCheck implies \p |
| /// UseActiveLaneMaskForControlFlow. |
| static void addActiveLaneMask(VPlan &Plan, |
| bool UseActiveLaneMaskForControlFlow, |
| bool DataAndControlFlowWithoutRuntimeCheck); |
| |
| /// Insert truncates and extends for any truncated recipe. Redundant casts |
| /// will be folded later. |
| static void |
| truncateToMinimalBitwidths(VPlan &Plan, |
| const MapVector<Instruction *, uint64_t> &MinBWs); |
| |
| /// Drop poison flags from recipes that may generate a poison value that is |
| /// used after vectorization, even when their operands are not poison. Those |
| /// recipes meet the following conditions: |
| /// * Contribute to the address computation of a recipe generating a widen |
| /// memory load/store (VPWidenMemoryInstructionRecipe or |
| /// VPInterleaveRecipe). |
| /// * Such a widen memory load/store has at least one underlying Instruction |
| /// that is in a basic block that needs predication and after vectorization |
| /// the generated instruction won't be predicated. |
| /// Uses \p BlockNeedsPredication to check if a block needs predicating. |
| /// TODO: Replace BlockNeedsPredication callback with retrieving info from |
| /// VPlan directly. |
| static void dropPoisonGeneratingRecipes( |
| VPlan &Plan, |
| const std::function<bool(BasicBlock *)> &BlockNeedsPredication); |
| |
| /// Add a VPEVLBasedIVPHIRecipe and related recipes to \p Plan and |
| /// replaces all uses except the canonical IV increment of |
| /// VPCanonicalIVPHIRecipe with a VPEVLBasedIVPHIRecipe. |
| /// VPCanonicalIVPHIRecipe is only used to control the loop after |
| /// this transformation. |
| /// \returns true if the transformation succeeds, or false if it doesn't. |
| static bool |
| tryAddExplicitVectorLength(VPlan &Plan, |
| const std::optional<unsigned> &MaxEVLSafeElements); |
| |
| // For each Interleave Group in \p InterleaveGroups replace the Recipes |
| // widening its memory instructions with a single VPInterleaveRecipe at its |
| // insertion point. |
| static void createInterleaveGroups( |
| VPlan &Plan, |
| const SmallPtrSetImpl<const InterleaveGroup<Instruction> *> |
| &InterleaveGroups, |
| VPRecipeBuilder &RecipeBuilder, const bool &ScalarEpilogueAllowed); |
| |
| /// Remove dead recipes from \p Plan. |
| static void removeDeadRecipes(VPlan &Plan); |
| |
| /// Update \p Plan to account for the uncountable early exit block in \p |
| /// UncountableExitingBlock by |
| /// * updating the condition exiting the vector loop to include the early |
| /// exit conditions |
| /// * splitting the original middle block to branch to the early exit block |
| /// if taken. |
| static void handleUncountableEarlyExit(VPlan &Plan, Loop *OrigLoop, |
| BasicBlock *UncountableExitingBlock, |
| VPRecipeBuilder &RecipeBuilder, |
| VFRange &Range); |
| |
| /// Lower abstract recipes to concrete ones, that can be codegen'd. Use \p |
| /// CanonicalIVTy as type for all un-typed live-ins in VPTypeAnalysis. |
| static void convertToConcreteRecipes(VPlan &Plan, Type &CanonicalIVTy); |
| |
| /// Perform instcombine-like simplifications on recipes in \p Plan. Use \p |
| /// CanonicalIVTy as type for all un-typed live-ins in VPTypeAnalysis. |
| static void simplifyRecipes(VPlan &Plan, Type &CanonicalIVTy); |
| |
| /// If there's a single exit block, optimize its phi recipes that use exiting |
| /// IV values by feeding them precomputed end values instead, possibly taken |
| /// one step backwards. |
| static void |
| optimizeInductionExitUsers(VPlan &Plan, |
| DenseMap<VPValue *, VPValue *> &EndValues); |
| |
| /// Add explicit broadcasts for live-ins and VPValues defined in \p Plan's entry block if they are used as vectors. |
| static void materializeBroadcasts(VPlan &Plan); |
| |
| /// Try to convert a plan with interleave groups with VF elements to a plan |
| /// with the interleave groups replaced by wide loads and stores processing VF |
| /// elements, if all transformed interleave groups access the full vector |
| /// width (checked via \o VectorRegWidth). This effectively is a very simple |
| /// form of loop-aware SLP, where we use interleave groups to identify |
| /// candidates. |
| static void narrowInterleaveGroups(VPlan &Plan, ElementCount VF, |
| unsigned VectorRegWidth); |
| }; |
| |
| } // namespace llvm |
| |
| #endif // LLVM_TRANSFORMS_VECTORIZE_VPLANTRANSFORMS_H |