//===- InlineCost.h - Cost analysis for inliner -----------------*- C++ -*-===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // This file implements heuristics for inlining decisions. // //===----------------------------------------------------------------------===// #ifndef LLVM_ANALYSIS_INLINECOST_H #define LLVM_ANALYSIS_INLINECOST_H #include "llvm/Analysis/AssumptionCache.h" #include "llvm/Analysis/CallGraphSCCPass.h" #include "llvm/Analysis/OptimizationRemarkEmitter.h" #include #include namespace llvm { class AssumptionCacheTracker; class BlockFrequencyInfo; class CallBase; class DataLayout; class Function; class ProfileSummaryInfo; class TargetTransformInfo; class TargetLibraryInfo; namespace InlineConstants { // Various thresholds used by inline cost analysis. /// Use when optsize (-Os) is specified. const int OptSizeThreshold = 50; /// Use when minsize (-Oz) is specified. const int OptMinSizeThreshold = 5; /// Use when -O3 is specified. const int OptAggressiveThreshold = 250; // Various magic constants used to adjust heuristics. const int InstrCost = 5; const int IndirectCallThreshold = 100; const int CallPenalty = 25; const int LastCallToStaticBonus = 15000; const int ColdccPenalty = 2000; /// Do not inline functions which allocate this many bytes on the stack /// when the caller is recursive. const unsigned TotalAllocaSizeRecursiveCaller = 1024; /// Do not inline dynamic allocas that have been constant propagated to be /// static allocas above this amount in bytes. const uint64_t MaxSimplifiedDynamicAllocaToInline = 65536; } // namespace InlineConstants /// Represents the cost of inlining a function. /// /// This supports special values for functions which should "always" or /// "never" be inlined. Otherwise, the cost represents a unitless amount; /// smaller values increase the likelihood of the function being inlined. /// /// Objects of this type also provide the adjusted threshold for inlining /// based on the information available for a particular callsite. They can be /// directly tested to determine if inlining should occur given the cost and /// threshold for this cost metric. class InlineCost { enum SentinelValues { AlwaysInlineCost = INT_MIN, NeverInlineCost = INT_MAX }; /// The estimated cost of inlining this callsite. int Cost = 0; /// The adjusted threshold against which this cost was computed. int Threshold = 0; /// Must be set for Always and Never instances. const char *Reason = nullptr; // Trivial constructor, interesting logic in the factory functions below. InlineCost(int Cost, int Threshold, const char *Reason = nullptr) : Cost(Cost), Threshold(Threshold), Reason(Reason) { assert((isVariable() || Reason) && "Reason must be provided for Never or Always"); } public: static InlineCost get(int Cost, int Threshold) { assert(Cost > AlwaysInlineCost && "Cost crosses sentinel value"); assert(Cost < NeverInlineCost && "Cost crosses sentinel value"); return InlineCost(Cost, Threshold); } static InlineCost getAlways(const char *Reason) { return InlineCost(AlwaysInlineCost, 0, Reason); } static InlineCost getNever(const char *Reason) { return InlineCost(NeverInlineCost, 0, Reason); } /// Test whether the inline cost is low enough for inlining. explicit operator bool() const { return Cost < Threshold; } bool isAlways() const { return Cost == AlwaysInlineCost; } bool isNever() const { return Cost == NeverInlineCost; } bool isVariable() const { return !isAlways() && !isNever(); } /// Get the inline cost estimate. /// It is an error to call this on an "always" or "never" InlineCost. int getCost() const { assert(isVariable() && "Invalid access of InlineCost"); return Cost; } /// Get the threshold against which the cost was computed int getThreshold() const { assert(isVariable() && "Invalid access of InlineCost"); return Threshold; } /// Get the reason of Always or Never. const char *getReason() const { assert((Reason || isVariable()) && "InlineCost reason must be set for Always or Never"); return Reason; } /// Get the cost delta from the threshold for inlining. /// Only valid if the cost is of the variable kind. Returns a negative /// value if the cost is too high to inline. int getCostDelta() const { return Threshold - getCost(); } }; /// InlineResult is basically true or false. For false results the message /// describes a reason. class InlineResult { const char *Message = nullptr; InlineResult(const char *Message = nullptr) : Message(Message) {} public: static InlineResult success() { return {}; } static InlineResult failure(const char *Reason) { return InlineResult(Reason); } bool isSuccess() const { return Message == nullptr; } const char *getFailureReason() const { assert(!isSuccess() && "getFailureReason should only be called in failure cases"); return Message; } }; /// Thresholds to tune inline cost analysis. The inline cost analysis decides /// the condition to apply a threshold and applies it. Otherwise, /// DefaultThreshold is used. If a threshold is Optional, it is applied only /// when it has a valid value. Typically, users of inline cost analysis /// obtain an InlineParams object through one of the \c getInlineParams methods /// and pass it to \c getInlineCost. Some specialized versions of inliner /// (such as the pre-inliner) might have custom logic to compute \c InlineParams /// object. struct InlineParams { /// The default threshold to start with for a callee. int DefaultThreshold = -1; /// Threshold to use for callees with inline hint. Optional HintThreshold; /// Threshold to use for cold callees. Optional ColdThreshold; /// Threshold to use when the caller is optimized for size. Optional OptSizeThreshold; /// Threshold to use when the caller is optimized for minsize. Optional OptMinSizeThreshold; /// Threshold to use when the callsite is considered hot. Optional HotCallSiteThreshold; /// Threshold to use when the callsite is considered hot relative to function /// entry. Optional LocallyHotCallSiteThreshold; /// Threshold to use when the callsite is considered cold. Optional ColdCallSiteThreshold; /// Compute inline cost even when the cost has exceeded the threshold. Optional ComputeFullInlineCost; /// Indicate whether we should allow inline deferral. Optional EnableDeferral = true; }; /// Generate the parameters to tune the inline cost analysis based only on the /// commandline options. InlineParams getInlineParams(); /// Generate the parameters to tune the inline cost analysis based on command /// line options. If -inline-threshold option is not explicitly passed, /// \p Threshold is used as the default threshold. InlineParams getInlineParams(int Threshold); /// Generate the parameters to tune the inline cost analysis based on command /// line options. If -inline-threshold option is not explicitly passed, /// the default threshold is computed from \p OptLevel and \p SizeOptLevel. /// An \p OptLevel value above 3 is considered an aggressive optimization mode. /// \p SizeOptLevel of 1 corresponds to the -Os flag and 2 corresponds to /// the -Oz flag. InlineParams getInlineParams(unsigned OptLevel, unsigned SizeOptLevel); /// Return the cost associated with a callsite, including parameter passing /// and the call/return instruction. int getCallsiteCost(CallBase &Call, const DataLayout &DL); /// Get an InlineCost object representing the cost of inlining this /// callsite. /// /// Note that a default threshold is passed into this function. This threshold /// could be modified based on callsite's properties and only costs below this /// new threshold are computed with any accuracy. The new threshold can be /// used to bound the computation necessary to determine whether the cost is /// sufficiently low to warrant inlining. /// /// Also note that calling this function *dynamically* computes the cost of /// inlining the callsite. It is an expensive, heavyweight call. InlineCost getInlineCost(CallBase &Call, const InlineParams &Params, TargetTransformInfo &CalleeTTI, function_ref GetAssumptionCache, function_ref GetTLI, function_ref GetBFI = nullptr, ProfileSummaryInfo *PSI = nullptr, OptimizationRemarkEmitter *ORE = nullptr); /// Get an InlineCost with the callee explicitly specified. /// This allows you to calculate the cost of inlining a function via a /// pointer. This behaves exactly as the version with no explicit callee /// parameter in all other respects. // InlineCost getInlineCost(CallBase &Call, Function *Callee, const InlineParams &Params, TargetTransformInfo &CalleeTTI, function_ref GetAssumptionCache, function_ref GetTLI, function_ref GetBFI = nullptr, ProfileSummaryInfo *PSI = nullptr, OptimizationRemarkEmitter *ORE = nullptr); /// Returns InlineResult::success() if the call site should be always inlined /// because of user directives, and the inlining is viable. Returns /// InlineResult::failure() if the inlining may never happen because of user /// directives or incompatibilities detectable without needing callee traversal. /// Otherwise returns None, meaning that inlining should be decided based on /// other criteria (e.g. cost modeling). Optional getAttributeBasedInliningDecision( CallBase &Call, Function *Callee, TargetTransformInfo &CalleeTTI, function_ref GetTLI); /// Get the cost estimate ignoring thresholds. This is similar to getInlineCost /// when passed InlineParams::ComputeFullInlineCost, or a non-null ORE. It /// uses default InlineParams otherwise. /// Contrary to getInlineCost, which makes a threshold-based final evaluation of /// should/shouldn't inline, captured in InlineResult, getInliningCostEstimate /// returns: /// - None, if the inlining cannot happen (is illegal) /// - an integer, representing the cost. Optional getInliningCostEstimate( CallBase &Call, TargetTransformInfo &CalleeTTI, function_ref GetAssumptionCache, function_ref GetBFI = nullptr, ProfileSummaryInfo *PSI = nullptr, OptimizationRemarkEmitter *ORE = nullptr); /// Minimal filter to detect invalid constructs for inlining. InlineResult isInlineViable(Function &Callee); // This pass is used to annotate instructions during the inline process for // debugging and analysis. The main purpose of the pass is to see and test // inliner's decisions when creating new optimizations to InlineCost. struct InlineCostAnnotationPrinterPass : PassInfoMixin { raw_ostream &OS; public: explicit InlineCostAnnotationPrinterPass(raw_ostream &OS) : OS(OS) {} PreservedAnalyses run(Function &F, FunctionAnalysisManager &FAM); }; } // namespace llvm #endif