mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-23 11:13:28 +01:00
9e1b62af44
This adds the following to the new PM based inliner in PGO mode: * Use block frequency analysis to derive callsite's profile count and use that to adjust thresholds of hot and cold callsites. * Incrementally update the BFI of the caller after a callee gets inlined into it. This incremental update is only within an invocation of the run method - BFI is not preserved across calls to run. Update the function entry count of the callee after inlining it into a caller. * I've tuned the thresholds for the hot and cold callsites using a hacked up version of the old inliner that explicitly computes BFI on a set of internal benchmarks and spec. Once the new PM based pipeline stabilizes (IIRC Chandler mentioned there are known issues) I'll benchmark this again and adjust the thresholds if required. Inliner PGO support. Differential revision: https://reviews.llvm.org/D28331 llvm-svn: 292666
198 lines
7.3 KiB
C++
198 lines
7.3 KiB
C++
//===- InlineCost.h - Cost analysis for inliner -----------------*- C++ -*-===//
//
// The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file implements heuristics for inlining decisions.
//
//===----------------------------------------------------------------------===//
|
|
|
|
#ifndef LLVM_ANALYSIS_INLINECOST_H
|
|
#define LLVM_ANALYSIS_INLINECOST_H
|
|
|
|
#include "llvm/Analysis/CallGraphSCCPass.h"
|
|
#include "llvm/Analysis/AssumptionCache.h"
|
|
#include <cassert>
|
|
#include <climits>
|
|
|
|
namespace llvm {
|
|
// Forward declarations of types that are defined elsewhere.
class AssumptionCacheTracker;
class BlockFrequencyInfo;
class CallSite;
class DataLayout;
class Function;
class ProfileSummaryInfo;
class TargetTransformInfo;
|
|
|
|
/// Named constants shared by the inline cost analysis.
namespace InlineConstants {
// Various thresholds used by inline cost analysis.

/// Use when optsize (-Os) is specified.
const int OptSizeThreshold = 50;

/// Use when minsize (-Oz) is specified.
const int OptMinSizeThreshold = 5;

/// Use when -O3 is specified.
const int OptAggressiveThreshold = 250;

// Various magic constants used to adjust heuristics.
const int InstrCost = 5;
const int IndirectCallThreshold = 100;
const int CallPenalty = 25;
const int LastCallToStaticBonus = 15000;
const int ColdccPenalty = 2000;
const int NoreturnPenalty = 10000;

/// Do not inline functions which allocate this many bytes on the stack
/// when the caller is recursive.
const unsigned TotalAllocaSizeRecursiveCaller = 1024;
} // end namespace InlineConstants
|
|
|
|
/// \brief Represents the cost of inlining a function.
///
/// This supports special values for functions which should "always" or
/// "never" be inlined. Otherwise, the cost represents a unitless amount;
/// smaller values increase the likelihood of the function being inlined.
///
/// Objects of this type also provide the adjusted threshold for inlining
/// based on the information available for a particular callsite. They can be
/// directly tested to determine if inlining should occur given the cost and
/// threshold for this cost metric.
///
/// Instances are created only through the static factories \c get,
/// \c getAlways and \c getNever; the constructor is private.
class InlineCost {
  /// Reserved cost values that encode the "always" and "never" decisions.
  /// \c get asserts that an ordinary cost never collides with either one.
  enum SentinelValues {
    AlwaysInlineCost = INT_MIN,
    NeverInlineCost = INT_MAX
  };

  /// \brief The estimated cost of inlining this callsite.
  const int Cost;

  /// \brief The adjusted threshold against which this cost was computed.
  const int Threshold;

  // Trivial constructor, interesting logic in the factory functions below.
  InlineCost(int Cost, int Threshold) : Cost(Cost), Threshold(Threshold) {}

public:
  /// \brief Build a variable (non-sentinel) cost.
  ///
  /// \p Cost must lie strictly between the two sentinel values; this is
  /// checked with assertions.
  static InlineCost get(int Cost, int Threshold) {
    assert(Cost > AlwaysInlineCost && "Cost crosses sentinel value");
    assert(Cost < NeverInlineCost && "Cost crosses sentinel value");
    return InlineCost(Cost, Threshold);
  }

  /// \brief Build the "always inline" value. It is stored as the lowest
  /// possible cost with a threshold of 0, so it converts to \c true.
  static InlineCost getAlways() {
    return InlineCost(AlwaysInlineCost, 0);
  }

  /// \brief Build the "never inline" value. It is stored as the highest
  /// possible cost with a threshold of 0, so it converts to \c false.
  static InlineCost getNever() {
    return InlineCost(NeverInlineCost, 0);
  }

  /// \brief Test whether the inline cost is low enough for inlining.
  ///
  /// True exactly when the cost is strictly below the threshold.
  explicit operator bool() const {
    return Cost < Threshold;
  }

  bool isAlways() const { return Cost == AlwaysInlineCost; }
  bool isNever() const { return Cost == NeverInlineCost; }
  bool isVariable() const { return !isAlways() && !isNever(); }

  /// \brief Get the inline cost estimate.
  /// It is an error to call this on an "always" or "never" InlineCost.
  int getCost() const {
    assert(isVariable() && "Invalid access of InlineCost");
    return Cost;
  }

  /// \brief Get the cost delta from the threshold for inlining.
  /// Only valid if the cost is of the variable kind. Returns a negative
  /// value if the cost is too high to inline.
  int getCostDelta() const { return Threshold - getCost(); }
};
|
|
|
|
/// Thresholds to tune inline cost analysis. The inline cost analysis decides
|
|
/// the condition to apply a threshold and applies it. Otherwise,
|
|
/// DefaultThreshold is used. If a threshold is Optional, it is applied only
|
|
/// when it has a valid value. Typically, users of inline cost analysis
|
|
/// obtain an InlineParams object through one of the \c getInlineParams methods
|
|
/// and pass it to \c getInlineCost. Some specialized versions of inliner
|
|
/// (such as the pre-inliner) might have custom logic to compute \c InlineParams
|
|
/// object.
|
|
|
|
struct InlineParams {
|
|
/// The default threshold to start with for a callee.
|
|
int DefaultThreshold;
|
|
|
|
/// Threshold to use for callees with inline hint.
|
|
Optional<int> HintThreshold;
|
|
|
|
/// Threshold to use for cold callees.
|
|
Optional<int> ColdThreshold;
|
|
|
|
/// Threshold to use when the caller is optimized for size.
|
|
Optional<int> OptSizeThreshold;
|
|
|
|
/// Threshold to use when the caller is optimized for minsize.
|
|
Optional<int> OptMinSizeThreshold;
|
|
|
|
/// Threshold to use when the callsite is considered hot.
|
|
Optional<int> HotCallSiteThreshold;
|
|
|
|
/// Threshold to use when the callsite is considered cold.
|
|
Optional<int> ColdCallSiteThreshold;
|
|
};
|
|
|
|
/// Generate the parameters to tune the inline cost analysis based only on the
|
|
/// commandline options.
|
|
InlineParams getInlineParams();
|
|
|
|
/// Generate the parameters to tune the inline cost analysis based on command
|
|
/// line options. If -inline-threshold option is not explicitly passed,
|
|
/// \p Threshold is used as the default threshold.
|
|
InlineParams getInlineParams(int Threshold);
|
|
|
|
/// Generate the parameters to tune the inline cost analysis based on command
|
|
/// line options. If -inline-threshold option is not explicitly passed,
|
|
/// the default threshold is computed from \p OptLevel and \p SizeOptLevel.
|
|
/// An \p OptLevel value above 3 is considered an aggressive optimization mode.
|
|
/// \p SizeOptLevel of 1 corresponds to the the -Os flag and 2 corresponds to
|
|
/// the -Oz flag.
|
|
InlineParams getInlineParams(unsigned OptLevel, unsigned SizeOptLevel);
|
|
|
|
/// \brief Get an InlineCost object representing the cost of inlining this
|
|
/// callsite.
|
|
///
|
|
/// Note that a default threshold is passed into this function. This threshold
|
|
/// could be modified based on callsite's properties and only costs below this
|
|
/// new threshold are computed with any accuracy. The new threshold can be
|
|
/// used to bound the computation necessary to determine whether the cost is
|
|
/// sufficiently low to warrant inlining.
|
|
///
|
|
/// Also note that calling this function *dynamically* computes the cost of
|
|
/// inlining the callsite. It is an expensive, heavyweight call.
|
|
InlineCost
|
|
getInlineCost(CallSite CS, const InlineParams &Params,
|
|
TargetTransformInfo &CalleeTTI,
|
|
std::function<AssumptionCache &(Function &)> &GetAssumptionCache,
|
|
Optional<function_ref<BlockFrequencyInfo &(Function &)>> GetBFI,
|
|
ProfileSummaryInfo *PSI);
|
|
|
|
/// \brief Get an InlineCost with the callee explicitly specified.
|
|
/// This allows you to calculate the cost of inlining a function via a
|
|
/// pointer. This behaves exactly as the version with no explicit callee
|
|
/// parameter in all other respects.
|
|
//
|
|
InlineCost
|
|
getInlineCost(CallSite CS, Function *Callee, const InlineParams &Params,
|
|
TargetTransformInfo &CalleeTTI,
|
|
std::function<AssumptionCache &(Function &)> &GetAssumptionCache,
|
|
Optional<function_ref<BlockFrequencyInfo &(Function &)>> GetBFI,
|
|
ProfileSummaryInfo *PSI);
|
|
|
|
/// \brief Minimal filter to detect invalid constructs for inlining.
|
|
bool isInlineViable(Function &Callee);
|
|
}
|
|
|
|
#endif
|