mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-22 02:33:06 +01:00
022ca8be28
We create flag variable "__llvm_fs_discriminator__" in the binary to indicate that FSAFDO hierarchical discriminators are used. This variable might be GC'ed by the linker since it is not explicitly reference. I initially added the var to the use list in pass MIRFSDiscriminator but it did not work. It turned out the used global list is collected in lowering (before MIR pass) and then emitted in the end of pass pipeline. Here I add the variable to the use list in IR level's AddDiscriminators pass. The machine level code is still keep in the case IR's AddDiscriminators is not invoked. If this is the case, this just use -Wl,--export-dynamic-symbol=__llvm_fs_discriminator__ to force the emit. Differential Revision: https://reviews.llvm.org/D103988
178 lines
7.3 KiB
C++
178 lines
7.3 KiB
C++
//===- SampleProfileLoaderBaseUtil.cpp - Profile loader Util func ---------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file implements the SampleProfileLoader base utility functions.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "llvm/Transforms/Utils/SampleProfileLoaderBaseUtil.h"
|
|
|
|
namespace llvm {
|
|
|
|
cl::opt<unsigned> SampleProfileMaxPropagateIterations(
|
|
"sample-profile-max-propagate-iterations", cl::init(100),
|
|
cl::desc("Maximum number of iterations to go through when propagating "
|
|
"sample block/edge weights through the CFG."));
|
|
|
|
cl::opt<unsigned> SampleProfileRecordCoverage(
|
|
"sample-profile-check-record-coverage", cl::init(0), cl::value_desc("N"),
|
|
cl::desc("Emit a warning if less than N% of records in the input profile "
|
|
"are matched to the IR."));
|
|
|
|
cl::opt<unsigned> SampleProfileSampleCoverage(
|
|
"sample-profile-check-sample-coverage", cl::init(0), cl::value_desc("N"),
|
|
cl::desc("Emit a warning if less than N% of samples in the input profile "
|
|
"are matched to the IR."));
|
|
|
|
cl::opt<bool> NoWarnSampleUnused(
|
|
"no-warn-sample-unused", cl::init(false), cl::Hidden,
|
|
cl::desc("Use this option to turn off/on warnings about function with "
|
|
"samples but without debug information to use those samples. "));
|
|
|
|
namespace sampleprofutil {
|
|
|
|
/// Return true if the given callsite is hot wrt to hot cutoff threshold.
|
|
///
|
|
/// Functions that were inlined in the original binary will be represented
|
|
/// in the inline stack in the sample profile. If the profile shows that
|
|
/// the original inline decision was "good" (i.e., the callsite is executed
|
|
/// frequently), then we will recreate the inline decision and apply the
|
|
/// profile from the inlined callsite.
|
|
///
|
|
/// To decide whether an inlined callsite is hot, we compare the callsite
|
|
/// sample count with the hot cutoff computed by ProfileSummaryInfo, it is
|
|
/// regarded as hot if the count is above the cutoff value.
|
|
///
|
|
/// When ProfileAccurateForSymsInList is enabled and profile symbol list
|
|
/// is present, functions in the profile symbol list but without profile will
|
|
/// be regarded as cold and much less inlining will happen in CGSCC inlining
|
|
/// pass, so we tend to lower the hot criteria here to allow more early
|
|
/// inlining to happen for warm callsites and it is helpful for performance.
|
|
bool callsiteIsHot(const FunctionSamples *CallsiteFS, ProfileSummaryInfo *PSI,
|
|
bool ProfAccForSymsInList) {
|
|
if (!CallsiteFS)
|
|
return false; // The callsite was not inlined in the original binary.
|
|
|
|
assert(PSI && "PSI is expected to be non null");
|
|
uint64_t CallsiteTotalSamples = CallsiteFS->getTotalSamples();
|
|
if (ProfAccForSymsInList)
|
|
return !PSI->isColdCount(CallsiteTotalSamples);
|
|
else
|
|
return PSI->isHotCount(CallsiteTotalSamples);
|
|
}
|
|
|
|
/// Mark as used the sample record for the given function samples at
|
|
/// (LineOffset, Discriminator).
|
|
///
|
|
/// \returns true if this is the first time we mark the given record.
|
|
bool SampleCoverageTracker::markSamplesUsed(const FunctionSamples *FS,
|
|
uint32_t LineOffset,
|
|
uint32_t Discriminator,
|
|
uint64_t Samples) {
|
|
LineLocation Loc(LineOffset, Discriminator);
|
|
unsigned &Count = SampleCoverage[FS][Loc];
|
|
bool FirstTime = (++Count == 1);
|
|
if (FirstTime)
|
|
TotalUsedSamples += Samples;
|
|
return FirstTime;
|
|
}
|
|
|
|
/// Return the number of sample records that were applied from this profile.
|
|
///
|
|
/// This count does not include records from cold inlined callsites.
|
|
unsigned
|
|
SampleCoverageTracker::countUsedRecords(const FunctionSamples *FS,
|
|
ProfileSummaryInfo *PSI) const {
|
|
auto I = SampleCoverage.find(FS);
|
|
|
|
// The size of the coverage map for FS represents the number of records
|
|
// that were marked used at least once.
|
|
unsigned Count = (I != SampleCoverage.end()) ? I->second.size() : 0;
|
|
|
|
// If there are inlined callsites in this function, count the samples found
|
|
// in the respective bodies. However, do not bother counting callees with 0
|
|
// total samples, these are callees that were never invoked at runtime.
|
|
for (const auto &I : FS->getCallsiteSamples())
|
|
for (const auto &J : I.second) {
|
|
const FunctionSamples *CalleeSamples = &J.second;
|
|
if (callsiteIsHot(CalleeSamples, PSI, ProfAccForSymsInList))
|
|
Count += countUsedRecords(CalleeSamples, PSI);
|
|
}
|
|
|
|
return Count;
|
|
}
|
|
|
|
/// Return the number of sample records in the body of this profile.
|
|
///
|
|
/// This count does not include records from cold inlined callsites.
|
|
unsigned
|
|
SampleCoverageTracker::countBodyRecords(const FunctionSamples *FS,
|
|
ProfileSummaryInfo *PSI) const {
|
|
unsigned Count = FS->getBodySamples().size();
|
|
|
|
// Only count records in hot callsites.
|
|
for (const auto &I : FS->getCallsiteSamples())
|
|
for (const auto &J : I.second) {
|
|
const FunctionSamples *CalleeSamples = &J.second;
|
|
if (callsiteIsHot(CalleeSamples, PSI, ProfAccForSymsInList))
|
|
Count += countBodyRecords(CalleeSamples, PSI);
|
|
}
|
|
|
|
return Count;
|
|
}
|
|
|
|
/// Return the number of samples collected in the body of this profile.
|
|
///
|
|
/// This count does not include samples from cold inlined callsites.
|
|
uint64_t
|
|
SampleCoverageTracker::countBodySamples(const FunctionSamples *FS,
|
|
ProfileSummaryInfo *PSI) const {
|
|
uint64_t Total = 0;
|
|
for (const auto &I : FS->getBodySamples())
|
|
Total += I.second.getSamples();
|
|
|
|
// Only count samples in hot callsites.
|
|
for (const auto &I : FS->getCallsiteSamples())
|
|
for (const auto &J : I.second) {
|
|
const FunctionSamples *CalleeSamples = &J.second;
|
|
if (callsiteIsHot(CalleeSamples, PSI, ProfAccForSymsInList))
|
|
Total += countBodySamples(CalleeSamples, PSI);
|
|
}
|
|
|
|
return Total;
|
|
}
|
|
|
|
/// Return the fraction of sample records used in this profile.
|
|
///
|
|
/// The returned value is an unsigned integer in the range 0-100 indicating
|
|
/// the percentage of sample records that were used while applying this
|
|
/// profile to the associated function.
|
|
unsigned SampleCoverageTracker::computeCoverage(unsigned Used,
|
|
unsigned Total) const {
|
|
assert(Used <= Total &&
|
|
"number of used records cannot exceed the total number of records");
|
|
return Total > 0 ? Used * 100 / Total : 100;
|
|
}
|
|
|
|
/// Create a global variable to flag FSDiscriminators are used.
|
|
void createFSDiscriminatorVariable(Module *M) {
|
|
const char *FSDiscriminatorVar = "__llvm_fs_discriminator__";
|
|
if (M->getGlobalVariable(FSDiscriminatorVar))
|
|
return;
|
|
|
|
auto &Context = M->getContext();
|
|
// Place this variable to llvm.used so it won't be GC'ed.
|
|
appendToUsed(*M, {new GlobalVariable(*M, Type::getInt1Ty(Context), true,
|
|
GlobalValue::WeakODRLinkage,
|
|
ConstantInt::getTrue(Context),
|
|
FSDiscriminatorVar)});
|
|
}
|
|
|
|
} // end of namespace sampleprofutil
|
|
} // end of namespace llvm
|