mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-22 18:54:02 +01:00
[PGO] Exit early if all count values are zero
If all the edge counts for a function are zero, skip count population and annotation, as nothing will happen. This can save some compile time. Differential Revision: https://reviews.llvm.org/D54212 llvm-svn: 346370
This commit is contained in:
parent
7431c3adad
commit
7948668802
@ -859,7 +859,7 @@ public:
|
||||
FreqAttr(FFA_Normal) {}
|
||||
|
||||
// Read counts for the instrumented BB from profile.
|
||||
bool readCounters(IndexedInstrProfReader *PGOReader);
|
||||
bool readCounters(IndexedInstrProfReader *PGOReader, bool &AllZeros);
|
||||
|
||||
// Populate the counts for all BBs.
|
||||
void populateCounters();
|
||||
@ -904,6 +904,7 @@ public:
|
||||
FuncInfo.dumpInfo(Str);
|
||||
}
|
||||
|
||||
uint64_t getProgramMaxCount() const { return ProgramMaxCount; }
|
||||
private:
|
||||
Function &F;
|
||||
Module *M;
|
||||
@ -1013,7 +1014,7 @@ void PGOUseFunc::setEdgeCount(DirectEdges &Edges, uint64_t Value) {
|
||||
// Read the profile from ProfileFileName and assign the value to the
|
||||
// instrumented BB and the edges. This function also updates ProgramMaxCount.
|
||||
// Return true if the profile are successfully read, and false on errors.
|
||||
bool PGOUseFunc::readCounters(IndexedInstrProfReader *PGOReader) {
|
||||
bool PGOUseFunc::readCounters(IndexedInstrProfReader *PGOReader, bool &AllZeros) {
|
||||
auto &Ctx = M->getContext();
|
||||
Expected<InstrProfRecord> Result =
|
||||
PGOReader->getInstrProfRecord(FuncInfo.FuncName, FuncInfo.FunctionHash);
|
||||
@ -1053,6 +1054,7 @@ bool PGOUseFunc::readCounters(IndexedInstrProfReader *PGOReader) {
|
||||
LLVM_DEBUG(dbgs() << " " << I << ": " << CountFromProfile[I] << "\n");
|
||||
ValueSum += CountFromProfile[I];
|
||||
}
|
||||
AllZeros = (ValueSum == 0);
|
||||
|
||||
LLVM_DEBUG(dbgs() << "SUM = " << ValueSum << "\n");
|
||||
|
||||
@ -1477,8 +1479,15 @@ static bool annotateAllFunctions(
|
||||
// later in getInstrBB() to avoid invalidating it.
|
||||
SplitIndirectBrCriticalEdges(F, BPI, BFI);
|
||||
PGOUseFunc Func(F, &M, ComdatMembers, BPI, BFI);
|
||||
if (!Func.readCounters(PGOReader.get()))
|
||||
bool AllZeros = false;
|
||||
if (!Func.readCounters(PGOReader.get(), AllZeros))
|
||||
continue;
|
||||
if (AllZeros) {
|
||||
F.setEntryCount(ProfileCount(0, Function::PCT_Real));
|
||||
if (Func.getProgramMaxCount() != 0)
|
||||
ColdFunctions.push_back(&F);
|
||||
continue;
|
||||
}
|
||||
Func.populateCounters();
|
||||
Func.setBranchWeights();
|
||||
Func.annotateValueSites();
|
||||
|
17
test/Transforms/PGOProfile/Inputs/func_entry.proftext
Normal file
17
test/Transforms/PGOProfile/Inputs/func_entry.proftext
Normal file
@ -0,0 +1,17 @@
|
||||
# IR level Instrumentation Flag
|
||||
:ir
|
||||
foo
|
||||
# Func Hash:
|
||||
12884901887
|
||||
# Num Counters:
|
||||
1
|
||||
# Counter Values:
|
||||
9999
|
||||
|
||||
bar
|
||||
# Func Hash:
|
||||
12884901887
|
||||
# Num Counters:
|
||||
1
|
||||
# Counter Values:
|
||||
0
|
29
test/Transforms/PGOProfile/func_entry.ll
Normal file
29
test/Transforms/PGOProfile/func_entry.ll
Normal file
@ -0,0 +1,29 @@
|
||||
; RUN: llvm-profdata merge %S/Inputs/func_entry.proftext -o %t.profdata
|
||||
; RUN: opt < %s -passes=pgo-instr-use -pgo-test-profile-file=%t.profdata -S | FileCheck %s
|
||||
|
||||
target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
|
||||
target triple = "x86_64-unknown-linux-gnu"
|
||||
|
||||
@s = common dso_local local_unnamed_addr global i32 0, align 4
|
||||
|
||||
define void @bar() {
|
||||
; CHECK-LABEL: @bar
|
||||
; CHECK-SAME: !prof ![[FUNC_ENTRY_COUNT_ZERO:[0-9]+]]
|
||||
|
||||
entry:
|
||||
store i32 1, i32* @s, align 4
|
||||
ret void
|
||||
}
|
||||
|
||||
define void @foo() {
|
||||
; CHECK-LABEL: @foo
|
||||
; CHECK-SAME: !prof ![[FUNC_ENTRY_COUNT_NON_ZERO:[0-9]+]]
|
||||
entry:
|
||||
%0 = load i32, i32* @s, align 4
|
||||
%add = add nsw i32 %0, 4
|
||||
store i32 %add, i32* @s, align 4
|
||||
ret void
|
||||
}
|
||||
|
||||
; CHECK-DAG: ![[FUNC_ENTRY_COUNT_ZERO]] = !{!"function_entry_count", i64 0}
|
||||
; CHECK-DAG: ![[FUNC_ENTRY_COUNT_NON_ZERO]] = !{!"function_entry_count", i64 9999}
|
Loading…
Reference in New Issue
Block a user