mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-23 11:13:28 +01:00
fe4a3fd086
Otherwise, the Win64 unwinder considers direct branches to such empty trailing BBs to be a branch out of the function. It treats such a branch as a tail call, which can only be part of an epilogue. If the unwinder misclassifies such a branch as part of the epilogue, it will fail to unwind the stack further. This can lead to bad stack traces, or failure to handle exceptions properly. This is described in https://llvm.org/PR45064#c4, and by the comment at the top of the X86AvoidTrailingCallPass.cpp file. It should be safe to insert int3 for such blocks. An empty trailing BB that reaches this pass is pretty much guaranteed to be unreachable. If a program executed such a block, it would fall off the end of the function. Most of the complexity in this patch comes from threading through the "EHFuncletEntry" boolean on the MIRParser and registering the pass so we can stop and start codegen around it. I used an MIR test because we should teach LLVM to optimize away these branches as a follow-up. Reviewed By: hans Differential Revision: https://reviews.llvm.org/D76531
136 lines
4.9 KiB
C++
136 lines
4.9 KiB
C++
//===----- X86AvoidTrailingCall.cpp - Insert int3 after trailing calls ----===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// The Windows x64 unwinder decodes the instruction stream during unwinding.
|
|
// The unwinder decodes forward from the current PC to detect epilogue code
|
|
// patterns.
|
|
//
|
|
// First, this means that there must be an instruction after every
|
|
// call instruction for the unwinder to decode. LLVM must maintain the invariant
|
|
// that the last instruction of a function or funclet is not a call, or the
|
|
// unwinder may decode into the next function. Similarly, a call may not
|
|
// immediately precede an epilogue code pattern. As of this writing, the
|
|
// SEH_Epilogue pseudo instruction takes care of that.
|
|
//
|
|
// Second, all non-tail call jump targets must be within the *half-open*
|
|
// interval of the bounds of the function. The unwinder distinguishes between
|
|
// internal jump instructions and tail calls in an epilogue sequence by checking
|
|
// the jump target against the function bounds from the .pdata section. This
|
|
// means that the last regular MBB of an LLVM function must not be empty if
|
|
// there are regular jumps targeting it.
|
|
//
|
|
// This pass upholds these invariants by ensuring that blocks at the end of a
|
|
// function or funclet are a) not empty and b) do not end in a CALL instruction.
|
|
//
|
|
// Unwinder implementation for reference:
|
|
// https://github.com/dotnet/coreclr/blob/a9f3fc16483eecfc47fb79c362811d870be02249/src/unwinder/amd64/unwinder_amd64.cpp#L1015
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "X86.h"
|
|
#include "X86InstrInfo.h"
|
|
#include "X86Subtarget.h"
|
|
#include "llvm/CodeGen/MachineInstrBuilder.h"
|
|
|
|
#define AVOIDCALL_DESC "X86 avoid trailing call pass"
|
|
#define AVOIDCALL_NAME "x86-avoid-trailing-call"
|
|
|
|
#define DEBUG_TYPE AVOIDCALL_NAME
|
|
|
|
using namespace llvm;
|
|
|
|
namespace {
|
|
class X86AvoidTrailingCallPass : public MachineFunctionPass {
|
|
public:
|
|
X86AvoidTrailingCallPass() : MachineFunctionPass(ID) {}
|
|
|
|
bool runOnMachineFunction(MachineFunction &MF) override;
|
|
|
|
static char ID;
|
|
|
|
private:
|
|
StringRef getPassName() const override { return AVOIDCALL_DESC; }
|
|
};
|
|
} // end anonymous namespace
|
|
|
|
char X86AvoidTrailingCallPass::ID = 0;
|
|
|
|
FunctionPass *llvm::createX86AvoidTrailingCallPass() {
|
|
return new X86AvoidTrailingCallPass();
|
|
}
|
|
|
|
INITIALIZE_PASS(X86AvoidTrailingCallPass, AVOIDCALL_NAME, AVOIDCALL_DESC, false, false)
|
|
|
|
// A real instruction is a non-meta, non-pseudo instruction. Some pseudos
|
|
// expand to nothing, and some expand to code. This logic conservatively assumes
|
|
// they might expand to nothing.
|
|
static bool isRealInstruction(MachineInstr &MI) {
|
|
return !MI.isPseudo() && !MI.isMetaInstruction();
|
|
}
|
|
|
|
// Return true if this is a call instruction, but not a tail call.
|
|
static bool isCallInstruction(const MachineInstr &MI) {
|
|
return MI.isCall() && !MI.isReturn();
|
|
}
|
|
|
|
bool X86AvoidTrailingCallPass::runOnMachineFunction(MachineFunction &MF) {
|
|
const X86Subtarget &STI = MF.getSubtarget<X86Subtarget>();
|
|
const X86InstrInfo &TII = *STI.getInstrInfo();
|
|
assert(STI.isTargetWin64() && "pass only runs on Win64");
|
|
|
|
// We don't need to worry about any of the invariants described above if there
|
|
// is no unwind info (CFI).
|
|
if (!MF.hasWinCFI())
|
|
return false;
|
|
|
|
// FIXME: Perhaps this pass should also replace SEH_Epilogue by inserting nops
|
|
// before epilogues.
|
|
|
|
bool Changed = false;
|
|
for (MachineBasicBlock &MBB : MF) {
|
|
// Look for basic blocks that precede funclet entries or are at the end of
|
|
// the function.
|
|
MachineBasicBlock *NextMBB = MBB.getNextNode();
|
|
if (NextMBB && !NextMBB->isEHFuncletEntry())
|
|
continue;
|
|
|
|
// Find the last real instruction in this block.
|
|
auto LastRealInstr = llvm::find_if(reverse(MBB), isRealInstruction);
|
|
|
|
// If the block is empty or the last real instruction is a call instruction,
|
|
// insert an int3. If there is a call instruction, insert the int3 between
|
|
// the call and any labels or other meta instructions. If the block is
|
|
// empty, insert at block end.
|
|
bool IsEmpty = LastRealInstr == MBB.rend();
|
|
bool IsCall = !IsEmpty && isCallInstruction(*LastRealInstr);
|
|
if (IsEmpty || IsCall) {
|
|
LLVM_DEBUG({
|
|
if (IsCall) {
|
|
dbgs() << "inserting int3 after trailing call instruction:\n";
|
|
LastRealInstr->dump();
|
|
dbgs() << '\n';
|
|
} else {
|
|
dbgs() << "inserting int3 in trailing empty MBB:\n";
|
|
MBB.dump();
|
|
}
|
|
});
|
|
|
|
MachineBasicBlock::iterator MBBI = MBB.end();
|
|
DebugLoc DL;
|
|
if (IsCall) {
|
|
MBBI = std::next(LastRealInstr.getReverse());
|
|
DL = LastRealInstr->getDebugLoc();
|
|
}
|
|
BuildMI(MBB, MBBI, DL, TII.get(X86::INT3));
|
|
Changed = true;
|
|
}
|
|
}
|
|
|
|
return Changed;
|
|
}
|