mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-25 12:12:47 +01:00
0f2b9d9dc4
llvm-svn: 123399
387 lines
14 KiB
C++
387 lines
14 KiB
C++
//=====- SystemZFrameLowering.cpp - SystemZ Frame Information ------*- C++ -*-====//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file contains the SystemZ implementation of TargetFrameLowering class.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "SystemZFrameLowering.h"
|
|
#include "SystemZInstrBuilder.h"
|
|
#include "SystemZInstrInfo.h"
|
|
#include "SystemZMachineFunctionInfo.h"
|
|
#include "llvm/Function.h"
|
|
#include "llvm/CodeGen/MachineFrameInfo.h"
|
|
#include "llvm/CodeGen/MachineFunction.h"
|
|
#include "llvm/CodeGen/MachineInstrBuilder.h"
|
|
#include "llvm/CodeGen/MachineModuleInfo.h"
|
|
#include "llvm/CodeGen/MachineRegisterInfo.h"
|
|
#include "llvm/Target/TargetData.h"
|
|
#include "llvm/Target/TargetOptions.h"
|
|
#include "llvm/Support/CommandLine.h"
|
|
|
|
using namespace llvm;
|
|
|
|
SystemZFrameLowering::SystemZFrameLowering(const SystemZSubtarget &sti)
|
|
: TargetFrameLowering(TargetFrameLowering::StackGrowsDown, 8, -160), STI(sti) {
|
|
// Fill the spill offsets map
|
|
static const unsigned SpillOffsTab[][2] = {
|
|
{ SystemZ::R2D, 0x10 },
|
|
{ SystemZ::R3D, 0x18 },
|
|
{ SystemZ::R4D, 0x20 },
|
|
{ SystemZ::R5D, 0x28 },
|
|
{ SystemZ::R6D, 0x30 },
|
|
{ SystemZ::R7D, 0x38 },
|
|
{ SystemZ::R8D, 0x40 },
|
|
{ SystemZ::R9D, 0x48 },
|
|
{ SystemZ::R10D, 0x50 },
|
|
{ SystemZ::R11D, 0x58 },
|
|
{ SystemZ::R12D, 0x60 },
|
|
{ SystemZ::R13D, 0x68 },
|
|
{ SystemZ::R14D, 0x70 },
|
|
{ SystemZ::R15D, 0x78 }
|
|
};
|
|
|
|
RegSpillOffsets.grow(SystemZ::NUM_TARGET_REGS);
|
|
|
|
for (unsigned i = 0, e = array_lengthof(SpillOffsTab); i != e; ++i)
|
|
RegSpillOffsets[SpillOffsTab[i][0]] = SpillOffsTab[i][1];
|
|
}
|
|
|
|
/// needsFP - Return true if the specified function should have a dedicated
|
|
/// frame pointer register. This is true if the function has variable sized
|
|
/// allocas or if frame pointer elimination is disabled.
|
|
bool SystemZFrameLowering::hasFP(const MachineFunction &MF) const {
|
|
const MachineFrameInfo *MFI = MF.getFrameInfo();
|
|
return DisableFramePointerElim(MF) || MFI->hasVarSizedObjects();
|
|
}
|
|
|
|
/// emitSPUpdate - Emit a series of instructions to increment / decrement the
|
|
/// stack pointer by a constant value.
|
|
static
|
|
void emitSPUpdate(MachineBasicBlock &MBB, MachineBasicBlock::iterator &MBBI,
|
|
int64_t NumBytes, const TargetInstrInfo &TII) {
|
|
unsigned Opc; uint64_t Chunk;
|
|
bool isSub = NumBytes < 0;
|
|
uint64_t Offset = isSub ? -NumBytes : NumBytes;
|
|
|
|
if (Offset >= (1LL << 15) - 1) {
|
|
Opc = SystemZ::ADD64ri32;
|
|
Chunk = (1LL << 31) - 1;
|
|
} else {
|
|
Opc = SystemZ::ADD64ri16;
|
|
Chunk = (1LL << 15) - 1;
|
|
}
|
|
|
|
DebugLoc DL = MBBI != MBB.end() ? MBBI->getDebugLoc() : DebugLoc();
|
|
|
|
while (Offset) {
|
|
uint64_t ThisVal = (Offset > Chunk) ? Chunk : Offset;
|
|
MachineInstr *MI =
|
|
BuildMI(MBB, MBBI, DL, TII.get(Opc), SystemZ::R15D)
|
|
.addReg(SystemZ::R15D).addImm(isSub ? -ThisVal : ThisVal);
|
|
// The PSW implicit def is dead.
|
|
MI->getOperand(3).setIsDead();
|
|
Offset -= ThisVal;
|
|
}
|
|
}
|
|
|
|
void SystemZFrameLowering::emitPrologue(MachineFunction &MF) const {
|
|
MachineBasicBlock &MBB = MF.front(); // Prolog goes in entry BB
|
|
MachineFrameInfo *MFI = MF.getFrameInfo();
|
|
const SystemZInstrInfo &TII =
|
|
*static_cast<const SystemZInstrInfo*>(MF.getTarget().getInstrInfo());
|
|
SystemZMachineFunctionInfo *SystemZMFI =
|
|
MF.getInfo<SystemZMachineFunctionInfo>();
|
|
MachineBasicBlock::iterator MBBI = MBB.begin();
|
|
DebugLoc DL = MBBI != MBB.end() ? MBBI->getDebugLoc() : DebugLoc();
|
|
|
|
// Get the number of bytes to allocate from the FrameInfo.
|
|
// Note that area for callee-saved stuff is already allocated, thus we need to
|
|
// 'undo' the stack movement.
|
|
uint64_t StackSize = MFI->getStackSize();
|
|
StackSize -= SystemZMFI->getCalleeSavedFrameSize();
|
|
|
|
uint64_t NumBytes = StackSize - getOffsetOfLocalArea();
|
|
|
|
// Skip the callee-saved push instructions.
|
|
while (MBBI != MBB.end() &&
|
|
(MBBI->getOpcode() == SystemZ::MOV64mr ||
|
|
MBBI->getOpcode() == SystemZ::MOV64mrm))
|
|
++MBBI;
|
|
|
|
if (MBBI != MBB.end())
|
|
DL = MBBI->getDebugLoc();
|
|
|
|
// adjust stack pointer: R15 -= numbytes
|
|
if (StackSize || MFI->hasCalls()) {
|
|
assert(MF.getRegInfo().isPhysRegUsed(SystemZ::R15D) &&
|
|
"Invalid stack frame calculation!");
|
|
emitSPUpdate(MBB, MBBI, -(int64_t)NumBytes, TII);
|
|
}
|
|
|
|
if (hasFP(MF)) {
|
|
// Update R11 with the new base value...
|
|
BuildMI(MBB, MBBI, DL, TII.get(SystemZ::MOV64rr), SystemZ::R11D)
|
|
.addReg(SystemZ::R15D);
|
|
|
|
// Mark the FramePtr as live-in in every block except the entry.
|
|
for (MachineFunction::iterator I = llvm::next(MF.begin()), E = MF.end();
|
|
I != E; ++I)
|
|
I->addLiveIn(SystemZ::R11D);
|
|
|
|
}
|
|
}
|
|
|
|
void SystemZFrameLowering::emitEpilogue(MachineFunction &MF,
|
|
MachineBasicBlock &MBB) const {
|
|
const MachineFrameInfo *MFI = MF.getFrameInfo();
|
|
MachineBasicBlock::iterator MBBI = MBB.getLastNonDebugInstr();
|
|
const SystemZInstrInfo &TII =
|
|
*static_cast<const SystemZInstrInfo*>(MF.getTarget().getInstrInfo());
|
|
SystemZMachineFunctionInfo *SystemZMFI =
|
|
MF.getInfo<SystemZMachineFunctionInfo>();
|
|
unsigned RetOpcode = MBBI->getOpcode();
|
|
|
|
switch (RetOpcode) {
|
|
case SystemZ::RET: break; // These are ok
|
|
default:
|
|
assert(0 && "Can only insert epilog into returning blocks");
|
|
}
|
|
|
|
// Get the number of bytes to allocate from the FrameInfo
|
|
// Note that area for callee-saved stuff is already allocated, thus we need to
|
|
// 'undo' the stack movement.
|
|
uint64_t StackSize =
|
|
MFI->getStackSize() - SystemZMFI->getCalleeSavedFrameSize();
|
|
uint64_t NumBytes = StackSize - getOffsetOfLocalArea();
|
|
|
|
// Skip the final terminator instruction.
|
|
while (MBBI != MBB.begin()) {
|
|
MachineBasicBlock::iterator PI = prior(MBBI);
|
|
--MBBI;
|
|
if (!PI->getDesc().isTerminator())
|
|
break;
|
|
}
|
|
|
|
// During callee-saved restores emission stack frame was not yet finialized
|
|
// (and thus - the stack size was unknown). Tune the offset having full stack
|
|
// size in hands.
|
|
if (StackSize || MFI->hasCalls()) {
|
|
assert((MBBI->getOpcode() == SystemZ::MOV64rmm ||
|
|
MBBI->getOpcode() == SystemZ::MOV64rm) &&
|
|
"Expected to see callee-save register restore code");
|
|
assert(MF.getRegInfo().isPhysRegUsed(SystemZ::R15D) &&
|
|
"Invalid stack frame calculation!");
|
|
|
|
unsigned i = 0;
|
|
MachineInstr &MI = *MBBI;
|
|
while (!MI.getOperand(i).isImm()) {
|
|
++i;
|
|
assert(i < MI.getNumOperands() && "Unexpected restore code!");
|
|
}
|
|
|
|
uint64_t Offset = NumBytes + MI.getOperand(i).getImm();
|
|
// If Offset does not fit into 20-bit signed displacement field we need to
|
|
// emit some additional code...
|
|
if (Offset > 524287) {
|
|
// Fold the displacement into load instruction as much as possible.
|
|
NumBytes = Offset - 524287;
|
|
Offset = 524287;
|
|
emitSPUpdate(MBB, MBBI, NumBytes, TII);
|
|
}
|
|
|
|
MI.getOperand(i).ChangeToImmediate(Offset);
|
|
}
|
|
}
|
|
|
|
int SystemZFrameLowering::getFrameIndexOffset(const MachineFunction &MF,
|
|
int FI) const {
|
|
const MachineFrameInfo *MFI = MF.getFrameInfo();
|
|
const SystemZMachineFunctionInfo *SystemZMFI =
|
|
MF.getInfo<SystemZMachineFunctionInfo>();
|
|
int Offset = MFI->getObjectOffset(FI) + MFI->getOffsetAdjustment();
|
|
uint64_t StackSize = MFI->getStackSize();
|
|
|
|
// Fixed objects are really located in the "previous" frame.
|
|
if (FI < 0)
|
|
StackSize -= SystemZMFI->getCalleeSavedFrameSize();
|
|
|
|
Offset += StackSize - getOffsetOfLocalArea();
|
|
|
|
// Skip the register save area if we generated the stack frame.
|
|
if (StackSize || MFI->hasCalls())
|
|
Offset -= getOffsetOfLocalArea();
|
|
|
|
return Offset;
|
|
}
|
|
|
|
bool
|
|
SystemZFrameLowering::spillCalleeSavedRegisters(MachineBasicBlock &MBB,
|
|
MachineBasicBlock::iterator MI,
|
|
const std::vector<CalleeSavedInfo> &CSI,
|
|
const TargetRegisterInfo *TRI) const {
|
|
if (CSI.empty())
|
|
return false;
|
|
|
|
DebugLoc DL;
|
|
if (MI != MBB.end()) DL = MI->getDebugLoc();
|
|
|
|
MachineFunction &MF = *MBB.getParent();
|
|
const TargetInstrInfo &TII = *MF.getTarget().getInstrInfo();
|
|
SystemZMachineFunctionInfo *MFI = MF.getInfo<SystemZMachineFunctionInfo>();
|
|
unsigned CalleeFrameSize = 0;
|
|
|
|
// Scan the callee-saved and find the bounds of register spill area.
|
|
unsigned LowReg = 0, HighReg = 0, StartOffset = -1U, EndOffset = 0;
|
|
for (unsigned i = 0, e = CSI.size(); i != e; ++i) {
|
|
unsigned Reg = CSI[i].getReg();
|
|
if (!SystemZ::FP64RegClass.contains(Reg)) {
|
|
unsigned Offset = RegSpillOffsets[Reg];
|
|
CalleeFrameSize += 8;
|
|
if (StartOffset > Offset) {
|
|
LowReg = Reg; StartOffset = Offset;
|
|
}
|
|
if (EndOffset < Offset) {
|
|
HighReg = Reg; EndOffset = RegSpillOffsets[Reg];
|
|
}
|
|
}
|
|
}
|
|
|
|
// Save information for epilogue inserter.
|
|
MFI->setCalleeSavedFrameSize(CalleeFrameSize);
|
|
MFI->setLowReg(LowReg); MFI->setHighReg(HighReg);
|
|
|
|
// Save GPRs
|
|
if (StartOffset) {
|
|
// Build a store instruction. Use STORE MULTIPLE instruction if there are many
|
|
// registers to store, otherwise - just STORE.
|
|
MachineInstrBuilder MIB =
|
|
BuildMI(MBB, MI, DL, TII.get((LowReg == HighReg ?
|
|
SystemZ::MOV64mr : SystemZ::MOV64mrm)));
|
|
|
|
// Add store operands.
|
|
MIB.addReg(SystemZ::R15D).addImm(StartOffset);
|
|
if (LowReg == HighReg)
|
|
MIB.addReg(0);
|
|
MIB.addReg(LowReg, RegState::Kill);
|
|
if (LowReg != HighReg)
|
|
MIB.addReg(HighReg, RegState::Kill);
|
|
|
|
// Do a second scan adding regs as being killed by instruction
|
|
for (unsigned i = 0, e = CSI.size(); i != e; ++i) {
|
|
unsigned Reg = CSI[i].getReg();
|
|
// Add the callee-saved register as live-in. It's killed at the spill.
|
|
MBB.addLiveIn(Reg);
|
|
if (Reg != LowReg && Reg != HighReg)
|
|
MIB.addReg(Reg, RegState::ImplicitKill);
|
|
}
|
|
}
|
|
|
|
// Save FPRs
|
|
for (unsigned i = 0, e = CSI.size(); i != e; ++i) {
|
|
unsigned Reg = CSI[i].getReg();
|
|
if (SystemZ::FP64RegClass.contains(Reg)) {
|
|
MBB.addLiveIn(Reg);
|
|
TII.storeRegToStackSlot(MBB, MI, Reg, true, CSI[i].getFrameIdx(),
|
|
&SystemZ::FP64RegClass, TRI);
|
|
}
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
bool
|
|
SystemZFrameLowering::restoreCalleeSavedRegisters(MachineBasicBlock &MBB,
|
|
MachineBasicBlock::iterator MI,
|
|
const std::vector<CalleeSavedInfo> &CSI,
|
|
const TargetRegisterInfo *TRI) const {
|
|
if (CSI.empty())
|
|
return false;
|
|
|
|
DebugLoc DL;
|
|
if (MI != MBB.end()) DL = MI->getDebugLoc();
|
|
|
|
MachineFunction &MF = *MBB.getParent();
|
|
const TargetInstrInfo &TII = *MF.getTarget().getInstrInfo();
|
|
SystemZMachineFunctionInfo *MFI = MF.getInfo<SystemZMachineFunctionInfo>();
|
|
|
|
// Restore FP registers
|
|
for (unsigned i = 0, e = CSI.size(); i != e; ++i) {
|
|
unsigned Reg = CSI[i].getReg();
|
|
if (SystemZ::FP64RegClass.contains(Reg))
|
|
TII.loadRegFromStackSlot(MBB, MI, Reg, CSI[i].getFrameIdx(),
|
|
&SystemZ::FP64RegClass, TRI);
|
|
}
|
|
|
|
// Restore GP registers
|
|
unsigned LowReg = MFI->getLowReg(), HighReg = MFI->getHighReg();
|
|
unsigned StartOffset = RegSpillOffsets[LowReg];
|
|
|
|
if (StartOffset) {
|
|
// Build a load instruction. Use LOAD MULTIPLE instruction if there are many
|
|
// registers to load, otherwise - just LOAD.
|
|
MachineInstrBuilder MIB =
|
|
BuildMI(MBB, MI, DL, TII.get((LowReg == HighReg ?
|
|
SystemZ::MOV64rm : SystemZ::MOV64rmm)));
|
|
// Add store operands.
|
|
MIB.addReg(LowReg, RegState::Define);
|
|
if (LowReg != HighReg)
|
|
MIB.addReg(HighReg, RegState::Define);
|
|
|
|
MIB.addReg(hasFP(MF) ? SystemZ::R11D : SystemZ::R15D);
|
|
MIB.addImm(StartOffset);
|
|
if (LowReg == HighReg)
|
|
MIB.addReg(0);
|
|
|
|
// Do a second scan adding regs as being defined by instruction
|
|
for (unsigned i = 0, e = CSI.size(); i != e; ++i) {
|
|
unsigned Reg = CSI[i].getReg();
|
|
if (Reg != LowReg && Reg != HighReg)
|
|
MIB.addReg(Reg, RegState::ImplicitDefine);
|
|
}
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
void
|
|
SystemZFrameLowering::processFunctionBeforeCalleeSavedScan(MachineFunction &MF,
|
|
RegScavenger *RS) const {
|
|
// Determine whether R15/R14 will ever be clobbered inside the function. And
|
|
// if yes - mark it as 'callee' saved.
|
|
MachineFrameInfo *FFI = MF.getFrameInfo();
|
|
MachineRegisterInfo &MRI = MF.getRegInfo();
|
|
|
|
// Check whether high FPRs are ever used, if yes - we need to save R15 as
|
|
// well.
|
|
static const unsigned HighFPRs[] = {
|
|
SystemZ::F8L, SystemZ::F9L, SystemZ::F10L, SystemZ::F11L,
|
|
SystemZ::F12L, SystemZ::F13L, SystemZ::F14L, SystemZ::F15L,
|
|
SystemZ::F8S, SystemZ::F9S, SystemZ::F10S, SystemZ::F11S,
|
|
SystemZ::F12S, SystemZ::F13S, SystemZ::F14S, SystemZ::F15S,
|
|
};
|
|
|
|
bool HighFPRsUsed = false;
|
|
for (unsigned i = 0, e = array_lengthof(HighFPRs); i != e; ++i)
|
|
HighFPRsUsed |= MRI.isPhysRegUsed(HighFPRs[i]);
|
|
|
|
if (FFI->hasCalls())
|
|
/* FIXME: function is varargs */
|
|
/* FIXME: function grabs RA */
|
|
/* FIXME: function calls eh_return */
|
|
MRI.setPhysRegUsed(SystemZ::R14D);
|
|
|
|
if (HighFPRsUsed ||
|
|
FFI->hasCalls() ||
|
|
FFI->getObjectIndexEnd() != 0 || // Contains automatic variables
|
|
FFI->hasVarSizedObjects() // Function calls dynamic alloca's
|
|
/* FIXME: function is varargs */)
|
|
MRI.setPhysRegUsed(SystemZ::R15D);
|
|
}
|