1
0
mirror of https://github.com/RPCS3/llvm-mirror.git synced 2024-11-25 12:12:47 +01:00
llvm-mirror/lib/Target/ARM/ARMHazardRecognizer.cpp
David Penry 94988510e6 [ARM] Add bank conflict hazarding
Adds ARMBankConflictHazardRecognizer. This hazard recognizer
looks for a few situations where the same base pointer is used and
then checks whether the offsets lead to a bank conflict. Two
parameters are also added to permit overriding of the target
assumptions:

arm-data-bank-mask=<int> - Mask of bits which are to be checked for
conflicts.  If all these bits are equal in the offsets, there is a
conflict.
arm-assume-itcm-bankconflict=<bool> - Assume that there will be bank
conflicts on any loads to a constant pool.

This hazard recognizer is enabled for Cortex-M7, where the Technical
Reference Manual states that there are two DTCM banks banked using bit
2 and one ITCM bank.

Differential Revision: https://reviews.llvm.org/D93054
2020-12-23 14:00:59 +00:00

269 lines
9.4 KiB
C++

//===-- ARMHazardRecognizer.cpp - ARM postra hazard recognizer ------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
#include "ARMHazardRecognizer.h"
#include "ARMBaseInstrInfo.h"
#include "ARMBaseRegisterInfo.h"
#include "ARMSubtarget.h"
#include "llvm/Analysis/ValueTracking.h"
#include "llvm/CodeGen/MachineInstr.h"
#include "llvm/CodeGen/ScheduleDAG.h"
#include "llvm/CodeGen/TargetRegisterInfo.h"
#include "llvm/Support/CommandLine.h"
using namespace llvm;
static cl::opt<int> DataBankMask("arm-data-bank-mask", cl::init(-1),
cl::Hidden);
static cl::opt<bool> AssumeITCMConflict("arm-assume-itcm-bankconflict",
cl::init(false), cl::Hidden);
static bool hasRAWHazard(MachineInstr *DefMI, MachineInstr *MI,
const TargetRegisterInfo &TRI) {
// FIXME: Detect integer instructions properly.
const MCInstrDesc &MCID = MI->getDesc();
unsigned Domain = MCID.TSFlags & ARMII::DomainMask;
if (MI->mayStore())
return false;
unsigned Opcode = MCID.getOpcode();
if (Opcode == ARM::VMOVRS || Opcode == ARM::VMOVRRD)
return false;
if ((Domain & ARMII::DomainVFP) || (Domain & ARMII::DomainNEON))
return MI->readsRegister(DefMI->getOperand(0).getReg(), &TRI);
return false;
}
ScheduleHazardRecognizer::HazardType
ARMHazardRecognizerFPMLx::getHazardType(SUnit *SU, int Stalls) {
assert(Stalls == 0 && "ARM hazards don't support scoreboard lookahead");
MachineInstr *MI = SU->getInstr();
if (!MI->isDebugInstr()) {
// Look for special VMLA / VMLS hazards. A VMUL / VADD / VSUB following
// a VMLA / VMLS will cause 4 cycle stall.
const MCInstrDesc &MCID = MI->getDesc();
if (LastMI && (MCID.TSFlags & ARMII::DomainMask) != ARMII::DomainGeneral) {
MachineInstr *DefMI = LastMI;
const MCInstrDesc &LastMCID = LastMI->getDesc();
const MachineFunction *MF = MI->getParent()->getParent();
const ARMBaseInstrInfo &TII = *static_cast<const ARMBaseInstrInfo *>(
MF->getSubtarget().getInstrInfo());
// Skip over one non-VFP / NEON instruction.
if (!LastMI->isBarrier() &&
!(TII.getSubtarget().hasMuxedUnits() && LastMI->mayLoadOrStore()) &&
(LastMCID.TSFlags & ARMII::DomainMask) == ARMII::DomainGeneral) {
MachineBasicBlock::iterator I = LastMI;
if (I != LastMI->getParent()->begin()) {
I = std::prev(I);
DefMI = &*I;
}
}
if (TII.isFpMLxInstruction(DefMI->getOpcode()) &&
(TII.canCauseFpMLxStall(MI->getOpcode()) ||
hasRAWHazard(DefMI, MI, TII.getRegisterInfo()))) {
// Try to schedule another instruction for the next 4 cycles.
if (FpMLxStalls == 0)
FpMLxStalls = 4;
return Hazard;
}
}
}
return NoHazard;
}
void ARMHazardRecognizerFPMLx::Reset() {
LastMI = nullptr;
FpMLxStalls = 0;
}
void ARMHazardRecognizerFPMLx::EmitInstruction(SUnit *SU) {
MachineInstr *MI = SU->getInstr();
if (!MI->isDebugInstr()) {
LastMI = MI;
FpMLxStalls = 0;
}
}
void ARMHazardRecognizerFPMLx::AdvanceCycle() {
if (FpMLxStalls && --FpMLxStalls == 0)
// Stalled for 4 cycles but still can't schedule any other instructions.
LastMI = nullptr;
}
void ARMHazardRecognizerFPMLx::RecedeCycle() {
llvm_unreachable("reverse ARM hazard checking unsupported");
}
///////// Bank conflicts handled as hazards //////////////
static bool getBaseOffset(const MachineInstr &MI, const MachineOperand *&BaseOp,
int64_t &Offset) {
uint64_t TSFlags = MI.getDesc().TSFlags;
unsigned AddrMode = (TSFlags & ARMII::AddrModeMask);
unsigned IndexMode =
(TSFlags & ARMII::IndexModeMask) >> ARMII::IndexModeShift;
// Address mode tells us what we want to know about operands for T2
// instructions (but not size). It tells us size (but not about operands)
// for T1 instructions.
switch (AddrMode) {
default:
return false;
case ARMII::AddrModeT2_i8:
// t2LDRBT, t2LDRB_POST, t2LDRB_PRE, t2LDRBi8,
// t2LDRHT, t2LDRH_POST, t2LDRH_PRE, t2LDRHi8,
// t2LDRSBT, t2LDRSB_POST, t2LDRSB_PRE, t2LDRSBi8,
// t2LDRSHT, t2LDRSH_POST, t2LDRSH_PRE, t2LDRSHi8,
// t2LDRT, t2LDR_POST, t2LDR_PRE, t2LDRi8
BaseOp = &MI.getOperand(1);
Offset = (IndexMode == ARMII::IndexModePost)
? 0
: (IndexMode == ARMII::IndexModePre ||
IndexMode == ARMII::IndexModeUpd)
? MI.getOperand(3).getImm()
: MI.getOperand(2).getImm();
return true;
case ARMII::AddrModeT2_i12:
// t2LDRBi12, t2LDRHi12
// t2LDRSBi12, t2LDRSHi12
// t2LDRi12
BaseOp = &MI.getOperand(1);
Offset = MI.getOperand(2).getImm();
return true;
case ARMII::AddrModeT2_i8s4:
// t2LDRD_POST, t2LDRD_PRE, t2LDRDi8
BaseOp = &MI.getOperand(2);
Offset = (IndexMode == ARMII::IndexModePost)
? 0
: (IndexMode == ARMII::IndexModePre ||
IndexMode == ARMII::IndexModeUpd)
? MI.getOperand(4).getImm()
: MI.getOperand(3).getImm();
return true;
case ARMII::AddrModeT1_1:
// tLDRBi, tLDRBr (watch out!), TLDRSB
case ARMII::AddrModeT1_2:
// tLDRHi, tLDRHr (watch out!), TLDRSH
case ARMII::AddrModeT1_4:
// tLDRi, tLDRr (watch out!)
BaseOp = &MI.getOperand(1);
Offset = MI.getOperand(2).isImm() ? MI.getOperand(2).getImm() : 0;
return MI.getOperand(2).isImm();
}
return false;
}
ARMBankConflictHazardRecognizer::ARMBankConflictHazardRecognizer(
const ScheduleDAG *DAG, int64_t CPUBankMask, bool CPUAssumeITCMConflict)
: ScheduleHazardRecognizer(), MF(DAG->MF), DL(DAG->MF.getDataLayout()),
DataMask(DataBankMask.getNumOccurrences() ? int64_t(DataBankMask)
: CPUBankMask),
AssumeITCMBankConflict(AssumeITCMConflict.getNumOccurrences()
? AssumeITCMConflict
: CPUAssumeITCMConflict) {
MaxLookAhead = 1;
}
ScheduleHazardRecognizer::HazardType
ARMBankConflictHazardRecognizer::CheckOffsets(unsigned O0, unsigned O1) {
return (((O0 ^ O1) & DataMask) != 0) ? NoHazard : Hazard;
}
ScheduleHazardRecognizer::HazardType
ARMBankConflictHazardRecognizer::getHazardType(SUnit *SU, int Stalls) {
MachineInstr &L0 = *SU->getInstr();
if (!L0.mayLoad() || L0.mayStore() || L0.getNumMemOperands() != 1)
return NoHazard;
auto MO0 = *L0.memoperands().begin();
auto BaseVal0 = MO0->getValue();
auto BasePseudoVal0 = MO0->getPseudoValue();
int64_t Offset0 = 0;
if (MO0->getSize() > 4)
return NoHazard;
bool SPvalid = false;
const MachineOperand *SP = nullptr;
int64_t SPOffset0 = 0;
for (auto L1 : Accesses) {
auto MO1 = *L1->memoperands().begin();
auto BaseVal1 = MO1->getValue();
auto BasePseudoVal1 = MO1->getPseudoValue();
int64_t Offset1 = 0;
// Pointers to the same object
if (BaseVal0 && BaseVal1) {
const Value *Ptr0, *Ptr1;
Ptr0 = GetPointerBaseWithConstantOffset(BaseVal0, Offset0, DL, true);
Ptr1 = GetPointerBaseWithConstantOffset(BaseVal1, Offset1, DL, true);
if (Ptr0 == Ptr1 && Ptr0)
return CheckOffsets(Offset0, Offset1);
}
if (BasePseudoVal0 && BasePseudoVal1 &&
BasePseudoVal0->kind() == BasePseudoVal1->kind() &&
BasePseudoVal0->kind() == PseudoSourceValue::FixedStack) {
// Spills/fills
auto FS0 = cast<FixedStackPseudoSourceValue>(BasePseudoVal0);
auto FS1 = cast<FixedStackPseudoSourceValue>(BasePseudoVal1);
Offset0 = MF.getFrameInfo().getObjectOffset(FS0->getFrameIndex());
Offset1 = MF.getFrameInfo().getObjectOffset(FS1->getFrameIndex());
return CheckOffsets(Offset0, Offset1);
}
// Constant pools (likely in ITCM)
if (BasePseudoVal0 && BasePseudoVal1 &&
BasePseudoVal0->kind() == BasePseudoVal1->kind() &&
BasePseudoVal0->isConstantPool() && AssumeITCMBankConflict)
return Hazard;
// Is this a stack pointer-relative access? We could in general try to
// use "is this the same register and is it unchanged?", but the
// memory operand tracking is highly likely to have already found that.
// What we're after here is bank conflicts between different objects in
// the stack frame.
if (!SPvalid) { // set up SP
if (!getBaseOffset(L0, SP, SPOffset0) || SP->getReg().id() != ARM::SP)
SP = nullptr;
SPvalid = true;
}
if (SP) {
int64_t SPOffset1;
const MachineOperand *SP1;
if (getBaseOffset(*L1, SP1, SPOffset1) && SP1->getReg().id() == ARM::SP)
return CheckOffsets(SPOffset0, SPOffset1);
}
}
return NoHazard;
}
void ARMBankConflictHazardRecognizer::Reset() { Accesses.clear(); }
void ARMBankConflictHazardRecognizer::EmitInstruction(SUnit *SU) {
MachineInstr &MI = *SU->getInstr();
if (!MI.mayLoad() || MI.mayStore() || MI.getNumMemOperands() != 1)
return;
auto MO = *MI.memoperands().begin();
uint64_t Size1 = MO->getSize();
if (Size1 > 4)
return;
Accesses.push_back(&MI);
}
void ARMBankConflictHazardRecognizer::AdvanceCycle() { Accesses.clear(); }
void ARMBankConflictHazardRecognizer::RecedeCycle() { Accesses.clear(); }