mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-10-21 12:02:58 +02:00
ae65e281f3
to reflect the new license. We understand that people may be surprised that we're moving the header entirely to discuss the new license. We checked this carefully with the Foundation's lawyer and we believe this is the correct approach. Essentially, all code in the project is now made available by the LLVM project under our new license, so you will see that the license headers include that license only. Some of our contributors have contributed code under our old license, and accordingly, we have retained a copy of our old license notice in the top-level files in each project and repository. llvm-svn: 351636
408 lines
13 KiB
C++
408 lines
13 KiB
C++
//===- R600MergeVectorRegisters.cpp ---------------------------------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
/// \file
|
|
/// This pass merges inputs of swizzeable instructions into vector sharing
|
|
/// common data and/or have enough undef subreg using swizzle abilities.
|
|
///
|
|
/// For instance let's consider the following pseudo code :
|
|
/// %5 = REG_SEQ %1, sub0, %2, sub1, %3, sub2, undef, sub3
|
|
/// ...
|
|
/// %7 = REG_SEQ %1, sub0, %3, sub1, undef, sub2, %4, sub3
|
|
/// (swizzable Inst) %7, SwizzleMask : sub0, sub1, sub2, sub3
|
|
///
|
|
/// is turned into :
|
|
/// %5 = REG_SEQ %1, sub0, %2, sub1, %3, sub2, undef, sub3
|
|
/// ...
|
|
/// %7 = INSERT_SUBREG %4, sub3
|
|
/// (swizzable Inst) %7, SwizzleMask : sub0, sub2, sub1, sub3
|
|
///
|
|
/// This allow regalloc to reduce register pressure for vector registers and
|
|
/// to reduce MOV count.
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "AMDGPU.h"
|
|
#include "AMDGPUSubtarget.h"
|
|
#include "R600Defines.h"
|
|
#include "R600InstrInfo.h"
|
|
#include "MCTargetDesc/AMDGPUMCTargetDesc.h"
|
|
#include "llvm/ADT/DenseMap.h"
|
|
#include "llvm/ADT/STLExtras.h"
|
|
#include "llvm/ADT/StringRef.h"
|
|
#include "llvm/CodeGen/MachineBasicBlock.h"
|
|
#include "llvm/CodeGen/MachineDominators.h"
|
|
#include "llvm/CodeGen/MachineFunction.h"
|
|
#include "llvm/CodeGen/MachineFunctionPass.h"
|
|
#include "llvm/CodeGen/MachineInstr.h"
|
|
#include "llvm/CodeGen/MachineInstrBuilder.h"
|
|
#include "llvm/CodeGen/MachineLoopInfo.h"
|
|
#include "llvm/CodeGen/MachineOperand.h"
|
|
#include "llvm/CodeGen/MachineRegisterInfo.h"
|
|
#include "llvm/IR/DebugLoc.h"
|
|
#include "llvm/Pass.h"
|
|
#include "llvm/Support/Debug.h"
|
|
#include "llvm/Support/ErrorHandling.h"
|
|
#include "llvm/Support/raw_ostream.h"
|
|
#include <cassert>
|
|
#include <utility>
|
|
#include <vector>
|
|
|
|
using namespace llvm;
|
|
|
|
#define DEBUG_TYPE "vec-merger"
|
|
|
|
static bool
|
|
isImplicitlyDef(MachineRegisterInfo &MRI, unsigned Reg) {
|
|
for (MachineRegisterInfo::def_instr_iterator It = MRI.def_instr_begin(Reg),
|
|
E = MRI.def_instr_end(); It != E; ++It) {
|
|
return (*It).isImplicitDef();
|
|
}
|
|
if (MRI.isReserved(Reg)) {
|
|
return false;
|
|
}
|
|
llvm_unreachable("Reg without a def");
|
|
return false;
|
|
}
|
|
|
|
namespace {
|
|
|
|
class RegSeqInfo {
|
|
public:
|
|
MachineInstr *Instr;
|
|
DenseMap<unsigned, unsigned> RegToChan;
|
|
std::vector<unsigned> UndefReg;
|
|
|
|
RegSeqInfo(MachineRegisterInfo &MRI, MachineInstr *MI) : Instr(MI) {
|
|
assert(MI->getOpcode() == R600::REG_SEQUENCE);
|
|
for (unsigned i = 1, e = Instr->getNumOperands(); i < e; i+=2) {
|
|
MachineOperand &MO = Instr->getOperand(i);
|
|
unsigned Chan = Instr->getOperand(i + 1).getImm();
|
|
if (isImplicitlyDef(MRI, MO.getReg()))
|
|
UndefReg.push_back(Chan);
|
|
else
|
|
RegToChan[MO.getReg()] = Chan;
|
|
}
|
|
}
|
|
|
|
RegSeqInfo() = default;
|
|
|
|
bool operator==(const RegSeqInfo &RSI) const {
|
|
return RSI.Instr == Instr;
|
|
}
|
|
};
|
|
|
|
class R600VectorRegMerger : public MachineFunctionPass {
|
|
private:
|
|
using InstructionSetMap = DenseMap<unsigned, std::vector<MachineInstr *>>;
|
|
|
|
MachineRegisterInfo *MRI;
|
|
const R600InstrInfo *TII = nullptr;
|
|
DenseMap<MachineInstr *, RegSeqInfo> PreviousRegSeq;
|
|
InstructionSetMap PreviousRegSeqByReg;
|
|
InstructionSetMap PreviousRegSeqByUndefCount;
|
|
|
|
bool canSwizzle(const MachineInstr &MI) const;
|
|
bool areAllUsesSwizzeable(unsigned Reg) const;
|
|
void SwizzleInput(MachineInstr &,
|
|
const std::vector<std::pair<unsigned, unsigned>> &RemapChan) const;
|
|
bool tryMergeVector(const RegSeqInfo *Untouched, RegSeqInfo *ToMerge,
|
|
std::vector<std::pair<unsigned, unsigned>> &Remap) const;
|
|
bool tryMergeUsingCommonSlot(RegSeqInfo &RSI, RegSeqInfo &CompatibleRSI,
|
|
std::vector<std::pair<unsigned, unsigned>> &RemapChan);
|
|
bool tryMergeUsingFreeSlot(RegSeqInfo &RSI, RegSeqInfo &CompatibleRSI,
|
|
std::vector<std::pair<unsigned, unsigned>> &RemapChan);
|
|
MachineInstr *RebuildVector(RegSeqInfo *MI, const RegSeqInfo *BaseVec,
|
|
const std::vector<std::pair<unsigned, unsigned>> &RemapChan) const;
|
|
void RemoveMI(MachineInstr *);
|
|
void trackRSI(const RegSeqInfo &RSI);
|
|
|
|
public:
|
|
static char ID;
|
|
|
|
R600VectorRegMerger() : MachineFunctionPass(ID) {}
|
|
|
|
void getAnalysisUsage(AnalysisUsage &AU) const override {
|
|
AU.setPreservesCFG();
|
|
AU.addRequired<MachineDominatorTree>();
|
|
AU.addPreserved<MachineDominatorTree>();
|
|
AU.addRequired<MachineLoopInfo>();
|
|
AU.addPreserved<MachineLoopInfo>();
|
|
MachineFunctionPass::getAnalysisUsage(AU);
|
|
}
|
|
|
|
StringRef getPassName() const override {
|
|
return "R600 Vector Registers Merge Pass";
|
|
}
|
|
|
|
bool runOnMachineFunction(MachineFunction &Fn) override;
|
|
};
|
|
|
|
} // end anonymous namespace
|
|
|
|
INITIALIZE_PASS_BEGIN(R600VectorRegMerger, DEBUG_TYPE,
|
|
"R600 Vector Reg Merger", false, false)
|
|
INITIALIZE_PASS_END(R600VectorRegMerger, DEBUG_TYPE,
|
|
"R600 Vector Reg Merger", false, false)
|
|
|
|
char R600VectorRegMerger::ID = 0;
|
|
|
|
char &llvm::R600VectorRegMergerID = R600VectorRegMerger::ID;
|
|
|
|
bool R600VectorRegMerger::canSwizzle(const MachineInstr &MI)
|
|
const {
|
|
if (TII->get(MI.getOpcode()).TSFlags & R600_InstFlag::TEX_INST)
|
|
return true;
|
|
switch (MI.getOpcode()) {
|
|
case R600::R600_ExportSwz:
|
|
case R600::EG_ExportSwz:
|
|
return true;
|
|
default:
|
|
return false;
|
|
}
|
|
}
|
|
|
|
bool R600VectorRegMerger::tryMergeVector(const RegSeqInfo *Untouched,
|
|
RegSeqInfo *ToMerge, std::vector< std::pair<unsigned, unsigned>> &Remap)
|
|
const {
|
|
unsigned CurrentUndexIdx = 0;
|
|
for (DenseMap<unsigned, unsigned>::iterator It = ToMerge->RegToChan.begin(),
|
|
E = ToMerge->RegToChan.end(); It != E; ++It) {
|
|
DenseMap<unsigned, unsigned>::const_iterator PosInUntouched =
|
|
Untouched->RegToChan.find((*It).first);
|
|
if (PosInUntouched != Untouched->RegToChan.end()) {
|
|
Remap.push_back(std::pair<unsigned, unsigned>
|
|
((*It).second, (*PosInUntouched).second));
|
|
continue;
|
|
}
|
|
if (CurrentUndexIdx >= Untouched->UndefReg.size())
|
|
return false;
|
|
Remap.push_back(std::pair<unsigned, unsigned>
|
|
((*It).second, Untouched->UndefReg[CurrentUndexIdx++]));
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
static
|
|
unsigned getReassignedChan(
|
|
const std::vector<std::pair<unsigned, unsigned>> &RemapChan,
|
|
unsigned Chan) {
|
|
for (unsigned j = 0, je = RemapChan.size(); j < je; j++) {
|
|
if (RemapChan[j].first == Chan)
|
|
return RemapChan[j].second;
|
|
}
|
|
llvm_unreachable("Chan wasn't reassigned");
|
|
}
|
|
|
|
MachineInstr *R600VectorRegMerger::RebuildVector(
|
|
RegSeqInfo *RSI, const RegSeqInfo *BaseRSI,
|
|
const std::vector<std::pair<unsigned, unsigned>> &RemapChan) const {
|
|
unsigned Reg = RSI->Instr->getOperand(0).getReg();
|
|
MachineBasicBlock::iterator Pos = RSI->Instr;
|
|
MachineBasicBlock &MBB = *Pos->getParent();
|
|
DebugLoc DL = Pos->getDebugLoc();
|
|
|
|
unsigned SrcVec = BaseRSI->Instr->getOperand(0).getReg();
|
|
DenseMap<unsigned, unsigned> UpdatedRegToChan = BaseRSI->RegToChan;
|
|
std::vector<unsigned> UpdatedUndef = BaseRSI->UndefReg;
|
|
for (DenseMap<unsigned, unsigned>::iterator It = RSI->RegToChan.begin(),
|
|
E = RSI->RegToChan.end(); It != E; ++It) {
|
|
unsigned DstReg = MRI->createVirtualRegister(&R600::R600_Reg128RegClass);
|
|
unsigned SubReg = (*It).first;
|
|
unsigned Swizzle = (*It).second;
|
|
unsigned Chan = getReassignedChan(RemapChan, Swizzle);
|
|
|
|
MachineInstr *Tmp = BuildMI(MBB, Pos, DL, TII->get(R600::INSERT_SUBREG),
|
|
DstReg)
|
|
.addReg(SrcVec)
|
|
.addReg(SubReg)
|
|
.addImm(Chan);
|
|
UpdatedRegToChan[SubReg] = Chan;
|
|
std::vector<unsigned>::iterator ChanPos = llvm::find(UpdatedUndef, Chan);
|
|
if (ChanPos != UpdatedUndef.end())
|
|
UpdatedUndef.erase(ChanPos);
|
|
assert(!is_contained(UpdatedUndef, Chan) &&
|
|
"UpdatedUndef shouldn't contain Chan more than once!");
|
|
LLVM_DEBUG(dbgs() << " ->"; Tmp->dump(););
|
|
(void)Tmp;
|
|
SrcVec = DstReg;
|
|
}
|
|
MachineInstr *NewMI =
|
|
BuildMI(MBB, Pos, DL, TII->get(R600::COPY), Reg).addReg(SrcVec);
|
|
LLVM_DEBUG(dbgs() << " ->"; NewMI->dump(););
|
|
|
|
LLVM_DEBUG(dbgs() << " Updating Swizzle:\n");
|
|
for (MachineRegisterInfo::use_instr_iterator It = MRI->use_instr_begin(Reg),
|
|
E = MRI->use_instr_end(); It != E; ++It) {
|
|
LLVM_DEBUG(dbgs() << " "; (*It).dump(); dbgs() << " ->");
|
|
SwizzleInput(*It, RemapChan);
|
|
LLVM_DEBUG((*It).dump());
|
|
}
|
|
RSI->Instr->eraseFromParent();
|
|
|
|
// Update RSI
|
|
RSI->Instr = NewMI;
|
|
RSI->RegToChan = UpdatedRegToChan;
|
|
RSI->UndefReg = UpdatedUndef;
|
|
|
|
return NewMI;
|
|
}
|
|
|
|
void R600VectorRegMerger::RemoveMI(MachineInstr *MI) {
|
|
for (InstructionSetMap::iterator It = PreviousRegSeqByReg.begin(),
|
|
E = PreviousRegSeqByReg.end(); It != E; ++It) {
|
|
std::vector<MachineInstr *> &MIs = (*It).second;
|
|
MIs.erase(llvm::find(MIs, MI), MIs.end());
|
|
}
|
|
for (InstructionSetMap::iterator It = PreviousRegSeqByUndefCount.begin(),
|
|
E = PreviousRegSeqByUndefCount.end(); It != E; ++It) {
|
|
std::vector<MachineInstr *> &MIs = (*It).second;
|
|
MIs.erase(llvm::find(MIs, MI), MIs.end());
|
|
}
|
|
}
|
|
|
|
void R600VectorRegMerger::SwizzleInput(MachineInstr &MI,
|
|
const std::vector<std::pair<unsigned, unsigned>> &RemapChan) const {
|
|
unsigned Offset;
|
|
if (TII->get(MI.getOpcode()).TSFlags & R600_InstFlag::TEX_INST)
|
|
Offset = 2;
|
|
else
|
|
Offset = 3;
|
|
for (unsigned i = 0; i < 4; i++) {
|
|
unsigned Swizzle = MI.getOperand(i + Offset).getImm() + 1;
|
|
for (unsigned j = 0, e = RemapChan.size(); j < e; j++) {
|
|
if (RemapChan[j].first == Swizzle) {
|
|
MI.getOperand(i + Offset).setImm(RemapChan[j].second - 1);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
bool R600VectorRegMerger::areAllUsesSwizzeable(unsigned Reg) const {
|
|
for (MachineRegisterInfo::use_instr_iterator It = MRI->use_instr_begin(Reg),
|
|
E = MRI->use_instr_end(); It != E; ++It) {
|
|
if (!canSwizzle(*It))
|
|
return false;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
bool R600VectorRegMerger::tryMergeUsingCommonSlot(RegSeqInfo &RSI,
|
|
RegSeqInfo &CompatibleRSI,
|
|
std::vector<std::pair<unsigned, unsigned>> &RemapChan) {
|
|
for (MachineInstr::mop_iterator MOp = RSI.Instr->operands_begin(),
|
|
MOE = RSI.Instr->operands_end(); MOp != MOE; ++MOp) {
|
|
if (!MOp->isReg())
|
|
continue;
|
|
if (PreviousRegSeqByReg[MOp->getReg()].empty())
|
|
continue;
|
|
for (MachineInstr *MI : PreviousRegSeqByReg[MOp->getReg()]) {
|
|
CompatibleRSI = PreviousRegSeq[MI];
|
|
if (RSI == CompatibleRSI)
|
|
continue;
|
|
if (tryMergeVector(&CompatibleRSI, &RSI, RemapChan))
|
|
return true;
|
|
}
|
|
}
|
|
return false;
|
|
}
|
|
|
|
bool R600VectorRegMerger::tryMergeUsingFreeSlot(RegSeqInfo &RSI,
|
|
RegSeqInfo &CompatibleRSI,
|
|
std::vector<std::pair<unsigned, unsigned>> &RemapChan) {
|
|
unsigned NeededUndefs = 4 - RSI.UndefReg.size();
|
|
if (PreviousRegSeqByUndefCount[NeededUndefs].empty())
|
|
return false;
|
|
std::vector<MachineInstr *> &MIs =
|
|
PreviousRegSeqByUndefCount[NeededUndefs];
|
|
CompatibleRSI = PreviousRegSeq[MIs.back()];
|
|
tryMergeVector(&CompatibleRSI, &RSI, RemapChan);
|
|
return true;
|
|
}
|
|
|
|
void R600VectorRegMerger::trackRSI(const RegSeqInfo &RSI) {
|
|
for (DenseMap<unsigned, unsigned>::const_iterator
|
|
It = RSI.RegToChan.begin(), E = RSI.RegToChan.end(); It != E; ++It) {
|
|
PreviousRegSeqByReg[(*It).first].push_back(RSI.Instr);
|
|
}
|
|
PreviousRegSeqByUndefCount[RSI.UndefReg.size()].push_back(RSI.Instr);
|
|
PreviousRegSeq[RSI.Instr] = RSI;
|
|
}
|
|
|
|
bool R600VectorRegMerger::runOnMachineFunction(MachineFunction &Fn) {
|
|
if (skipFunction(Fn.getFunction()))
|
|
return false;
|
|
|
|
const R600Subtarget &ST = Fn.getSubtarget<R600Subtarget>();
|
|
TII = ST.getInstrInfo();
|
|
MRI = &Fn.getRegInfo();
|
|
|
|
for (MachineFunction::iterator MBB = Fn.begin(), MBBe = Fn.end();
|
|
MBB != MBBe; ++MBB) {
|
|
MachineBasicBlock *MB = &*MBB;
|
|
PreviousRegSeq.clear();
|
|
PreviousRegSeqByReg.clear();
|
|
PreviousRegSeqByUndefCount.clear();
|
|
|
|
for (MachineBasicBlock::iterator MII = MB->begin(), MIIE = MB->end();
|
|
MII != MIIE; ++MII) {
|
|
MachineInstr &MI = *MII;
|
|
if (MI.getOpcode() != R600::REG_SEQUENCE) {
|
|
if (TII->get(MI.getOpcode()).TSFlags & R600_InstFlag::TEX_INST) {
|
|
unsigned Reg = MI.getOperand(1).getReg();
|
|
for (MachineRegisterInfo::def_instr_iterator
|
|
It = MRI->def_instr_begin(Reg), E = MRI->def_instr_end();
|
|
It != E; ++It) {
|
|
RemoveMI(&(*It));
|
|
}
|
|
}
|
|
continue;
|
|
}
|
|
|
|
RegSeqInfo RSI(*MRI, &MI);
|
|
|
|
// All uses of MI are swizzeable ?
|
|
unsigned Reg = MI.getOperand(0).getReg();
|
|
if (!areAllUsesSwizzeable(Reg))
|
|
continue;
|
|
|
|
LLVM_DEBUG({
|
|
dbgs() << "Trying to optimize ";
|
|
MI.dump();
|
|
});
|
|
|
|
RegSeqInfo CandidateRSI;
|
|
std::vector<std::pair<unsigned, unsigned>> RemapChan;
|
|
LLVM_DEBUG(dbgs() << "Using common slots...\n";);
|
|
if (tryMergeUsingCommonSlot(RSI, CandidateRSI, RemapChan)) {
|
|
// Remove CandidateRSI mapping
|
|
RemoveMI(CandidateRSI.Instr);
|
|
MII = RebuildVector(&RSI, &CandidateRSI, RemapChan);
|
|
trackRSI(RSI);
|
|
continue;
|
|
}
|
|
LLVM_DEBUG(dbgs() << "Using free slots...\n";);
|
|
RemapChan.clear();
|
|
if (tryMergeUsingFreeSlot(RSI, CandidateRSI, RemapChan)) {
|
|
RemoveMI(CandidateRSI.Instr);
|
|
MII = RebuildVector(&RSI, &CandidateRSI, RemapChan);
|
|
trackRSI(RSI);
|
|
continue;
|
|
}
|
|
//Failed to merge
|
|
trackRSI(RSI);
|
|
}
|
|
}
|
|
return false;
|
|
}
|
|
|
|
llvm::FunctionPass *llvm::createR600VectorRegMerger() {
|
|
return new R600VectorRegMerger();
|
|
}
|