mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-26 04:32:44 +01:00
10839866a1
This patch implements initial backend support for a -mtune CPU controlled by a "tune-cpu" function attribute. If the attribute is not present, X86 will use the resolved CPU from the target-cpu attribute or the command line. This patch adds MC layer support for a tune CPU. Each CPU now has two sets of features stored in its GenSubtargetInfo.inc tables. These feature lists are passed separately to the Processor and ProcessorModel classes in tablegen. The tune list defaults to an empty list to avoid changes to non-X86 targets. This annoyingly increases the size of static tables on all targets, as we now store 24 more bytes per CPU. I haven't quantified the overall impact, but I can if we're concerned. One new test is added to X86 to show a few tuning features with mismatched tune-cpu and target-cpu/target-feature attributes to demonstrate independent control. Another new test is added to demonstrate that the scheduler model follows the tune CPU. I have not added a -mtune to llc/opt or the MC layer command line yet. With no attributes we'll just use the -mcpu for both. MC layer tools will always follow the normal CPU for tuning. Differential Revision: https://reviews.llvm.org/D85165
92 lines
3.0 KiB
C++
92 lines
3.0 KiB
C++
//=====-- NVPTXSubtarget.h - Define Subtarget for the NVPTX ---*- C++ -*--====//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file declares the NVPTX specific subclass of TargetSubtarget.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#ifndef LLVM_LIB_TARGET_NVPTX_NVPTXSUBTARGET_H
|
|
#define LLVM_LIB_TARGET_NVPTX_NVPTXSUBTARGET_H
|
|
|
|
#include "NVPTX.h"
|
|
#include "NVPTXFrameLowering.h"
|
|
#include "NVPTXISelLowering.h"
|
|
#include "NVPTXInstrInfo.h"
|
|
#include "NVPTXRegisterInfo.h"
|
|
#include "llvm/CodeGen/SelectionDAGTargetInfo.h"
|
|
#include "llvm/CodeGen/TargetSubtargetInfo.h"
|
|
#include "llvm/IR/DataLayout.h"
|
|
#include <string>
|
|
|
|
#define GET_SUBTARGETINFO_HEADER
|
|
#include "NVPTXGenSubtargetInfo.inc"
|
|
|
|
namespace llvm {
|
|
|
|
class NVPTXSubtarget : public NVPTXGenSubtargetInfo {
|
|
virtual void anchor();
|
|
std::string TargetName;
|
|
|
|
// PTX version x.y is represented as 10*x+y, e.g. 3.1 == 31
|
|
unsigned PTXVersion;
|
|
|
|
// SM version x.y is represented as 10*x+y, e.g. 3.1 == 31
|
|
unsigned int SmVersion;
|
|
|
|
const NVPTXTargetMachine &TM;
|
|
NVPTXInstrInfo InstrInfo;
|
|
NVPTXTargetLowering TLInfo;
|
|
SelectionDAGTargetInfo TSInfo;
|
|
|
|
// NVPTX does not have any call stack frame, but need a NVPTX specific
|
|
// FrameLowering class because TargetFrameLowering is abstract.
|
|
NVPTXFrameLowering FrameLowering;
|
|
|
|
public:
|
|
/// This constructor initializes the data members to match that
|
|
/// of the specified module.
|
|
///
|
|
NVPTXSubtarget(const Triple &TT, const std::string &CPU,
|
|
const std::string &FS, const NVPTXTargetMachine &TM);
|
|
|
|
const TargetFrameLowering *getFrameLowering() const override {
|
|
return &FrameLowering;
|
|
}
|
|
const NVPTXInstrInfo *getInstrInfo() const override { return &InstrInfo; }
|
|
const NVPTXRegisterInfo *getRegisterInfo() const override {
|
|
return &InstrInfo.getRegisterInfo();
|
|
}
|
|
const NVPTXTargetLowering *getTargetLowering() const override {
|
|
return &TLInfo;
|
|
}
|
|
const SelectionDAGTargetInfo *getSelectionDAGInfo() const override {
|
|
return &TSInfo;
|
|
}
|
|
|
|
bool hasAtomAddF64() const { return SmVersion >= 60; }
|
|
bool hasAtomScope() const { return SmVersion >= 60; }
|
|
bool hasAtomBitwise64() const { return SmVersion >= 32; }
|
|
bool hasAtomMinMax64() const { return SmVersion >= 32; }
|
|
bool hasLDG() const { return SmVersion >= 32; }
|
|
inline bool hasHWROT32() const { return SmVersion >= 32; }
|
|
bool hasImageHandles() const;
|
|
bool hasFP16Math() const { return SmVersion >= 53; }
|
|
bool allowFP16Math() const;
|
|
unsigned int getSmVersion() const { return SmVersion; }
|
|
std::string getTargetName() const { return TargetName; }
|
|
|
|
unsigned getPTXVersion() const { return PTXVersion; }
|
|
|
|
NVPTXSubtarget &initializeSubtargetDependencies(StringRef CPU, StringRef FS);
|
|
void ParseSubtargetFeatures(StringRef CPU, StringRef TuneCPU, StringRef FS);
|
|
};
|
|
|
|
} // End llvm namespace
|
|
|
|
#endif
|