1
0
mirror of https://github.com/RPCS3/llvm-mirror.git synced 2025-01-31 20:51:52 +01:00

ScheduleDAG: Cleanup; NFC

- Fix doxygen comments (do not repeat documented name, remove definition
    comment if there is already one at the declaration, add \p, ...)
- Add some const modifiers
- Use range based for

llvm-svn: 295688
This commit is contained in:
Matthias Braun 2017-02-21 01:27:33 +00:00
parent 70dad586fc
commit 96cfe02f14
2 changed files with 322 additions and 393 deletions

View File

@ -7,9 +7,9 @@
// //
//===----------------------------------------------------------------------===// //===----------------------------------------------------------------------===//
// //
// This file implements the ScheduleDAG class, which is used as the common /// \file Implements the ScheduleDAG class, which is used as the common base
// base class for instruction schedulers. This encapsulates the scheduling DAG, /// class for instruction schedulers. This encapsulates the scheduling DAG,
// which is shared between SelectionDAG and MachineInstr scheduling. /// which is shared between SelectionDAG and MachineInstr scheduling.
// //
//===----------------------------------------------------------------------===// //===----------------------------------------------------------------------===//
@ -40,11 +40,11 @@ namespace llvm {
class TargetRegisterClass; class TargetRegisterClass;
template<class Graph> class GraphWriter; template<class Graph> class GraphWriter;
/// SDep - Scheduling dependency. This represents one direction of an /// Scheduling dependency. This represents one direction of an edge in the
/// edge in the scheduling DAG. /// scheduling DAG.
class SDep { class SDep {
public: public:
/// Kind - These are the different kinds of scheduling dependencies. /// These are the different kinds of scheduling dependencies.
enum Kind { enum Kind {
Data, ///< Regular data dependence (aka true-dependence). Data, ///< Regular data dependence (aka true-dependence).
Anti, ///< A register anti-dependedence (aka WAR). Anti, ///< A register anti-dependedence (aka WAR).
@ -71,33 +71,32 @@ namespace llvm {
}; };
private: private:
/// Dep - A pointer to the depending/depended-on SUnit, and an enum /// \brief A pointer to the depending/depended-on SUnit, and an enum
/// indicating the kind of the dependency. /// indicating the kind of the dependency.
PointerIntPair<SUnit *, 2, Kind> Dep; PointerIntPair<SUnit *, 2, Kind> Dep;
/// Contents - A union discriminated by the dependence kind. /// A union discriminated by the dependence kind.
union { union {
/// Reg - For Data, Anti, and Output dependencies, the associated /// For Data, Anti, and Output dependencies, the associated register. For
/// register. For Data dependencies that don't currently have a register /// Data dependencies that don't currently have a register/ assigned, this
/// assigned, this is set to zero. /// is set to zero.
unsigned Reg; unsigned Reg;
/// Order - Additional information about Order dependencies. /// Additional information about Order dependencies.
unsigned OrdKind; // enum OrderKind unsigned OrdKind; // enum OrderKind
} Contents; } Contents;
/// Latency - The time associated with this edge. Often this is just /// The time associated with this edge. Often this is just the value of the
/// the value of the Latency field of the predecessor, however advanced /// Latency field of the predecessor, however advanced models may provide
/// models may provide additional information about specific edges. /// additional information about specific edges.
unsigned Latency; unsigned Latency;
public: public:
/// SDep - Construct a null SDep. This is only for use by container /// Constructs a null SDep. This is only for use by container classes which
/// classes which require default constructors. SUnits may not /// require default constructors. SUnits may not/ have null SDep edges.
/// have null SDep edges.
SDep() : Dep(nullptr, Data) {} SDep() : Dep(nullptr, Data) {}
/// SDep - Construct an SDep with the specified values. /// Constructs an SDep with the specified values.
SDep(SUnit *S, Kind kind, unsigned Reg) SDep(SUnit *S, Kind kind, unsigned Reg)
: Dep(S, kind), Contents() { : Dep(S, kind), Contents() {
switch (kind) { switch (kind) {
@ -121,7 +120,7 @@ namespace llvm {
Contents.OrdKind = kind; Contents.OrdKind = kind;
} }
/// Return true if the specified SDep is equivalent except for latency. /// Returns true if the specified SDep is equivalent except for latency.
bool overlaps(const SDep &Other) const; bool overlaps(const SDep &Other) const;
bool operator==(const SDep &Other) const { bool operator==(const SDep &Other) const {
@ -132,100 +131,95 @@ namespace llvm {
return !operator==(Other); return !operator==(Other);
} }
/// getLatency - Return the latency value for this edge, which roughly /// \brief Returns the latency value for this edge, which roughly means the
/// means the minimum number of cycles that must elapse between the /// minimum number of cycles that must elapse between the predecessor and
/// predecessor and the successor, given that they have this edge /// the successor, given that they have this edge between them.
/// between them.
unsigned getLatency() const { unsigned getLatency() const {
return Latency; return Latency;
} }
/// setLatency - Set the latency for this edge. /// Sets the latency for this edge.
void setLatency(unsigned Lat) { void setLatency(unsigned Lat) {
Latency = Lat; Latency = Lat;
} }
//// getSUnit - Return the SUnit to which this edge points. //// Returns the SUnit to which this edge points.
SUnit *getSUnit() const; SUnit *getSUnit() const;
//// setSUnit - Assign the SUnit to which this edge points. //// Assigns the SUnit to which this edge points.
void setSUnit(SUnit *SU); void setSUnit(SUnit *SU);
/// getKind - Return an enum value representing the kind of the dependence. /// Returns an enum value representing the kind of the dependence.
Kind getKind() const; Kind getKind() const;
/// isCtrl - Shorthand for getKind() != SDep::Data. /// Shorthand for getKind() != SDep::Data.
bool isCtrl() const { bool isCtrl() const {
return getKind() != Data; return getKind() != Data;
} }
/// isNormalMemory - Test if this is an Order dependence between two /// \brief Tests if this is an Order dependence between two memory accesses
/// memory accesses where both sides of the dependence access memory /// where both sides of the dependence access memory in non-volatile and
/// in non-volatile and fully modeled ways. /// fully modeled ways.
bool isNormalMemory() const { bool isNormalMemory() const {
return getKind() == Order && (Contents.OrdKind == MayAliasMem return getKind() == Order && (Contents.OrdKind == MayAliasMem
|| Contents.OrdKind == MustAliasMem); || Contents.OrdKind == MustAliasMem);
} }
/// isBarrier - Test if this is an Order dependence that is marked /// Tests if this is an Order dependence that is marked as a barrier.
/// as a barrier.
bool isBarrier() const { bool isBarrier() const {
return getKind() == Order && Contents.OrdKind == Barrier; return getKind() == Order && Contents.OrdKind == Barrier;
} }
/// isNormalMemoryOrBarrier - Test if this is could be any kind of memory /// Tests if this is could be any kind of memory dependence.
/// dependence.
bool isNormalMemoryOrBarrier() const { bool isNormalMemoryOrBarrier() const {
return (isNormalMemory() || isBarrier()); return (isNormalMemory() || isBarrier());
} }
/// isMustAlias - Test if this is an Order dependence that is marked /// \brief Tests if this is an Order dependence that is marked as
/// as "must alias", meaning that the SUnits at either end of the edge /// "must alias", meaning that the SUnits at either end of the edge have a
/// have a memory dependence on a known memory location. /// memory dependence on a known memory location.
bool isMustAlias() const { bool isMustAlias() const {
return getKind() == Order && Contents.OrdKind == MustAliasMem; return getKind() == Order && Contents.OrdKind == MustAliasMem;
} }
/// isWeak - Test if this a weak dependence. Weak dependencies are /// Tests if this a weak dependence. Weak dependencies are considered DAG
/// considered DAG edges for height computation and other heuristics, but do /// edges for height computation and other heuristics, but do not force
/// not force ordering. Breaking a weak edge may require the scheduler to /// ordering. Breaking a weak edge may require the scheduler to compensate,
/// compensate, for example by inserting a copy. /// for example by inserting a copy.
bool isWeak() const { bool isWeak() const {
return getKind() == Order && Contents.OrdKind >= Weak; return getKind() == Order && Contents.OrdKind >= Weak;
} }
/// isArtificial - Test if this is an Order dependence that is marked /// \brief Tests if this is an Order dependence that is marked as
/// as "artificial", meaning it isn't necessary for correctness. /// "artificial", meaning it isn't necessary for correctness.
bool isArtificial() const { bool isArtificial() const {
return getKind() == Order && Contents.OrdKind == Artificial; return getKind() == Order && Contents.OrdKind == Artificial;
} }
/// isCluster - Test if this is an Order dependence that is marked /// \brief Tests if this is an Order dependence that is marked as "cluster",
/// as "cluster", meaning it is artificial and wants to be adjacent. /// meaning it is artificial and wants to be adjacent.
bool isCluster() const { bool isCluster() const {
return getKind() == Order && Contents.OrdKind == Cluster; return getKind() == Order && Contents.OrdKind == Cluster;
} }
/// isAssignedRegDep - Test if this is a Data dependence that is /// Tests if this is a Data dependence that is associated with a register.
/// associated with a register.
bool isAssignedRegDep() const { bool isAssignedRegDep() const {
return getKind() == Data && Contents.Reg != 0; return getKind() == Data && Contents.Reg != 0;
} }
/// getReg - Return the register associated with this edge. This is /// Returns the register associated with this edge. This is only valid on
/// only valid on Data, Anti, and Output edges. On Data edges, this /// Data, Anti, and Output edges. On Data edges, this value may be zero,
/// value may be zero, meaning there is no associated register. /// meaning there is no associated register.
unsigned getReg() const { unsigned getReg() const {
assert((getKind() == Data || getKind() == Anti || getKind() == Output) && assert((getKind() == Data || getKind() == Anti || getKind() == Output) &&
"getReg called on non-register dependence edge!"); "getReg called on non-register dependence edge!");
return Contents.Reg; return Contents.Reg;
} }
/// setReg - Assign the associated register for this edge. This is /// Assigns the associated register for this edge. This is only valid on
/// only valid on Data, Anti, and Output edges. On Anti and Output /// Data, Anti, and Output edges. On Anti and Output edges, this value must
/// edges, this value must not be zero. On Data edges, the value may /// not be zero. On Data edges, the value may be zero, which would mean that
/// be zero, which would mean that no specific register is associated /// no specific register is associated with this edge.
/// with this edge.
void setReg(unsigned Reg) { void setReg(unsigned Reg) {
assert((getKind() == Data || getKind() == Anti || getKind() == Output) && assert((getKind() == Data || getKind() == Anti || getKind() == Output) &&
"setReg called on non-register dependence edge!"); "setReg called on non-register dependence edge!");
@ -240,71 +234,70 @@ namespace llvm {
template <> template <>
struct isPodLike<SDep> { static const bool value = true; }; struct isPodLike<SDep> { static const bool value = true; };
/// SUnit - Scheduling unit. This is a node in the scheduling DAG. /// Scheduling unit. This is a node in the scheduling DAG.
class SUnit { class SUnit {
private: private:
enum : unsigned { BoundaryID = ~0u }; enum : unsigned { BoundaryID = ~0u };
SDNode *Node; // Representative node. SDNode *Node; ///< Representative node.
MachineInstr *Instr; // Alternatively, a MachineInstr. MachineInstr *Instr; ///< Alternatively, a MachineInstr.
public: public:
SUnit *OrigNode; // If not this, the node from which SUnit *OrigNode; ///< If not this, the node from which
// this node was cloned. /// this node was cloned.
// (SD scheduling only) /// (SD scheduling only)
const MCSchedClassDesc *SchedClass; // NULL or resolved SchedClass. const MCSchedClassDesc *SchedClass; ///< nullptr or resolved SchedClass.
// Preds/Succs - The SUnits before/after us in the graph. SmallVector<SDep, 4> Preds; ///< All sunit predecessors.
SmallVector<SDep, 4> Preds; // All sunit predecessors. SmallVector<SDep, 4> Succs; ///< All sunit successors.
SmallVector<SDep, 4> Succs; // All sunit successors.
typedef SmallVectorImpl<SDep>::iterator pred_iterator; typedef SmallVectorImpl<SDep>::iterator pred_iterator;
typedef SmallVectorImpl<SDep>::iterator succ_iterator; typedef SmallVectorImpl<SDep>::iterator succ_iterator;
typedef SmallVectorImpl<SDep>::const_iterator const_pred_iterator; typedef SmallVectorImpl<SDep>::const_iterator const_pred_iterator;
typedef SmallVectorImpl<SDep>::const_iterator const_succ_iterator; typedef SmallVectorImpl<SDep>::const_iterator const_succ_iterator;
unsigned NodeNum; // Entry # of node in the node vector. unsigned NodeNum; ///< Entry # of node in the node vector.
unsigned NodeQueueId; // Queue id of node. unsigned NodeQueueId; ///< Queue id of node.
unsigned NumPreds; // # of SDep::Data preds. unsigned NumPreds; ///< # of SDep::Data preds.
unsigned NumSuccs; // # of SDep::Data sucss. unsigned NumSuccs; ///< # of SDep::Data sucss.
unsigned NumPredsLeft; // # of preds not scheduled. unsigned NumPredsLeft; ///< # of preds not scheduled.
unsigned NumSuccsLeft; // # of succs not scheduled. unsigned NumSuccsLeft; ///< # of succs not scheduled.
unsigned WeakPredsLeft; // # of weak preds not scheduled. unsigned WeakPredsLeft; ///< # of weak preds not scheduled.
unsigned WeakSuccsLeft; // # of weak succs not scheduled. unsigned WeakSuccsLeft; ///< # of weak succs not scheduled.
unsigned short NumRegDefsLeft; // # of reg defs with no scheduled use. unsigned short NumRegDefsLeft; ///< # of reg defs with no scheduled use.
unsigned short Latency; // Node latency. unsigned short Latency; ///< Node latency.
bool isVRegCycle : 1; // May use and def the same vreg. bool isVRegCycle : 1; ///< May use and def the same vreg.
bool isCall : 1; // Is a function call. bool isCall : 1; ///< Is a function call.
bool isCallOp : 1; // Is a function call operand. bool isCallOp : 1; ///< Is a function call operand.
bool isTwoAddress : 1; // Is a two-address instruction. bool isTwoAddress : 1; ///< Is a two-address instruction.
bool isCommutable : 1; // Is a commutable instruction. bool isCommutable : 1; ///< Is a commutable instruction.
bool hasPhysRegUses : 1; // Has physreg uses. bool hasPhysRegUses : 1; ///< Has physreg uses.
bool hasPhysRegDefs : 1; // Has physreg defs that are being used. bool hasPhysRegDefs : 1; ///< Has physreg defs that are being used.
bool hasPhysRegClobbers : 1; // Has any physreg defs, used or not. bool hasPhysRegClobbers : 1; ///< Has any physreg defs, used or not.
bool isPending : 1; // True once pending. bool isPending : 1; ///< True once pending.
bool isAvailable : 1; // True once available. bool isAvailable : 1; ///< True once available.
bool isScheduled : 1; // True once scheduled. bool isScheduled : 1; ///< True once scheduled.
bool isScheduleHigh : 1; // True if preferable to schedule high. bool isScheduleHigh : 1; ///< True if preferable to schedule high.
bool isScheduleLow : 1; // True if preferable to schedule low. bool isScheduleLow : 1; ///< True if preferable to schedule low.
bool isCloned : 1; // True if this node has been cloned. bool isCloned : 1; ///< True if this node has been cloned.
bool isUnbuffered : 1; // Uses an unbuffered resource. bool isUnbuffered : 1; ///< Uses an unbuffered resource.
bool hasReservedResource : 1; // Uses a reserved resource. bool hasReservedResource : 1; ///< Uses a reserved resource.
Sched::Preference SchedulingPref; // Scheduling preference. Sched::Preference SchedulingPref; ///< Scheduling preference.
private: private:
bool isDepthCurrent : 1; // True if Depth is current. bool isDepthCurrent : 1; ///< True if Depth is current.
bool isHeightCurrent : 1; // True if Height is current. bool isHeightCurrent : 1; ///< True if Height is current.
unsigned Depth; // Node depth. unsigned Depth; ///< Node depth.
unsigned Height; // Node height. unsigned Height; ///< Node height.
public: public:
unsigned TopReadyCycle; // Cycle relative to start when node is ready. unsigned TopReadyCycle; ///< Cycle relative to start when node is ready.
unsigned BotReadyCycle; // Cycle relative to end when node is ready. unsigned BotReadyCycle; ///< Cycle relative to end when node is ready.
const TargetRegisterClass *CopyDstRC; // Is a special copy node if not null. const TargetRegisterClass *CopyDstRC; ///< Is a special copy node if !=null.
const TargetRegisterClass *CopySrcRC; const TargetRegisterClass *CopySrcRC;
/// SUnit - Construct an SUnit for pre-regalloc scheduling to represent /// \brief Constructs an SUnit for pre-regalloc scheduling to represent an
/// an SDNode and any nodes flagged to it. /// SDNode and any nodes flagged to it.
SUnit(SDNode *node, unsigned nodenum) SUnit(SDNode *node, unsigned nodenum)
: Node(node), Instr(nullptr), OrigNode(nullptr), SchedClass(nullptr), : Node(node), Instr(nullptr), OrigNode(nullptr), SchedClass(nullptr),
NodeNum(nodenum), NodeQueueId(0), NumPreds(0), NumSuccs(0), NodeNum(nodenum), NodeQueueId(0), NumPreds(0), NumSuccs(0),
@ -319,8 +312,8 @@ namespace llvm {
isHeightCurrent(false), Depth(0), Height(0), TopReadyCycle(0), isHeightCurrent(false), Depth(0), Height(0), TopReadyCycle(0),
BotReadyCycle(0), CopyDstRC(nullptr), CopySrcRC(nullptr) {} BotReadyCycle(0), CopyDstRC(nullptr), CopySrcRC(nullptr) {}
/// SUnit - Construct an SUnit for post-regalloc scheduling to represent /// \brief Constructs an SUnit for post-regalloc scheduling to represent a
/// a MachineInstr. /// MachineInstr.
SUnit(MachineInstr *instr, unsigned nodenum) SUnit(MachineInstr *instr, unsigned nodenum)
: Node(nullptr), Instr(instr), OrigNode(nullptr), SchedClass(nullptr), : Node(nullptr), Instr(instr), OrigNode(nullptr), SchedClass(nullptr),
NodeNum(nodenum), NodeQueueId(0), NumPreds(0), NumSuccs(0), NodeNum(nodenum), NodeQueueId(0), NumPreds(0), NumSuccs(0),
@ -335,7 +328,7 @@ namespace llvm {
isHeightCurrent(false), Depth(0), Height(0), TopReadyCycle(0), isHeightCurrent(false), Depth(0), Height(0), TopReadyCycle(0),
BotReadyCycle(0), CopyDstRC(nullptr), CopySrcRC(nullptr) {} BotReadyCycle(0), CopyDstRC(nullptr), CopySrcRC(nullptr) {}
/// SUnit - Construct a placeholder SUnit. /// \brief Constructs a placeholder SUnit.
SUnit() SUnit()
: Node(nullptr), Instr(nullptr), OrigNode(nullptr), SchedClass(nullptr), : Node(nullptr), Instr(nullptr), OrigNode(nullptr), SchedClass(nullptr),
NodeNum(BoundaryID), NodeQueueId(0), NumPreds(0), NumSuccs(0), NodeNum(BoundaryID), NodeQueueId(0), NumPreds(0), NumSuccs(0),
@ -359,46 +352,44 @@ namespace llvm {
/// an assoicative data structure keyed on node ID. /// an assoicative data structure keyed on node ID.
bool isBoundaryNode() const { return NodeNum == BoundaryID; } bool isBoundaryNode() const { return NodeNum == BoundaryID; }
/// setNode - Assign the representative SDNode for this SUnit. /// Assigns the representative SDNode for this SUnit. This may be used
/// This may be used during pre-regalloc scheduling. /// during pre-regalloc scheduling.
void setNode(SDNode *N) { void setNode(SDNode *N) {
assert(!Instr && "Setting SDNode of SUnit with MachineInstr!"); assert(!Instr && "Setting SDNode of SUnit with MachineInstr!");
Node = N; Node = N;
} }
/// getNode - Return the representative SDNode for this SUnit. /// Returns the representative SDNode for this SUnit. This may be used
/// This may be used during pre-regalloc scheduling. /// during pre-regalloc scheduling.
SDNode *getNode() const { SDNode *getNode() const {
assert(!Instr && "Reading SDNode of SUnit with MachineInstr!"); assert(!Instr && "Reading SDNode of SUnit with MachineInstr!");
return Node; return Node;
} }
/// isInstr - Return true if this SUnit refers to a machine instruction as /// \brief Returns true if this SUnit refers to a machine instruction as
/// opposed to an SDNode. /// opposed to an SDNode.
bool isInstr() const { return Instr; } bool isInstr() const { return Instr; }
/// setInstr - Assign the instruction for the SUnit. /// Assigns the instruction for the SUnit. This may be used during
/// This may be used during post-regalloc scheduling. /// post-regalloc scheduling.
void setInstr(MachineInstr *MI) { void setInstr(MachineInstr *MI) {
assert(!Node && "Setting MachineInstr of SUnit with SDNode!"); assert(!Node && "Setting MachineInstr of SUnit with SDNode!");
Instr = MI; Instr = MI;
} }
/// getInstr - Return the representative MachineInstr for this SUnit. /// Returns the representative MachineInstr for this SUnit. This may be used
/// This may be used during post-regalloc scheduling. /// during post-regalloc scheduling.
MachineInstr *getInstr() const { MachineInstr *getInstr() const {
assert(!Node && "Reading MachineInstr of SUnit with SDNode!"); assert(!Node && "Reading MachineInstr of SUnit with SDNode!");
return Instr; return Instr;
} }
/// addPred - This adds the specified edge as a pred of the current node if /// Adds the specified edge as a pred of the current node if not already.
/// not already. It also adds the current node as a successor of the /// It also adds the current node as a successor of the specified node.
/// specified node.
bool addPred(const SDep &D, bool Required = true); bool addPred(const SDep &D, bool Required = true);
/// addPredBarrier - This adds a barrier edge to SU by calling /// \brief Adds a barrier edge to SU by calling addPred(), with latency 0
/// addPred(), with latency 0 generally or latency 1 for a store /// generally or latency 1 for a store followed by a load.
/// followed by a load.
bool addPredBarrier(SUnit *SU) { bool addPredBarrier(SUnit *SU) {
SDep Dep(SU, SDep::Barrier); SDep Dep(SU, SDep::Barrier);
unsigned TrueMemOrderLatency = unsigned TrueMemOrderLatency =
@ -407,20 +398,19 @@ namespace llvm {
return addPred(Dep); return addPred(Dep);
} }
/// removePred - This removes the specified edge as a pred of the current /// Removes the specified edge as a pred of the current node if it exists.
/// node if it exists. It also removes the current node as a successor of /// It also removes the current node as a successor of the specified node.
/// the specified node.
void removePred(const SDep &D); void removePred(const SDep &D);
/// getDepth - Return the depth of this node, which is the length of the /// Returns the depth of this node, which is the length of the maximum path
/// maximum path up to any node which has no predecessors. /// up to any node which has no predecessors.
unsigned getDepth() const { unsigned getDepth() const {
if (!isDepthCurrent) if (!isDepthCurrent)
const_cast<SUnit *>(this)->ComputeDepth(); const_cast<SUnit *>(this)->ComputeDepth();
return Depth; return Depth;
} }
/// getHeight - Return the height of this node, which is the length of the /// \brief Returns the height of this node, which is the length of the
/// maximum path down to any node which has no successors. /// maximum path down to any node which has no successors.
unsigned getHeight() const { unsigned getHeight() const {
if (!isHeightCurrent) if (!isHeightCurrent)
@ -428,38 +418,36 @@ namespace llvm {
return Height; return Height;
} }
/// setDepthToAtLeast - If NewDepth is greater than this node's /// \brief If NewDepth is greater than this node's depth value, sets it to
/// depth value, set it to be the new depth value. This also /// be the new depth value. This also recursively marks successor nodes
/// recursively marks successor nodes dirty. /// dirty.
void setDepthToAtLeast(unsigned NewDepth); void setDepthToAtLeast(unsigned NewDepth);
/// setDepthToAtLeast - If NewDepth is greater than this node's /// \brief If NewDepth is greater than this node's depth value, set it to be
/// depth value, set it to be the new height value. This also /// the new height value. This also recursively marks predecessor nodes
/// recursively marks predecessor nodes dirty. /// dirty.
void setHeightToAtLeast(unsigned NewHeight); void setHeightToAtLeast(unsigned NewHeight);
/// setDepthDirty - Set a flag in this node to indicate that its /// \brief Sets a flag in this node to indicate that its stored Depth value
/// stored Depth value will require recomputation the next time /// will require recomputation the next time getDepth() is called.
/// getDepth() is called.
void setDepthDirty(); void setDepthDirty();
/// setHeightDirty - Set a flag in this node to indicate that its /// \brief Sets a flag in this node to indicate that its stored Height value
/// stored Height value will require recomputation the next time /// will require recomputation the next time getHeight() is called.
/// getHeight() is called.
void setHeightDirty(); void setHeightDirty();
/// isPred - Test if node N is a predecessor of this node. /// Tests if node N is a predecessor of this node.
bool isPred(SUnit *N) { bool isPred(const SUnit *N) const {
for (unsigned i = 0, e = (unsigned)Preds.size(); i != e; ++i) for (const SDep &Pred : Preds)
if (Preds[i].getSUnit() == N) if (Pred.getSUnit() == N)
return true; return true;
return false; return false;
} }
/// isSucc - Test if node N is a successor of this node. /// Tests if node N is a successor of this node.
bool isSucc(SUnit *N) { bool isSucc(const SUnit *N) const {
for (unsigned i = 0, e = (unsigned)Succs.size(); i != e; ++i) for (const SDep &Succ : Succs)
if (Succs[i].getSUnit() == N) if (Succ.getSUnit() == N)
return true; return true;
return false; return false;
} }
@ -471,7 +459,7 @@ namespace llvm {
return NumSuccsLeft == 0; return NumSuccsLeft == 0;
} }
/// \brief Order this node's predecessor edges such that the critical path /// \brief Orders this node's predecessor edges such that the critical path
/// edge occurs first. /// edge occurs first.
void biasCriticalPath(); void biasCriticalPath();
@ -484,7 +472,7 @@ namespace llvm {
void ComputeHeight(); void ComputeHeight();
}; };
/// Return true if the specified SDep is equivalent except for latency. /// Returns true if the specified SDep is equivalent except for latency.
inline bool SDep::overlaps(const SDep &Other) const { inline bool SDep::overlaps(const SDep &Other) const {
if (Dep != Other.Dep) if (Dep != Other.Dep)
return false; return false;
@ -499,23 +487,23 @@ namespace llvm {
llvm_unreachable("Invalid dependency kind!"); llvm_unreachable("Invalid dependency kind!");
} }
//// getSUnit - Return the SUnit to which this edge points. //// Returns the SUnit to which this edge points.
inline SUnit *SDep::getSUnit() const { return Dep.getPointer(); } inline SUnit *SDep::getSUnit() const { return Dep.getPointer(); }
//// setSUnit - Assign the SUnit to which this edge points. //// Assigns the SUnit to which this edge points.
inline void SDep::setSUnit(SUnit *SU) { Dep.setPointer(SU); } inline void SDep::setSUnit(SUnit *SU) { Dep.setPointer(SU); }
/// getKind - Return an enum value representing the kind of the dependence. /// Returns an enum value representing the kind of the dependence.
inline SDep::Kind SDep::getKind() const { return Dep.getInt(); } inline SDep::Kind SDep::getKind() const { return Dep.getInt(); }
//===--------------------------------------------------------------------===// //===--------------------------------------------------------------------===//
/// SchedulingPriorityQueue - This interface is used to plug different
/// priorities computation algorithms into the list scheduler. It implements /// \brief This interface is used to plug different priorities computation
/// the interface of a standard priority queue, where nodes are inserted in /// algorithms into the list scheduler. It implements the interface of a
/// arbitrary order and returned in priority order. The computation of the /// standard priority queue, where nodes are inserted in arbitrary order and
/// priority and the representation of the queue are totally up to the /// returned in priority order. The computation of the priority and the
/// implementation to decide. /// representation of the queue are totally up to the implementation to
/// /// decide.
class SchedulingPriorityQueue { class SchedulingPriorityQueue {
virtual void anchor(); virtual void anchor();
unsigned CurCycle; unsigned CurCycle;
@ -556,10 +544,9 @@ namespace llvm {
virtual void dump(ScheduleDAG *) const {} virtual void dump(ScheduleDAG *) const {}
/// scheduledNode - As each node is scheduled, this method is invoked. This /// As each node is scheduled, this method is invoked. This allows the
/// allows the priority function to adjust the priority of related /// priority function to adjust the priority of related unscheduled nodes,
/// unscheduled nodes, for example. /// for example.
///
virtual void scheduledNode(SUnit *) {} virtual void scheduledNode(SUnit *) {}
virtual void unscheduledNode(SUnit *) {} virtual void unscheduledNode(SUnit *) {}
@ -575,14 +562,14 @@ namespace llvm {
class ScheduleDAG { class ScheduleDAG {
public: public:
const TargetMachine &TM; // Target processor const TargetMachine &TM; ///< Target processor
const TargetInstrInfo *TII; // Target instruction information const TargetInstrInfo *TII; ///< Target instruction information
const TargetRegisterInfo *TRI; // Target processor register info const TargetRegisterInfo *TRI; ///< Target processor register info
MachineFunction &MF; // Machine function MachineFunction &MF; ///< Machine function
MachineRegisterInfo &MRI; // Virtual/real register map MachineRegisterInfo &MRI; ///< Virtual/real register map
std::vector<SUnit> SUnits; // The scheduling units. std::vector<SUnit> SUnits; ///< The scheduling units.
SUnit EntrySU; // Special node for the region entry. SUnit EntrySU; ///< Special node for the region entry.
SUnit ExitSU; // Special node for the region exit. SUnit ExitSU; ///< Special node for the region exit.
#ifdef NDEBUG #ifdef NDEBUG
static const bool StressSched = false; static const bool StressSched = false;
@ -594,43 +581,39 @@ namespace llvm {
virtual ~ScheduleDAG(); virtual ~ScheduleDAG();
/// clearDAG - clear the DAG state (between regions). /// Clears the DAG state (between regions).
void clearDAG(); void clearDAG();
/// getInstrDesc - Return the MCInstrDesc of this SUnit. /// Returns the MCInstrDesc of this SUnit.
/// Return NULL for SDNodes without a machine opcode. /// Returns NULL for SDNodes without a machine opcode.
const MCInstrDesc *getInstrDesc(const SUnit *SU) const { const MCInstrDesc *getInstrDesc(const SUnit *SU) const {
if (SU->isInstr()) return &SU->getInstr()->getDesc(); if (SU->isInstr()) return &SU->getInstr()->getDesc();
return getNodeDesc(SU->getNode()); return getNodeDesc(SU->getNode());
} }
/// viewGraph - Pop up a GraphViz/gv window with the ScheduleDAG rendered /// Pops up a GraphViz/gv window with the ScheduleDAG rendered using 'dot'.
/// using 'dot'.
///
virtual void viewGraph(const Twine &Name, const Twine &Title); virtual void viewGraph(const Twine &Name, const Twine &Title);
virtual void viewGraph(); virtual void viewGraph();
virtual void dumpNode(const SUnit *SU) const = 0; virtual void dumpNode(const SUnit *SU) const = 0;
/// getGraphNodeLabel - Return a label for an SUnit node in a visualization /// Returns a label for an SUnit node in a visualization of the ScheduleDAG.
/// of the ScheduleDAG.
virtual std::string getGraphNodeLabel(const SUnit *SU) const = 0; virtual std::string getGraphNodeLabel(const SUnit *SU) const = 0;
/// getDAGLabel - Return a label for the region of code covered by the DAG. /// Returns a label for the region of code covered by the DAG.
virtual std::string getDAGName() const = 0; virtual std::string getDAGName() const = 0;
/// addCustomGraphFeatures - Add custom features for a visualization of /// Adds custom features for a visualization of the ScheduleDAG.
/// the ScheduleDAG.
virtual void addCustomGraphFeatures(GraphWriter<ScheduleDAG*> &) const {} virtual void addCustomGraphFeatures(GraphWriter<ScheduleDAG*> &) const {}
#ifndef NDEBUG #ifndef NDEBUG
/// VerifyScheduledDAG - Verify that all SUnits were scheduled and that /// \brief Verifies that all SUnits were scheduled and that their state is
/// their state is consistent. Return the number of scheduled SUnits. /// consistent. Returns the number of scheduled SUnits.
unsigned VerifyScheduledDAG(bool isBottomUp); unsigned VerifyScheduledDAG(bool isBottomUp);
#endif #endif
private: private:
// Return the MCInstrDesc of this SDNode or NULL. /// Returns the MCInstrDesc of this SDNode or NULL.
const MCInstrDesc *getNodeDesc(const SDNode *Node) const; const MCInstrDesc *getNodeDesc(const SDNode *Node) const;
}; };
@ -666,7 +649,7 @@ namespace llvm {
unsigned getOperand() const { return Operand; } unsigned getOperand() const { return Operand; }
const SUnit *getNode() const { return Node; } const SUnit *getNode() const { return Node; }
/// isCtrlDep - Test if this is not an SDep::Data dependence. /// Tests if this is not an SDep::Data dependence.
bool isCtrlDep() const { bool isCtrlDep() const {
return getSDep().isCtrl(); return getSDep().isCtrl();
} }
@ -700,56 +683,53 @@ namespace llvm {
} }
}; };
/// ScheduleDAGTopologicalSort is a class that computes a topological /// This class can compute a topological ordering for SUnits and provides
/// ordering for SUnits and provides methods for dynamically updating /// methods for dynamically updating the ordering as new edges are added.
/// the ordering as new edges are added.
/// ///
/// This allows a very fast implementation of IsReachable, for example. /// This allows a very fast implementation of IsReachable, for example.
///
class ScheduleDAGTopologicalSort { class ScheduleDAGTopologicalSort {
/// SUnits - A reference to the ScheduleDAG's SUnits. /// A reference to the ScheduleDAG's SUnits.
std::vector<SUnit> &SUnits; std::vector<SUnit> &SUnits;
SUnit *ExitSU; SUnit *ExitSU;
/// Index2Node - Maps topological index to the node number. /// Maps topological index to the node number.
std::vector<int> Index2Node; std::vector<int> Index2Node;
/// Node2Index - Maps the node number to its topological index. /// Maps the node number to its topological index.
std::vector<int> Node2Index; std::vector<int> Node2Index;
/// Visited - a set of nodes visited during a DFS traversal. /// a set of nodes visited during a DFS traversal.
BitVector Visited; BitVector Visited;
/// DFS - make a DFS traversal and mark all nodes affected by the /// Makes a DFS traversal and mark all nodes affected by the edge insertion.
/// edge insertion. These nodes will later get new topological indexes /// These nodes will later get new topological indexes by means of the Shift
/// by means of the Shift method. /// method.
void DFS(const SUnit *SU, int UpperBound, bool& HasLoop); void DFS(const SUnit *SU, int UpperBound, bool& HasLoop);
/// Shift - reassign topological indexes for the nodes in the DAG /// \brief Reassigns topological indexes for the nodes in the DAG to
/// to preserve the topological ordering. /// preserve the topological ordering.
void Shift(BitVector& Visited, int LowerBound, int UpperBound); void Shift(BitVector& Visited, int LowerBound, int UpperBound);
/// Allocate - assign the topological index to the node n. /// Assigns the topological index to the node n.
void Allocate(int n, int index); void Allocate(int n, int index);
public: public:
ScheduleDAGTopologicalSort(std::vector<SUnit> &SUnits, SUnit *ExitSU); ScheduleDAGTopologicalSort(std::vector<SUnit> &SUnits, SUnit *ExitSU);
/// InitDAGTopologicalSorting - create the initial topological /// Creates the initial topological ordering from the DAG to be scheduled.
/// ordering from the DAG to be scheduled.
void InitDAGTopologicalSorting(); void InitDAGTopologicalSorting();
/// IsReachable - Checks if SU is reachable from TargetSU. /// Checks if \p SU is reachable from \p TargetSU.
bool IsReachable(const SUnit *SU, const SUnit *TargetSU); bool IsReachable(const SUnit *SU, const SUnit *TargetSU);
/// WillCreateCycle - Return true if addPred(TargetSU, SU) creates a cycle. /// Returns true if addPred(TargetSU, SU) creates a cycle.
bool WillCreateCycle(SUnit *TargetSU, SUnit *SU); bool WillCreateCycle(SUnit *TargetSU, SUnit *SU);
/// AddPred - Updates the topological ordering to accommodate an edge /// \brief Updates the topological ordering to accommodate an edge to be
/// to be added from SUnit X to SUnit Y. /// added from SUnit \p X to SUnit \p Y.
void AddPred(SUnit *Y, SUnit *X); void AddPred(SUnit *Y, SUnit *X);
/// RemovePred - Updates the topological ordering to accommodate an /// \brief Updates the topological ordering to accommodate an an edge to be
/// an edge to be removed from the specified node N from the predecessors /// removed from the specified node \p N from the predecessors of the
/// of the current node M. /// current node \p M.
void RemovePred(SUnit *M, SUnit *N); void RemovePred(SUnit *M, SUnit *N);
typedef std::vector<int>::iterator iterator; typedef std::vector<int>::iterator iterator;

View File

@ -7,8 +7,8 @@
// //
//===----------------------------------------------------------------------===// //===----------------------------------------------------------------------===//
// //
// This implements the ScheduleDAG class, which is a base class used by /// \file Implements the ScheduleDAG class, which is a base class used by
// scheduling implementation classes. /// scheduling implementation classes.
// //
//===----------------------------------------------------------------------===// //===----------------------------------------------------------------------===//
@ -46,45 +46,39 @@ ScheduleDAG::ScheduleDAG(MachineFunction &mf)
ScheduleDAG::~ScheduleDAG() {} ScheduleDAG::~ScheduleDAG() {}
/// Clear the DAG state (e.g. between scheduling regions).
void ScheduleDAG::clearDAG() { void ScheduleDAG::clearDAG() {
SUnits.clear(); SUnits.clear();
EntrySU = SUnit(); EntrySU = SUnit();
ExitSU = SUnit(); ExitSU = SUnit();
} }
/// getInstrDesc helper to handle SDNodes.
const MCInstrDesc *ScheduleDAG::getNodeDesc(const SDNode *Node) const { const MCInstrDesc *ScheduleDAG::getNodeDesc(const SDNode *Node) const {
if (!Node || !Node->isMachineOpcode()) return nullptr; if (!Node || !Node->isMachineOpcode()) return nullptr;
return &TII->get(Node->getMachineOpcode()); return &TII->get(Node->getMachineOpcode());
} }
/// addPred - This adds the specified edge as a pred of the current node if
/// not already. It also adds the current node as a successor of the
/// specified node.
bool SUnit::addPred(const SDep &D, bool Required) { bool SUnit::addPred(const SDep &D, bool Required) {
// If this node already has this dependence, don't add a redundant one. // If this node already has this dependence, don't add a redundant one.
for (SmallVectorImpl<SDep>::iterator I = Preds.begin(), E = Preds.end(); for (SDep &PredDep : Preds) {
I != E; ++I) {
// Zero-latency weak edges may be added purely for heuristic ordering. Don't // Zero-latency weak edges may be added purely for heuristic ordering. Don't
// add them if another kind of edge already exists. // add them if another kind of edge already exists.
if (!Required && I->getSUnit() == D.getSUnit()) if (!Required && PredDep.getSUnit() == D.getSUnit())
return false; return false;
if (I->overlaps(D)) { if (PredDep.overlaps(D)) {
// Extend the latency if needed. Equivalent to removePred(I) + addPred(D). // Extend the latency if needed. Equivalent to
if (I->getLatency() < D.getLatency()) { // removePred(PredDep) + addPred(D).
SUnit *PredSU = I->getSUnit(); if (PredDep.getLatency() < D.getLatency()) {
SUnit *PredSU = PredDep.getSUnit();
// Find the corresponding successor in N. // Find the corresponding successor in N.
SDep ForwardD = *I; SDep ForwardD = PredDep;
ForwardD.setSUnit(this); ForwardD.setSUnit(this);
for (SmallVectorImpl<SDep>::iterator II = PredSU->Succs.begin(), for (SDep &SuccDep : PredSU->Succs) {
EE = PredSU->Succs.end(); II != EE; ++II) { if (SuccDep == ForwardD) {
if (*II == ForwardD) { SuccDep.setLatency(D.getLatency());
II->setLatency(D.getLatency());
break; break;
} }
} }
I->setLatency(D.getLatency()); PredDep.setLatency(D.getLatency());
} }
return false; return false;
} }
@ -127,51 +121,46 @@ bool SUnit::addPred(const SDep &D, bool Required) {
return true; return true;
} }
/// removePred - This removes the specified edge as a pred of the current
/// node if it exists. It also removes the current node as a successor of
/// the specified node.
void SUnit::removePred(const SDep &D) { void SUnit::removePred(const SDep &D) {
// Find the matching predecessor. // Find the matching predecessor.
for (SmallVectorImpl<SDep>::iterator I = Preds.begin(), E = Preds.end(); SmallVectorImpl<SDep>::iterator I = find(Preds, D);
I != E; ++I) if (I == Preds.end())
if (*I == D) { return;
// Find the corresponding successor in N. // Find the corresponding successor in N.
SDep P = D; SDep P = D;
P.setSUnit(this); P.setSUnit(this);
SUnit *N = D.getSUnit(); SUnit *N = D.getSUnit();
SmallVectorImpl<SDep>::iterator Succ = find(N->Succs, P); SmallVectorImpl<SDep>::iterator Succ = find(N->Succs, P);
assert(Succ != N->Succs.end() && "Mismatching preds / succs lists!"); assert(Succ != N->Succs.end() && "Mismatching preds / succs lists!");
N->Succs.erase(Succ); N->Succs.erase(Succ);
Preds.erase(I); Preds.erase(I);
// Update the bookkeeping. // Update the bookkeeping.
if (P.getKind() == SDep::Data) { if (P.getKind() == SDep::Data) {
assert(NumPreds > 0 && "NumPreds will underflow!"); assert(NumPreds > 0 && "NumPreds will underflow!");
assert(N->NumSuccs > 0 && "NumSuccs will underflow!"); assert(N->NumSuccs > 0 && "NumSuccs will underflow!");
--NumPreds; --NumPreds;
--N->NumSuccs; --N->NumSuccs;
} }
if (!N->isScheduled) { if (!N->isScheduled) {
if (D.isWeak()) if (D.isWeak())
--WeakPredsLeft; --WeakPredsLeft;
else { else {
assert(NumPredsLeft > 0 && "NumPredsLeft will underflow!"); assert(NumPredsLeft > 0 && "NumPredsLeft will underflow!");
--NumPredsLeft; --NumPredsLeft;
}
}
if (!isScheduled) {
if (D.isWeak())
--N->WeakSuccsLeft;
else {
assert(N->NumSuccsLeft > 0 && "NumSuccsLeft will underflow!");
--N->NumSuccsLeft;
}
}
if (P.getLatency() != 0) {
this->setDepthDirty();
N->setHeightDirty();
}
return;
} }
}
if (!isScheduled) {
if (D.isWeak())
--N->WeakSuccsLeft;
else {
assert(N->NumSuccsLeft > 0 && "NumSuccsLeft will underflow!");
--N->NumSuccsLeft;
}
}
if (P.getLatency() != 0) {
this->setDepthDirty();
N->setHeightDirty();
}
} }
void SUnit::setDepthDirty() { void SUnit::setDepthDirty() {
@ -181,9 +170,8 @@ void SUnit::setDepthDirty() {
do { do {
SUnit *SU = WorkList.pop_back_val(); SUnit *SU = WorkList.pop_back_val();
SU->isDepthCurrent = false; SU->isDepthCurrent = false;
for (SUnit::const_succ_iterator I = SU->Succs.begin(), for (SDep &SuccDep : SU->Succs) {
E = SU->Succs.end(); I != E; ++I) { SUnit *SuccSU = SuccDep.getSUnit();
SUnit *SuccSU = I->getSUnit();
if (SuccSU->isDepthCurrent) if (SuccSU->isDepthCurrent)
WorkList.push_back(SuccSU); WorkList.push_back(SuccSU);
} }
@ -197,18 +185,14 @@ void SUnit::setHeightDirty() {
do { do {
SUnit *SU = WorkList.pop_back_val(); SUnit *SU = WorkList.pop_back_val();
SU->isHeightCurrent = false; SU->isHeightCurrent = false;
for (SUnit::const_pred_iterator I = SU->Preds.begin(), for (SDep &PredDep : SU->Preds) {
E = SU->Preds.end(); I != E; ++I) { SUnit *PredSU = PredDep.getSUnit();
SUnit *PredSU = I->getSUnit();
if (PredSU->isHeightCurrent) if (PredSU->isHeightCurrent)
WorkList.push_back(PredSU); WorkList.push_back(PredSU);
} }
} while (!WorkList.empty()); } while (!WorkList.empty());
} }
/// setDepthToAtLeast - Update this node's successors to reflect the
/// fact that this node's depth just increased.
///
void SUnit::setDepthToAtLeast(unsigned NewDepth) { void SUnit::setDepthToAtLeast(unsigned NewDepth) {
if (NewDepth <= getDepth()) if (NewDepth <= getDepth())
return; return;
@ -217,9 +201,6 @@ void SUnit::setDepthToAtLeast(unsigned NewDepth) {
isDepthCurrent = true; isDepthCurrent = true;
} }
/// setHeightToAtLeast - Update this node's predecessors to reflect the
/// fact that this node's height just increased.
///
void SUnit::setHeightToAtLeast(unsigned NewHeight) { void SUnit::setHeightToAtLeast(unsigned NewHeight) {
if (NewHeight <= getHeight()) if (NewHeight <= getHeight())
return; return;
@ -228,8 +209,7 @@ void SUnit::setHeightToAtLeast(unsigned NewHeight) {
isHeightCurrent = true; isHeightCurrent = true;
} }
/// ComputeDepth - Calculate the maximal path from the node to the exit. /// Calculates the maximal path from the node to the exit.
///
void SUnit::ComputeDepth() { void SUnit::ComputeDepth() {
SmallVector<SUnit*, 8> WorkList; SmallVector<SUnit*, 8> WorkList;
WorkList.push_back(this); WorkList.push_back(this);
@ -238,12 +218,11 @@ void SUnit::ComputeDepth() {
bool Done = true; bool Done = true;
unsigned MaxPredDepth = 0; unsigned MaxPredDepth = 0;
for (SUnit::const_pred_iterator I = Cur->Preds.begin(), for (const SDep &PredDep : Cur->Preds) {
E = Cur->Preds.end(); I != E; ++I) { SUnit *PredSU = PredDep.getSUnit();
SUnit *PredSU = I->getSUnit();
if (PredSU->isDepthCurrent) if (PredSU->isDepthCurrent)
MaxPredDepth = std::max(MaxPredDepth, MaxPredDepth = std::max(MaxPredDepth,
PredSU->Depth + I->getLatency()); PredSU->Depth + PredDep.getLatency());
else { else {
Done = false; Done = false;
WorkList.push_back(PredSU); WorkList.push_back(PredSU);
@ -261,8 +240,7 @@ void SUnit::ComputeDepth() {
} while (!WorkList.empty()); } while (!WorkList.empty());
} }
/// ComputeHeight - Calculate the maximal path from the node to the entry. /// Calculates the maximal path from the node to the entry.
///
void SUnit::ComputeHeight() { void SUnit::ComputeHeight() {
SmallVector<SUnit*, 8> WorkList; SmallVector<SUnit*, 8> WorkList;
WorkList.push_back(this); WorkList.push_back(this);
@ -271,12 +249,11 @@ void SUnit::ComputeHeight() {
bool Done = true; bool Done = true;
unsigned MaxSuccHeight = 0; unsigned MaxSuccHeight = 0;
for (SUnit::const_succ_iterator I = Cur->Succs.begin(), for (const SDep &SuccDep : Cur->Succs) {
E = Cur->Succs.end(); I != E; ++I) { SUnit *SuccSU = SuccDep.getSUnit();
SUnit *SuccSU = I->getSUnit();
if (SuccSU->isHeightCurrent) if (SuccSU->isHeightCurrent)
MaxSuccHeight = std::max(MaxSuccHeight, MaxSuccHeight = std::max(MaxSuccHeight,
SuccSU->Height + I->getLatency()); SuccSU->Height + SuccDep.getLatency());
else { else {
Done = false; Done = false;
WorkList.push_back(SuccSU); WorkList.push_back(SuccSU);
@ -320,8 +297,6 @@ void SUnit::print(raw_ostream &OS, const ScheduleDAG *DAG) const {
OS << "SU(" << NodeNum << ")"; OS << "SU(" << NodeNum << ")";
} }
/// SUnit - Scheduling unit. It's an wrapper around either a single SDNode or
/// a group of nodes flagged together.
LLVM_DUMP_METHOD void SUnit::dump(const ScheduleDAG *G) const { LLVM_DUMP_METHOD void SUnit::dump(const ScheduleDAG *G) const {
print(dbgs(), G); print(dbgs(), G);
dbgs() << ": "; dbgs() << ": ";
@ -344,41 +319,39 @@ LLVM_DUMP_METHOD void SUnit::dumpAll(const ScheduleDAG *G) const {
if (Preds.size() != 0) { if (Preds.size() != 0) {
dbgs() << " Predecessors:\n"; dbgs() << " Predecessors:\n";
for (SUnit::const_succ_iterator I = Preds.begin(), E = Preds.end(); for (const SDep &SuccDep : Preds) {
I != E; ++I) {
dbgs() << " "; dbgs() << " ";
switch (I->getKind()) { switch (SuccDep.getKind()) {
case SDep::Data: dbgs() << "data "; break; case SDep::Data: dbgs() << "data "; break;
case SDep::Anti: dbgs() << "anti "; break; case SDep::Anti: dbgs() << "anti "; break;
case SDep::Output: dbgs() << "out "; break; case SDep::Output: dbgs() << "out "; break;
case SDep::Order: dbgs() << "ord "; break; case SDep::Order: dbgs() << "ord "; break;
} }
I->getSUnit()->print(dbgs(), G); SuccDep.getSUnit()->print(dbgs(), G);
if (I->isArtificial()) if (SuccDep.isArtificial())
dbgs() << " *"; dbgs() << " *";
dbgs() << ": Latency=" << I->getLatency(); dbgs() << ": Latency=" << SuccDep.getLatency();
if (I->isAssignedRegDep()) if (SuccDep.isAssignedRegDep())
dbgs() << " Reg=" << PrintReg(I->getReg(), G->TRI); dbgs() << " Reg=" << PrintReg(SuccDep.getReg(), G->TRI);
dbgs() << "\n"; dbgs() << "\n";
} }
} }
if (Succs.size() != 0) { if (Succs.size() != 0) {
dbgs() << " Successors:\n"; dbgs() << " Successors:\n";
for (SUnit::const_succ_iterator I = Succs.begin(), E = Succs.end(); for (const SDep &SuccDep : Succs) {
I != E; ++I) {
dbgs() << " "; dbgs() << " ";
switch (I->getKind()) { switch (SuccDep.getKind()) {
case SDep::Data: dbgs() << "data "; break; case SDep::Data: dbgs() << "data "; break;
case SDep::Anti: dbgs() << "anti "; break; case SDep::Anti: dbgs() << "anti "; break;
case SDep::Output: dbgs() << "out "; break; case SDep::Output: dbgs() << "out "; break;
case SDep::Order: dbgs() << "ord "; break; case SDep::Order: dbgs() << "ord "; break;
} }
I->getSUnit()->print(dbgs(), G); SuccDep.getSUnit()->print(dbgs(), G);
if (I->isArtificial()) if (SuccDep.isArtificial())
dbgs() << " *"; dbgs() << " *";
dbgs() << ": Latency=" << I->getLatency(); dbgs() << ": Latency=" << SuccDep.getLatency();
if (I->isAssignedRegDep()) if (SuccDep.isAssignedRegDep())
dbgs() << " Reg=" << PrintReg(I->getReg(), G->TRI); dbgs() << " Reg=" << PrintReg(SuccDep.getReg(), G->TRI);
dbgs() << "\n"; dbgs() << "\n";
} }
} }
@ -386,47 +359,44 @@ LLVM_DUMP_METHOD void SUnit::dumpAll(const ScheduleDAG *G) const {
#endif #endif
#ifndef NDEBUG #ifndef NDEBUG
/// VerifyScheduledDAG - Verify that all SUnits were scheduled and that
/// their state is consistent. Return the number of scheduled nodes.
///
unsigned ScheduleDAG::VerifyScheduledDAG(bool isBottomUp) { unsigned ScheduleDAG::VerifyScheduledDAG(bool isBottomUp) {
bool AnyNotSched = false; bool AnyNotSched = false;
unsigned DeadNodes = 0; unsigned DeadNodes = 0;
for (unsigned i = 0, e = SUnits.size(); i != e; ++i) { for (const SUnit &SUnit : SUnits) {
if (!SUnits[i].isScheduled) { if (!SUnit.isScheduled) {
if (SUnits[i].NumPreds == 0 && SUnits[i].NumSuccs == 0) { if (SUnit.NumPreds == 0 && SUnit.NumSuccs == 0) {
++DeadNodes; ++DeadNodes;
continue; continue;
} }
if (!AnyNotSched) if (!AnyNotSched)
dbgs() << "*** Scheduling failed! ***\n"; dbgs() << "*** Scheduling failed! ***\n";
SUnits[i].dump(this); SUnit.dump(this);
dbgs() << "has not been scheduled!\n"; dbgs() << "has not been scheduled!\n";
AnyNotSched = true; AnyNotSched = true;
} }
if (SUnits[i].isScheduled && if (SUnit.isScheduled &&
(isBottomUp ? SUnits[i].getHeight() : SUnits[i].getDepth()) > (isBottomUp ? SUnit.getHeight() : SUnit.getDepth()) >
unsigned(INT_MAX)) { unsigned(INT_MAX)) {
if (!AnyNotSched) if (!AnyNotSched)
dbgs() << "*** Scheduling failed! ***\n"; dbgs() << "*** Scheduling failed! ***\n";
SUnits[i].dump(this); SUnit.dump(this);
dbgs() << "has an unexpected " dbgs() << "has an unexpected "
<< (isBottomUp ? "Height" : "Depth") << " value!\n"; << (isBottomUp ? "Height" : "Depth") << " value!\n";
AnyNotSched = true; AnyNotSched = true;
} }
if (isBottomUp) { if (isBottomUp) {
if (SUnits[i].NumSuccsLeft != 0) { if (SUnit.NumSuccsLeft != 0) {
if (!AnyNotSched) if (!AnyNotSched)
dbgs() << "*** Scheduling failed! ***\n"; dbgs() << "*** Scheduling failed! ***\n";
SUnits[i].dump(this); SUnit.dump(this);
dbgs() << "has successors left!\n"; dbgs() << "has successors left!\n";
AnyNotSched = true; AnyNotSched = true;
} }
} else { } else {
if (SUnits[i].NumPredsLeft != 0) { if (SUnit.NumPredsLeft != 0) {
if (!AnyNotSched) if (!AnyNotSched)
dbgs() << "*** Scheduling failed! ***\n"; dbgs() << "*** Scheduling failed! ***\n";
SUnits[i].dump(this); SUnit.dump(this);
dbgs() << "has predecessors left!\n"; dbgs() << "has predecessors left!\n";
AnyNotSched = true; AnyNotSched = true;
} }
@ -437,36 +407,33 @@ unsigned ScheduleDAG::VerifyScheduledDAG(bool isBottomUp) {
} }
#endif #endif
/// InitDAGTopologicalSorting - create the initial topological
/// ordering from the DAG to be scheduled.
///
/// The idea of the algorithm is taken from
/// "Online algorithms for managing the topological order of
/// a directed acyclic graph" by David J. Pearce and Paul H.J. Kelly
/// This is the MNR algorithm, which was first introduced by
/// A. Marchetti-Spaccamela, U. Nanni and H. Rohnert in
/// "Maintaining a topological order under edge insertions".
///
/// Short description of the algorithm:
///
/// Topological ordering, ord, of a DAG maps each node to a topological
/// index so that for all edges X->Y it is the case that ord(X) < ord(Y).
///
/// This means that if there is a path from the node X to the node Z,
/// then ord(X) < ord(Z).
///
/// This property can be used to check for reachability of nodes:
/// if Z is reachable from X, then an insertion of the edge Z->X would
/// create a cycle.
///
/// The algorithm first computes a topological ordering for the DAG by
/// initializing the Index2Node and Node2Index arrays and then tries to keep
/// the ordering up-to-date after edge insertions by reordering the DAG.
///
/// On insertion of the edge X->Y, the algorithm first marks by calling DFS
/// the nodes reachable from Y, and then shifts them using Shift to lie
/// immediately after X in Index2Node.
void ScheduleDAGTopologicalSort::InitDAGTopologicalSorting() { void ScheduleDAGTopologicalSort::InitDAGTopologicalSorting() {
// The idea of the algorithm is taken from
// "Online algorithms for managing the topological order of
// a directed acyclic graph" by David J. Pearce and Paul H.J. Kelly
// This is the MNR algorithm, which was first introduced by
// A. Marchetti-Spaccamela, U. Nanni and H. Rohnert in
// "Maintaining a topological order under edge insertions".
//
// Short description of the algorithm:
//
// Topological ordering, ord, of a DAG maps each node to a topological
// index so that for all edges X->Y it is the case that ord(X) < ord(Y).
//
// This means that if there is a path from the node X to the node Z,
// then ord(X) < ord(Z).
//
// This property can be used to check for reachability of nodes:
// if Z is reachable from X, then an insertion of the edge Z->X would
// create a cycle.
//
// The algorithm first computes a topological ordering for the DAG by
// initializing the Index2Node and Node2Index arrays and then tries to keep
// the ordering up-to-date after edge insertions by reordering the DAG.
//
// On insertion of the edge X->Y, the algorithm first marks by calling DFS
// the nodes reachable from Y, and then shifts them using Shift to lie
// immediately after X in Index2Node.
unsigned DAGSize = SUnits.size(); unsigned DAGSize = SUnits.size();
std::vector<SUnit*> WorkList; std::vector<SUnit*> WorkList;
WorkList.reserve(DAGSize); WorkList.reserve(DAGSize);
@ -477,18 +444,17 @@ void ScheduleDAGTopologicalSort::InitDAGTopologicalSorting() {
// Initialize the data structures. // Initialize the data structures.
if (ExitSU) if (ExitSU)
WorkList.push_back(ExitSU); WorkList.push_back(ExitSU);
for (unsigned i = 0, e = DAGSize; i != e; ++i) { for (SUnit &SU : SUnits) {
SUnit *SU = &SUnits[i]; int NodeNum = SU.NodeNum;
int NodeNum = SU->NodeNum; unsigned Degree = SU.Succs.size();
unsigned Degree = SU->Succs.size();
// Temporarily use the Node2Index array as scratch space for degree counts. // Temporarily use the Node2Index array as scratch space for degree counts.
Node2Index[NodeNum] = Degree; Node2Index[NodeNum] = Degree;
// Is it a node without dependencies? // Is it a node without dependencies?
if (Degree == 0) { if (Degree == 0) {
assert(SU->Succs.empty() && "SUnit should have no successors"); assert(SU.Succs.empty() && "SUnit should have no successors");
// Collect leaf nodes. // Collect leaf nodes.
WorkList.push_back(SU); WorkList.push_back(&SU);
} }
} }
@ -498,9 +464,8 @@ void ScheduleDAGTopologicalSort::InitDAGTopologicalSorting() {
WorkList.pop_back(); WorkList.pop_back();
if (SU->NodeNum < DAGSize) if (SU->NodeNum < DAGSize)
Allocate(SU->NodeNum, --Id); Allocate(SU->NodeNum, --Id);
for (SUnit::const_pred_iterator I = SU->Preds.begin(), E = SU->Preds.end(); for (const SDep &PredDep : SU->Preds) {
I != E; ++I) { SUnit *SU = PredDep.getSUnit();
SUnit *SU = I->getSUnit();
if (SU->NodeNum < DAGSize && !--Node2Index[SU->NodeNum]) if (SU->NodeNum < DAGSize && !--Node2Index[SU->NodeNum])
// If all dependencies of the node are processed already, // If all dependencies of the node are processed already,
// then the node can be computed now. // then the node can be computed now.
@ -512,19 +477,15 @@ void ScheduleDAGTopologicalSort::InitDAGTopologicalSorting() {
#ifndef NDEBUG #ifndef NDEBUG
// Check correctness of the ordering // Check correctness of the ordering
for (unsigned i = 0, e = DAGSize; i != e; ++i) { for (SUnit &SU : SUnits) {
SUnit *SU = &SUnits[i]; for (const SDep &PD : SU.Preds) {
for (SUnit::const_pred_iterator I = SU->Preds.begin(), E = SU->Preds.end(); assert(Node2Index[SU.NodeNum] > Node2Index[PD.getSUnit()->NodeNum] &&
I != E; ++I) {
assert(Node2Index[SU->NodeNum] > Node2Index[I->getSUnit()->NodeNum] &&
"Wrong topological sorting"); "Wrong topological sorting");
} }
} }
#endif #endif
} }
/// AddPred - Updates the topological ordering to accommodate an edge
/// to be added from SUnit X to SUnit Y.
void ScheduleDAGTopologicalSort::AddPred(SUnit *Y, SUnit *X) { void ScheduleDAGTopologicalSort::AddPred(SUnit *Y, SUnit *X) {
int UpperBound, LowerBound; int UpperBound, LowerBound;
LowerBound = Node2Index[Y->NodeNum]; LowerBound = Node2Index[Y->NodeNum];
@ -541,16 +502,10 @@ void ScheduleDAGTopologicalSort::AddPred(SUnit *Y, SUnit *X) {
} }
} }
/// RemovePred - Updates the topological ordering to accommodate an
/// an edge to be removed from the specified node N from the predecessors
/// of the current node M.
void ScheduleDAGTopologicalSort::RemovePred(SUnit *M, SUnit *N) { void ScheduleDAGTopologicalSort::RemovePred(SUnit *M, SUnit *N) {
// InitDAGTopologicalSorting(); // InitDAGTopologicalSorting();
} }
/// DFS - Make a DFS traversal to mark all nodes reachable from SU and mark
/// all nodes affected by the edge insertion. These nodes will later get new
/// topological indexes by means of the Shift method.
void ScheduleDAGTopologicalSort::DFS(const SUnit *SU, int UpperBound, void ScheduleDAGTopologicalSort::DFS(const SUnit *SU, int UpperBound,
bool &HasLoop) { bool &HasLoop) {
std::vector<const SUnit*> WorkList; std::vector<const SUnit*> WorkList;
@ -561,8 +516,9 @@ void ScheduleDAGTopologicalSort::DFS(const SUnit *SU, int UpperBound,
SU = WorkList.back(); SU = WorkList.back();
WorkList.pop_back(); WorkList.pop_back();
Visited.set(SU->NodeNum); Visited.set(SU->NodeNum);
for (int I = SU->Succs.size()-1; I >= 0; --I) { for (const SDep &SuccDep
unsigned s = SU->Succs[I].getSUnit()->NodeNum; : make_range(SU->Succs.rbegin(), SU->Succs.rend())) {
unsigned s = SuccDep.getSUnit()->NodeNum;
// Edges to non-SUnits are allowed but ignored (e.g. ExitSU). // Edges to non-SUnits are allowed but ignored (e.g. ExitSU).
if (s >= Node2Index.size()) if (s >= Node2Index.size())
continue; continue;
@ -572,14 +528,12 @@ void ScheduleDAGTopologicalSort::DFS(const SUnit *SU, int UpperBound,
} }
// Visit successors if not already and in affected region. // Visit successors if not already and in affected region.
if (!Visited.test(s) && Node2Index[s] < UpperBound) { if (!Visited.test(s) && Node2Index[s] < UpperBound) {
WorkList.push_back(SU->Succs[I].getSUnit()); WorkList.push_back(SuccDep.getSUnit());
} }
} }
} while (!WorkList.empty()); } while (!WorkList.empty());
} }
/// Shift - Renumber the nodes so that the topological ordering is
/// preserved.
void ScheduleDAGTopologicalSort::Shift(BitVector& Visited, int LowerBound, void ScheduleDAGTopologicalSort::Shift(BitVector& Visited, int LowerBound,
int UpperBound) { int UpperBound) {
std::vector<int> L; std::vector<int> L;
@ -599,28 +553,24 @@ void ScheduleDAGTopologicalSort::Shift(BitVector& Visited, int LowerBound,
} }
} }
for (unsigned j = 0; j < L.size(); ++j) { for (unsigned LI : L) {
Allocate(L[j], i - shift); Allocate(LI, i - shift);
i = i + 1; i = i + 1;
} }
} }
/// WillCreateCycle - Returns true if adding an edge to TargetSU from SU will
/// create a cycle. If so, it is not safe to call AddPred(TargetSU, SU).
bool ScheduleDAGTopologicalSort::WillCreateCycle(SUnit *TargetSU, SUnit *SU) { bool ScheduleDAGTopologicalSort::WillCreateCycle(SUnit *TargetSU, SUnit *SU) {
// Is SU reachable from TargetSU via successor edges? // Is SU reachable from TargetSU via successor edges?
if (IsReachable(SU, TargetSU)) if (IsReachable(SU, TargetSU))
return true; return true;
for (SUnit::pred_iterator for (const SDep &PredDep : TargetSU->Preds)
I = TargetSU->Preds.begin(), E = TargetSU->Preds.end(); I != E; ++I) if (PredDep.isAssignedRegDep() &&
if (I->isAssignedRegDep() && IsReachable(SU, PredDep.getSUnit()))
IsReachable(SU, I->getSUnit()))
return true; return true;
return false; return false;
} }
/// IsReachable - Checks if SU is reachable from TargetSU.
bool ScheduleDAGTopologicalSort::IsReachable(const SUnit *SU, bool ScheduleDAGTopologicalSort::IsReachable(const SUnit *SU,
const SUnit *TargetSU) { const SUnit *TargetSU) {
// If insertion of the edge SU->TargetSU would create a cycle // If insertion of the edge SU->TargetSU would create a cycle
@ -638,7 +588,6 @@ bool ScheduleDAGTopologicalSort::IsReachable(const SUnit *SU,
return HasLoop; return HasLoop;
} }
/// Allocate - assign the topological index to the node n.
void ScheduleDAGTopologicalSort::Allocate(int n, int index) { void ScheduleDAGTopologicalSort::Allocate(int n, int index) {
Node2Index[n] = index; Node2Index[n] = index;
Index2Node[index] = n; Index2Node[index] = n;