Go to the documentation of this file.
25 #include "llvm/Config/llvm-config.h"
39 #define DEBUG_TYPE "pre-RA-sched"
41 STATISTIC(NumNewPredsAdded,
"Number of times a single predecessor was added");
43 "Number of times the topological order has been recomputed");
48 cl::desc(
"Stress test instruction scheduling"));
51 void SchedulingPriorityQueue::anchor() {}
54 :
TM(mf.getTarget()),
TII(mf.getSubtarget().getInstrInfo()),
55 TRI(mf.getSubtarget().getRegisterInfo()), MF(mf),
56 MRI(mf.getRegInfo()) {
71 if (!Node || !Node->isMachineOpcode())
return nullptr;
72 return &
TII->
get(Node->getMachineOpcode());
95 switch(Contents.OrdKind) {
100 case Weak:
dbgs() <<
" Weak";
break;
112 if (!
Required && PredDep.getSUnit() ==
D.getSUnit())
114 if (PredDep.overlaps(
D)) {
117 if (PredDep.getLatency() <
D.getLatency()) {
118 SUnit *PredSU = PredDep.getSUnit();
120 SDep ForwardD = PredDep;
123 if (SuccDep == ForwardD) {
128 PredDep.setLatency(
D.getLatency());
140 "NumPreds will overflow!");
142 "NumSuccs will overflow!");
146 if (!
N->isScheduled) {
152 "NumPredsLeft will overflow!");
162 "NumSuccsLeft will overflow!");
167 N->Succs.push_back(
P);
168 if (
P.getLatency() != 0) {
185 assert(Succ !=
N->Succs.end() &&
"Mismatching preds / succs lists!");
186 N->Succs.erase(Succ);
191 assert(
N->NumSuccs > 0 &&
"NumSuccs will underflow!");
195 if (!
N->isScheduled) {
207 assert(
N->NumSuccsLeft > 0 &&
"NumSuccsLeft will underflow!");
211 if (
P.getLatency() != 0) {
218 if (!isDepthCurrent)
return;
220 WorkList.push_back(
this);
223 SU->isDepthCurrent =
false;
226 if (SuccSU->isDepthCurrent)
227 WorkList.push_back(SuccSU);
229 }
while (!WorkList.empty());
233 if (!isHeightCurrent)
return;
235 WorkList.push_back(
this);
238 SU->isHeightCurrent =
false;
241 if (PredSU->isHeightCurrent)
242 WorkList.push_back(PredSU);
244 }
while (!WorkList.empty());
252 isDepthCurrent =
true;
260 isHeightCurrent =
true;
264 void SUnit::ComputeDepth() {
266 WorkList.push_back(
this);
268 SUnit *Cur = WorkList.back();
271 unsigned MaxPredDepth = 0;
274 if (PredSU->isDepthCurrent)
275 MaxPredDepth =
std::max(MaxPredDepth,
279 WorkList.push_back(PredSU);
285 if (MaxPredDepth != Cur->Depth) {
287 Cur->Depth = MaxPredDepth;
289 Cur->isDepthCurrent =
true;
291 }
while (!WorkList.empty());
295 void SUnit::ComputeHeight() {
297 WorkList.push_back(
this);
299 SUnit *Cur = WorkList.back();
302 unsigned MaxSuccHeight = 0;
305 if (SuccSU->isHeightCurrent)
306 MaxSuccHeight =
std::max(MaxSuccHeight,
310 WorkList.push_back(SuccSU);
316 if (MaxSuccHeight != Cur->Height) {
318 Cur->Height = MaxSuccHeight;
320 Cur->isHeightCurrent =
true;
322 }
while (!WorkList.empty());
330 unsigned MaxDepth = BestI->getSUnit()->getDepth();
336 if (BestI !=
Preds.begin())
340 #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
366 if (SU.
Preds.size() > 0) {
367 dbgs() <<
" Predecessors:\n";
376 if (SU.
Succs.size() > 0) {
377 dbgs() <<
" Successors:\n";
391 bool AnyNotSched =
false;
392 unsigned DeadNodes = 0;
400 dbgs() <<
"*** Scheduling failed! ***\n";
402 dbgs() <<
"has not been scheduled!\n";
409 dbgs() <<
"*** Scheduling failed! ***\n";
411 dbgs() <<
"has an unexpected "
412 << (isBottomUp ?
"Height" :
"Depth") <<
" value!\n";
418 dbgs() <<
"*** Scheduling failed! ***\n";
420 dbgs() <<
"has successors left!\n";
426 dbgs() <<
"*** Scheduling failed! ***\n";
428 dbgs() <<
"has predecessors left!\n";
434 return SUnits.size() - DeadNodes;
470 unsigned DAGSize = SUnits.size();
471 std::vector<SUnit*> WorkList;
474 Index2Node.resize(DAGSize);
475 Node2Index.resize(DAGSize);
479 WorkList.push_back(ExitSU);
480 for (
SUnit &SU : SUnits) {
481 int NodeNum = SU.NodeNum;
482 unsigned Degree = SU.Succs.size();
484 Node2Index[NodeNum] = Degree;
488 assert(SU.Succs.empty() &&
"SUnit should have no successors");
490 WorkList.push_back(&SU);
495 while (!WorkList.empty()) {
496 SUnit *SU = WorkList.back();
505 WorkList.push_back(SU);
514 for (
SUnit &SU : SUnits) {
515 for (
const SDep &
PD : SU.Preds) {
516 assert(Node2Index[SU.NodeNum] > Node2Index[
PD.getSUnit()->NodeNum] &&
517 "Wrong topological sorting");
523 void ScheduleDAGTopologicalSort::FixOrder() {
531 for (
auto &U : Updates)
540 Dirty = Dirty || Updates.size() > 10;
545 Updates.emplace_back(
Y,
X);
549 int UpperBound, LowerBound;
550 LowerBound = Node2Index[
Y->NodeNum];
551 UpperBound = Node2Index[
X->NodeNum];
552 bool HasLoop =
false;
554 if (LowerBound < UpperBound) {
557 DFS(
Y, UpperBound, HasLoop);
558 assert(!HasLoop &&
"Inserted edge creates a loop!");
560 Shift(Visited, LowerBound, UpperBound);
570 void ScheduleDAGTopologicalSort::DFS(
const SUnit *SU,
int UpperBound,
572 std::vector<const SUnit*> WorkList;
573 WorkList.
reserve(SUnits.size());
575 WorkList.push_back(SU);
577 SU = WorkList.back();
583 if (
s >= Node2Index.size())
585 if (Node2Index[
s] == UpperBound) {
590 if (!Visited.
test(
s) && Node2Index[
s] < UpperBound) {
591 WorkList.push_back(SuccDep.
getSUnit());
594 }
while (!WorkList.empty());
598 const SUnit &TargetSU,
600 std::vector<const SUnit*> WorkList;
601 int LowerBound = Node2Index[StartSU.
NodeNum];
602 int UpperBound = Node2Index[TargetSU.
NodeNum];
605 std::vector<int> Nodes;
607 if (LowerBound > UpperBound) {
612 WorkList.reserve(SUnits.size());
619 const SUnit *SU = WorkList.back();
622 const SUnit *Succ = SD.getSUnit();
627 if (Node2Index[
s] == UpperBound) {
632 if (!Visited.
test(
s) && Node2Index[
s] < UpperBound) {
637 }
while (!WorkList.empty());
645 VisitedBack.
resize(SUnits.size());
651 WorkList.push_back(&TargetSU);
653 const SUnit *SU = WorkList.back();
656 const SUnit *Pred = SD.getSUnit();
661 if (Node2Index[
s] == LowerBound) {
665 if (!VisitedBack.
test(
s) && Visited.
test(
s)) {
671 }
while (!WorkList.empty());
673 assert(Found &&
"Error in SUnit Graph!");
678 void ScheduleDAGTopologicalSort::Shift(
BitVector& Visited,
int LowerBound,
684 for (
i = LowerBound;
i <= UpperBound; ++
i) {
686 int w = Index2Node[
i];
687 if (Visited.
test(w)) {
697 for (
unsigned LI : L) {
708 for (
const SDep &PredDep : TargetSU->
Preds)
716 assert(SU->
NodeNum == Index2Node.size() &&
"Node cannot be added at the end");
717 assert(SU->
NumPreds == 0 &&
"Can only add SU's with no predecessors");
718 Node2Index.push_back(Index2Node.size());
719 Index2Node.push_back(SU->
NodeNum);
720 Visited.
resize(Node2Index.size());
724 const SUnit *TargetSU) {
728 int UpperBound, LowerBound;
729 LowerBound = Node2Index[TargetSU->
NodeNum];
730 UpperBound = Node2Index[SU->
NodeNum];
731 bool HasLoop =
false;
733 if (LowerBound < UpperBound) {
736 DFS(TargetSU, UpperBound, HasLoop);
741 void ScheduleDAGTopologicalSort::Allocate(
int n,
int index) {
748 : SUnits(sunits), ExitSU(exitsu) {}
void RemovePred(SUnit *M, SUnit *N)
Updates the topological ordering to accommodate an edge to be removed from the specified node N fr...
void dumpAttributes() const
#define LLVM_DUMP_METHOD
Mark debug helper function definitions like dump() that should not be stripped from debug builds.
This is an optimization pass for GlobalISel generic memory operations.
bool WillCreateCycle(SUnit *TargetSU, SUnit *SU)
Returns true if addPred(TargetSU, SU) creates a cycle.
@ MustAliasMem
Nonvolatile load/Store instructions that must alias.
@ Artificial
Arbitrary strong DAG edge (no real dependence).
This currently compiles esp xmm0 movsd esp eax eax esp ret We should use not the dag combiner This is because dagcombine2 needs to be able to see through the X86ISD::Wrapper which DAGCombine can t really do The code for turning x load into a single vector load is target independent and should be moved to the dag combiner The code for turning x load into a vector load can only handle a direct load from a global or a direct load from the stack It should be generalized to handle any load from P
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
bool IsReachable(const SUnit *SU, const SUnit *TargetSU)
Checks if SU is reachable from TargetSU.
@ Anti
A register anti-dependence (aka WAR).
Represents one node in the SelectionDAG.
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
void resize(unsigned N, bool t=false)
resize - Grow or shrink the bitvector.
auto reverse(ContainerTy &&C, std::enable_if_t< has_rbegin< ContainerTy >::value > *=nullptr)
SmallVector< SDep, 4 > Succs
All sunit successors.
unsigned getDepth() const
Returns the depth of this node, which is the length of the maximum path up to any node which has no p...
LLVM_NODISCARD T pop_back_val()
unsigned const TargetRegisterInfo * TRI
void AddPredQueued(SUnit *Y, SUnit *X)
Queues an update to the topological ordering to accommodate an edge to be added from SUnit X to SUnit...
ScheduleDAG(MachineFunction &mf)
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
bool isBoundaryNode() const
Boundary nodes are placeholders for the boundary of the scheduling region.
@ Weak
Arbitrary weak DAG edge.
void removePred(const SDep &D)
Removes the specified edge as a pred of the current node if it exists.
virtual ~ScheduleHazardRecognizer()
void setDepthDirty()
Sets a flag in this node to indicate that its stored Depth value will require recomputation the next ...
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
void setHeightToAtLeast(unsigned NewHeight)
If NewHeight is greater than this node's height value, set it to be the new height value.
unsigned short Latency
Node latency.
void setDepthToAtLeast(unsigned NewDepth)
If NewDepth is greater than this node's depth value, sets it to be the new depth value.
unsigned NodeNum
Entry # of node in the node vector.
static GCMetadataPrinterRegistry::Add< OcamlGCMetadataPrinter > Y("ocaml", "ocaml 3.10-compatible collector")
const HexagonInstrInfo * TII
Describe properties that are true of each instruction in the target description file.
void AddPred(SUnit *Y, SUnit *X)
Updates the topological ordering to accommodate an edge to be added from SUnit X to SUnit Y.
STATISTIC(NumFunctions, "Total number of functions")
@ Output
A register output-dependence (aka WAW).
@ Data
Regular data dependence (aka true-dependence).
static GCMetadataPrinterRegistry::Add< ErlangGCPrinter > X("erlang", "erlang-compatible garbage collector")
unsigned VerifyScheduledDAG(bool isBottomUp)
Verifies that all SUnits were scheduled and that their state is consistent.
@ Order
Any other ordering dependency.
unsigned getHeight() const
Returns the height of this node, which is the length of the maximum path down to any node which has n...
ScheduleDAGTopologicalSort(std::vector< SUnit > &SUnits, SUnit *ExitSU)
static cl::opt< bool > StressSchedOpt("stress-sched", cl::Hidden, cl::init(false), cl::desc("Stress test instruction scheduling"))
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")
unsigned short NumRegDefsLeft
auto find(R &&Range, const T &Val)
Provide wrappers to std::find which take ranges instead of having to pass begin/end explicitly.
multiplies can be turned into SHL s
unsigned getReg() const
Returns the register associated with this edge.
bool isScheduled
True once scheduled.
initializer< Ty > init(const Ty &Val)
@ MayAliasMem
Nonvolatile load/Store instructions that may alias.
void biasCriticalPath()
Orders this node's predecessor edges such that the critical path edge occurs first.
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
void dumpNodeAll(const SUnit &SU) const
virtual void dumpNode(const SUnit &SU) const =0
const TargetRegisterInfo * TRI
Target processor register info.
@ Barrier
An unknown scheduling barrier.
SUnit EntrySU
Special node for the region entry.
bool isAssignedRegDep() const
Tests if this is a Data dependence that is associated with a register.
unsigned const MachineRegisterInfo * MRI
static const unsigned MaxDepth
std::vector< SUnit > SUnits
The scheduling units.
bool test(unsigned Idx) const
void setHeightDirty()
Sets a flag in this node to indicate that its stored Height value will require recomputation the next...
void setLatency(unsigned Lat)
Sets the latency for this edge.
const TargetInstrInfo * TII
Target instruction information.
void InitDAGTopologicalSorting()
Creates the initial topological ordering from the DAG to be scheduled.
bool addPred(const SDep &D, bool Required=true)
Adds the specified edge as a pred of the current node if not already.
Kind getKind() const
Returns an enum value representing the kind of the dependence.
typename SuperClass::iterator iterator
void dumpNodeName(const SUnit &SU) const
Align max(MaybeAlign Lhs, Align Rhs)
http eax xorl edx cl sete al setne dl sall eax sall edx But that requires good bit subreg support this might be better It s an extra shift
@ Cluster
Weak DAG edge linking a chain of clustered instrs.
std::vector< int > GetSubGraph(const SUnit &StartSU, const SUnit &TargetSU, bool &Success)
Returns an array of SUs that are both in the successor subtree of StartSU and in the predecessor subt...
const char LLVMTargetMachineRef TM
SmallVector< SDep, 4 > Preds
All sunit predecessors.
Scheduling unit. This is a node in the scheduling DAG.
const MCInstrDesc & get(unsigned Opcode) const
Return the machine instruction descriptor that corresponds to the specified instruction opcode.
SmallVectorImpl< SDep >::iterator pred_iterator
void dump(const TargetRegisterInfo *TRI=nullptr) const
The same transformation can work with an even modulo with the addition of a and shrink the compare RHS by the same amount Unless the target supports that transformation probably isn t worthwhile The transformation can also easily be made to work with non zero equality for n
Printable printReg(Register Reg, const TargetRegisterInfo *TRI=nullptr, unsigned SubIdx=0, const MachineRegisterInfo *MRI=nullptr)
Prints virtual and physical registers with or without a TRI instance.
void reserve(size_type N)
void clearDAG()
Clears the DAG state (between regions).
SUnit ExitSU
Special node for the region exit.
unsigned getLatency() const
Returns the latency value for this edge, which roughly means the minimum number of cycles that must e...
void AddSUnitWithoutPredecessors(const SUnit *SU)
Add a SUnit without predecessors to the end of the topological order.