10b57cec5SDimitry Andric //===- ResourcePriorityQueue.cpp - A DFA-oriented priority queue -*- C++ -*-==//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric //
90b57cec5SDimitry Andric // This file implements the ResourcePriorityQueue class, which is a
100b57cec5SDimitry Andric // SchedulingPriorityQueue that prioritizes instructions using DFA state to
110b57cec5SDimitry Andric // reduce the length of the critical path through the basic block
120b57cec5SDimitry Andric // on VLIW platforms.
130b57cec5SDimitry Andric // The scheduler is basically a top-down adaptable list scheduler with DFA
140b57cec5SDimitry Andric // resource tracking added to the cost function.
150b57cec5SDimitry Andric // DFA is queried as a state machine to model "packets/bundles" during
160b57cec5SDimitry Andric // schedule. Currently packets/bundles are discarded at the end of
170b57cec5SDimitry Andric // scheduling, affecting only order of instructions.
180b57cec5SDimitry Andric //
190b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
200b57cec5SDimitry Andric
210b57cec5SDimitry Andric #include "llvm/CodeGen/ResourcePriorityQueue.h"
225ffd83dbSDimitry Andric #include "llvm/CodeGen/DFAPacketizer.h"
235ffd83dbSDimitry Andric #include "llvm/CodeGen/SelectionDAGISel.h"
240b57cec5SDimitry Andric #include "llvm/CodeGen/SelectionDAGNodes.h"
255ffd83dbSDimitry Andric #include "llvm/CodeGen/TargetInstrInfo.h"
260b57cec5SDimitry Andric #include "llvm/CodeGen/TargetLowering.h"
275ffd83dbSDimitry Andric #include "llvm/CodeGen/TargetRegisterInfo.h"
280b57cec5SDimitry Andric #include "llvm/CodeGen/TargetSubtargetInfo.h"
290b57cec5SDimitry Andric #include "llvm/Support/CommandLine.h"
300b57cec5SDimitry Andric
310b57cec5SDimitry Andric using namespace llvm;
320b57cec5SDimitry Andric
330b57cec5SDimitry Andric #define DEBUG_TYPE "scheduler"
340b57cec5SDimitry Andric
35*81ad6265SDimitry Andric static cl::opt<bool>
36*81ad6265SDimitry Andric DisableDFASched("disable-dfa-sched", cl::Hidden,
370b57cec5SDimitry Andric cl::desc("Disable use of DFA during scheduling"));
380b57cec5SDimitry Andric
390b57cec5SDimitry Andric static cl::opt<int> RegPressureThreshold(
40*81ad6265SDimitry Andric "dfa-sched-reg-pressure-threshold", cl::Hidden, cl::init(5),
410b57cec5SDimitry Andric cl::desc("Track reg pressure and switch priority to in-depth"));
420b57cec5SDimitry Andric
ResourcePriorityQueue(SelectionDAGISel * IS)430b57cec5SDimitry Andric ResourcePriorityQueue::ResourcePriorityQueue(SelectionDAGISel *IS)
440b57cec5SDimitry Andric : Picker(this), InstrItins(IS->MF->getSubtarget().getInstrItineraryData()) {
450b57cec5SDimitry Andric const TargetSubtargetInfo &STI = IS->MF->getSubtarget();
460b57cec5SDimitry Andric TRI = STI.getRegisterInfo();
470b57cec5SDimitry Andric TLI = IS->TLI;
480b57cec5SDimitry Andric TII = STI.getInstrInfo();
490b57cec5SDimitry Andric ResourcesModel.reset(TII->CreateTargetScheduleState(STI));
500b57cec5SDimitry Andric // This hard requirement could be relaxed, but for now
510b57cec5SDimitry Andric // do not let it proceed.
520b57cec5SDimitry Andric assert(ResourcesModel && "Unimplemented CreateTargetScheduleState.");
530b57cec5SDimitry Andric
540b57cec5SDimitry Andric unsigned NumRC = TRI->getNumRegClasses();
550b57cec5SDimitry Andric RegLimit.resize(NumRC);
560b57cec5SDimitry Andric RegPressure.resize(NumRC);
570b57cec5SDimitry Andric std::fill(RegLimit.begin(), RegLimit.end(), 0);
580b57cec5SDimitry Andric std::fill(RegPressure.begin(), RegPressure.end(), 0);
590b57cec5SDimitry Andric for (const TargetRegisterClass *RC : TRI->regclasses())
600b57cec5SDimitry Andric RegLimit[RC->getID()] = TRI->getRegPressureLimit(RC, *IS->MF);
610b57cec5SDimitry Andric
620b57cec5SDimitry Andric ParallelLiveRanges = 0;
630b57cec5SDimitry Andric HorizontalVerticalBalance = 0;
640b57cec5SDimitry Andric }
650b57cec5SDimitry Andric
660b57cec5SDimitry Andric unsigned
numberRCValPredInSU(SUnit * SU,unsigned RCId)670b57cec5SDimitry Andric ResourcePriorityQueue::numberRCValPredInSU(SUnit *SU, unsigned RCId) {
680b57cec5SDimitry Andric unsigned NumberDeps = 0;
690b57cec5SDimitry Andric for (SDep &Pred : SU->Preds) {
700b57cec5SDimitry Andric if (Pred.isCtrl())
710b57cec5SDimitry Andric continue;
720b57cec5SDimitry Andric
730b57cec5SDimitry Andric SUnit *PredSU = Pred.getSUnit();
740b57cec5SDimitry Andric const SDNode *ScegN = PredSU->getNode();
750b57cec5SDimitry Andric
760b57cec5SDimitry Andric if (!ScegN)
770b57cec5SDimitry Andric continue;
780b57cec5SDimitry Andric
790b57cec5SDimitry Andric // If value is passed to CopyToReg, it is probably
800b57cec5SDimitry Andric // live outside BB.
810b57cec5SDimitry Andric switch (ScegN->getOpcode()) {
820b57cec5SDimitry Andric default: break;
830b57cec5SDimitry Andric case ISD::TokenFactor: break;
840b57cec5SDimitry Andric case ISD::CopyFromReg: NumberDeps++; break;
850b57cec5SDimitry Andric case ISD::CopyToReg: break;
860b57cec5SDimitry Andric case ISD::INLINEASM: break;
870b57cec5SDimitry Andric case ISD::INLINEASM_BR: break;
880b57cec5SDimitry Andric }
890b57cec5SDimitry Andric if (!ScegN->isMachineOpcode())
900b57cec5SDimitry Andric continue;
910b57cec5SDimitry Andric
920b57cec5SDimitry Andric for (unsigned i = 0, e = ScegN->getNumValues(); i != e; ++i) {
930b57cec5SDimitry Andric MVT VT = ScegN->getSimpleValueType(i);
940b57cec5SDimitry Andric if (TLI->isTypeLegal(VT)
950b57cec5SDimitry Andric && (TLI->getRegClassFor(VT)->getID() == RCId)) {
960b57cec5SDimitry Andric NumberDeps++;
970b57cec5SDimitry Andric break;
980b57cec5SDimitry Andric }
990b57cec5SDimitry Andric }
1000b57cec5SDimitry Andric }
1010b57cec5SDimitry Andric return NumberDeps;
1020b57cec5SDimitry Andric }
1030b57cec5SDimitry Andric
numberRCValSuccInSU(SUnit * SU,unsigned RCId)1040b57cec5SDimitry Andric unsigned ResourcePriorityQueue::numberRCValSuccInSU(SUnit *SU,
1050b57cec5SDimitry Andric unsigned RCId) {
1060b57cec5SDimitry Andric unsigned NumberDeps = 0;
1070b57cec5SDimitry Andric for (const SDep &Succ : SU->Succs) {
1080b57cec5SDimitry Andric if (Succ.isCtrl())
1090b57cec5SDimitry Andric continue;
1100b57cec5SDimitry Andric
1110b57cec5SDimitry Andric SUnit *SuccSU = Succ.getSUnit();
1120b57cec5SDimitry Andric const SDNode *ScegN = SuccSU->getNode();
1130b57cec5SDimitry Andric if (!ScegN)
1140b57cec5SDimitry Andric continue;
1150b57cec5SDimitry Andric
1160b57cec5SDimitry Andric // If value is passed to CopyToReg, it is probably
1170b57cec5SDimitry Andric // live outside BB.
1180b57cec5SDimitry Andric switch (ScegN->getOpcode()) {
1190b57cec5SDimitry Andric default: break;
1200b57cec5SDimitry Andric case ISD::TokenFactor: break;
1210b57cec5SDimitry Andric case ISD::CopyFromReg: break;
1220b57cec5SDimitry Andric case ISD::CopyToReg: NumberDeps++; break;
1230b57cec5SDimitry Andric case ISD::INLINEASM: break;
1240b57cec5SDimitry Andric case ISD::INLINEASM_BR: break;
1250b57cec5SDimitry Andric }
1260b57cec5SDimitry Andric if (!ScegN->isMachineOpcode())
1270b57cec5SDimitry Andric continue;
1280b57cec5SDimitry Andric
1290b57cec5SDimitry Andric for (unsigned i = 0, e = ScegN->getNumOperands(); i != e; ++i) {
1300b57cec5SDimitry Andric const SDValue &Op = ScegN->getOperand(i);
1310b57cec5SDimitry Andric MVT VT = Op.getNode()->getSimpleValueType(Op.getResNo());
1320b57cec5SDimitry Andric if (TLI->isTypeLegal(VT)
1330b57cec5SDimitry Andric && (TLI->getRegClassFor(VT)->getID() == RCId)) {
1340b57cec5SDimitry Andric NumberDeps++;
1350b57cec5SDimitry Andric break;
1360b57cec5SDimitry Andric }
1370b57cec5SDimitry Andric }
1380b57cec5SDimitry Andric }
1390b57cec5SDimitry Andric return NumberDeps;
1400b57cec5SDimitry Andric }
1410b57cec5SDimitry Andric
numberCtrlDepsInSU(SUnit * SU)1420b57cec5SDimitry Andric static unsigned numberCtrlDepsInSU(SUnit *SU) {
1430b57cec5SDimitry Andric unsigned NumberDeps = 0;
1440b57cec5SDimitry Andric for (const SDep &Succ : SU->Succs)
1450b57cec5SDimitry Andric if (Succ.isCtrl())
1460b57cec5SDimitry Andric NumberDeps++;
1470b57cec5SDimitry Andric
1480b57cec5SDimitry Andric return NumberDeps;
1490b57cec5SDimitry Andric }
1500b57cec5SDimitry Andric
numberCtrlPredInSU(SUnit * SU)1510b57cec5SDimitry Andric static unsigned numberCtrlPredInSU(SUnit *SU) {
1520b57cec5SDimitry Andric unsigned NumberDeps = 0;
1530b57cec5SDimitry Andric for (SDep &Pred : SU->Preds)
1540b57cec5SDimitry Andric if (Pred.isCtrl())
1550b57cec5SDimitry Andric NumberDeps++;
1560b57cec5SDimitry Andric
1570b57cec5SDimitry Andric return NumberDeps;
1580b57cec5SDimitry Andric }
1590b57cec5SDimitry Andric
1600b57cec5SDimitry Andric ///
1610b57cec5SDimitry Andric /// Initialize nodes.
1620b57cec5SDimitry Andric ///
initNodes(std::vector<SUnit> & sunits)1630b57cec5SDimitry Andric void ResourcePriorityQueue::initNodes(std::vector<SUnit> &sunits) {
1640b57cec5SDimitry Andric SUnits = &sunits;
1650b57cec5SDimitry Andric NumNodesSolelyBlocking.resize(SUnits->size(), 0);
1660b57cec5SDimitry Andric
1670eae32dcSDimitry Andric for (SUnit &SU : *SUnits) {
1680eae32dcSDimitry Andric initNumRegDefsLeft(&SU);
1690eae32dcSDimitry Andric SU.NodeQueueId = 0;
1700b57cec5SDimitry Andric }
1710b57cec5SDimitry Andric }
1720b57cec5SDimitry Andric
1730b57cec5SDimitry Andric /// This heuristic is used if DFA scheduling is not desired
1740b57cec5SDimitry Andric /// for some VLIW platform.
operator ()(const SUnit * LHS,const SUnit * RHS) const1750b57cec5SDimitry Andric bool resource_sort::operator()(const SUnit *LHS, const SUnit *RHS) const {
1760b57cec5SDimitry Andric // The isScheduleHigh flag allows nodes with wraparound dependencies that
1770b57cec5SDimitry Andric // cannot easily be modeled as edges with latencies to be scheduled as
1780b57cec5SDimitry Andric // soon as possible in a top-down schedule.
1790b57cec5SDimitry Andric if (LHS->isScheduleHigh && !RHS->isScheduleHigh)
1800b57cec5SDimitry Andric return false;
1810b57cec5SDimitry Andric
1820b57cec5SDimitry Andric if (!LHS->isScheduleHigh && RHS->isScheduleHigh)
1830b57cec5SDimitry Andric return true;
1840b57cec5SDimitry Andric
1850b57cec5SDimitry Andric unsigned LHSNum = LHS->NodeNum;
1860b57cec5SDimitry Andric unsigned RHSNum = RHS->NodeNum;
1870b57cec5SDimitry Andric
1880b57cec5SDimitry Andric // The most important heuristic is scheduling the critical path.
1890b57cec5SDimitry Andric unsigned LHSLatency = PQ->getLatency(LHSNum);
1900b57cec5SDimitry Andric unsigned RHSLatency = PQ->getLatency(RHSNum);
1910b57cec5SDimitry Andric if (LHSLatency < RHSLatency) return true;
1920b57cec5SDimitry Andric if (LHSLatency > RHSLatency) return false;
1930b57cec5SDimitry Andric
1940b57cec5SDimitry Andric // After that, if two nodes have identical latencies, look to see if one will
1950b57cec5SDimitry Andric // unblock more other nodes than the other.
1960b57cec5SDimitry Andric unsigned LHSBlocked = PQ->getNumSolelyBlockNodes(LHSNum);
1970b57cec5SDimitry Andric unsigned RHSBlocked = PQ->getNumSolelyBlockNodes(RHSNum);
1980b57cec5SDimitry Andric if (LHSBlocked < RHSBlocked) return true;
1990b57cec5SDimitry Andric if (LHSBlocked > RHSBlocked) return false;
2000b57cec5SDimitry Andric
2010b57cec5SDimitry Andric // Finally, just to provide a stable ordering, use the node number as a
2020b57cec5SDimitry Andric // deciding factor.
2030b57cec5SDimitry Andric return LHSNum < RHSNum;
2040b57cec5SDimitry Andric }
2050b57cec5SDimitry Andric
2060b57cec5SDimitry Andric
2070b57cec5SDimitry Andric /// getSingleUnscheduledPred - If there is exactly one unscheduled predecessor
2080b57cec5SDimitry Andric /// of SU, return it, otherwise return null.
getSingleUnscheduledPred(SUnit * SU)2090b57cec5SDimitry Andric SUnit *ResourcePriorityQueue::getSingleUnscheduledPred(SUnit *SU) {
2100b57cec5SDimitry Andric SUnit *OnlyAvailablePred = nullptr;
2110b57cec5SDimitry Andric for (const SDep &Pred : SU->Preds) {
2120b57cec5SDimitry Andric SUnit &PredSU = *Pred.getSUnit();
2130b57cec5SDimitry Andric if (!PredSU.isScheduled) {
2140b57cec5SDimitry Andric // We found an available, but not scheduled, predecessor. If it's the
2150b57cec5SDimitry Andric // only one we have found, keep track of it... otherwise give up.
2160b57cec5SDimitry Andric if (OnlyAvailablePred && OnlyAvailablePred != &PredSU)
2170b57cec5SDimitry Andric return nullptr;
2180b57cec5SDimitry Andric OnlyAvailablePred = &PredSU;
2190b57cec5SDimitry Andric }
2200b57cec5SDimitry Andric }
2210b57cec5SDimitry Andric return OnlyAvailablePred;
2220b57cec5SDimitry Andric }
2230b57cec5SDimitry Andric
push(SUnit * SU)2240b57cec5SDimitry Andric void ResourcePriorityQueue::push(SUnit *SU) {
2250b57cec5SDimitry Andric // Look at all of the successors of this node. Count the number of nodes that
2260b57cec5SDimitry Andric // this node is the sole unscheduled node for.
2270b57cec5SDimitry Andric unsigned NumNodesBlocking = 0;
2280b57cec5SDimitry Andric for (const SDep &Succ : SU->Succs)
2290b57cec5SDimitry Andric if (getSingleUnscheduledPred(Succ.getSUnit()) == SU)
2300b57cec5SDimitry Andric ++NumNodesBlocking;
2310b57cec5SDimitry Andric
2320b57cec5SDimitry Andric NumNodesSolelyBlocking[SU->NodeNum] = NumNodesBlocking;
2330b57cec5SDimitry Andric Queue.push_back(SU);
2340b57cec5SDimitry Andric }
2350b57cec5SDimitry Andric
2360b57cec5SDimitry Andric /// Check if scheduling of this SU is possible
2370b57cec5SDimitry Andric /// in the current packet.
isResourceAvailable(SUnit * SU)2380b57cec5SDimitry Andric bool ResourcePriorityQueue::isResourceAvailable(SUnit *SU) {
2390b57cec5SDimitry Andric if (!SU || !SU->getNode())
2400b57cec5SDimitry Andric return false;
2410b57cec5SDimitry Andric
2420b57cec5SDimitry Andric // If this is a compound instruction,
2430b57cec5SDimitry Andric // it is likely to be a call. Do not delay it.
2440b57cec5SDimitry Andric if (SU->getNode()->getGluedNode())
2450b57cec5SDimitry Andric return true;
2460b57cec5SDimitry Andric
2470b57cec5SDimitry Andric // First see if the pipeline could receive this instruction
2480b57cec5SDimitry Andric // in the current cycle.
2490b57cec5SDimitry Andric if (SU->getNode()->isMachineOpcode())
2500b57cec5SDimitry Andric switch (SU->getNode()->getMachineOpcode()) {
2510b57cec5SDimitry Andric default:
2520b57cec5SDimitry Andric if (!ResourcesModel->canReserveResources(&TII->get(
2530b57cec5SDimitry Andric SU->getNode()->getMachineOpcode())))
2540b57cec5SDimitry Andric return false;
2550b57cec5SDimitry Andric break;
2560b57cec5SDimitry Andric case TargetOpcode::EXTRACT_SUBREG:
2570b57cec5SDimitry Andric case TargetOpcode::INSERT_SUBREG:
2580b57cec5SDimitry Andric case TargetOpcode::SUBREG_TO_REG:
2590b57cec5SDimitry Andric case TargetOpcode::REG_SEQUENCE:
2600b57cec5SDimitry Andric case TargetOpcode::IMPLICIT_DEF:
2610b57cec5SDimitry Andric break;
2620b57cec5SDimitry Andric }
2630b57cec5SDimitry Andric
2640b57cec5SDimitry Andric // Now see if there are no other dependencies
2650b57cec5SDimitry Andric // to instructions already in the packet.
2664824e7fdSDimitry Andric for (const SUnit *S : Packet)
2674824e7fdSDimitry Andric for (const SDep &Succ : S->Succs) {
2680b57cec5SDimitry Andric // Since we do not add pseudos to packets, might as well
2690b57cec5SDimitry Andric // ignore order deps.
2700b57cec5SDimitry Andric if (Succ.isCtrl())
2710b57cec5SDimitry Andric continue;
2720b57cec5SDimitry Andric
2730b57cec5SDimitry Andric if (Succ.getSUnit() == SU)
2740b57cec5SDimitry Andric return false;
2750b57cec5SDimitry Andric }
2760b57cec5SDimitry Andric
2770b57cec5SDimitry Andric return true;
2780b57cec5SDimitry Andric }
2790b57cec5SDimitry Andric
2800b57cec5SDimitry Andric /// Keep track of available resources.
reserveResources(SUnit * SU)2810b57cec5SDimitry Andric void ResourcePriorityQueue::reserveResources(SUnit *SU) {
2820b57cec5SDimitry Andric // If this SU does not fit in the packet
2830b57cec5SDimitry Andric // start a new one.
2840b57cec5SDimitry Andric if (!isResourceAvailable(SU) || SU->getNode()->getGluedNode()) {
2850b57cec5SDimitry Andric ResourcesModel->clearResources();
2860b57cec5SDimitry Andric Packet.clear();
2870b57cec5SDimitry Andric }
2880b57cec5SDimitry Andric
2890b57cec5SDimitry Andric if (SU->getNode() && SU->getNode()->isMachineOpcode()) {
2900b57cec5SDimitry Andric switch (SU->getNode()->getMachineOpcode()) {
2910b57cec5SDimitry Andric default:
2920b57cec5SDimitry Andric ResourcesModel->reserveResources(&TII->get(
2930b57cec5SDimitry Andric SU->getNode()->getMachineOpcode()));
2940b57cec5SDimitry Andric break;
2950b57cec5SDimitry Andric case TargetOpcode::EXTRACT_SUBREG:
2960b57cec5SDimitry Andric case TargetOpcode::INSERT_SUBREG:
2970b57cec5SDimitry Andric case TargetOpcode::SUBREG_TO_REG:
2980b57cec5SDimitry Andric case TargetOpcode::REG_SEQUENCE:
2990b57cec5SDimitry Andric case TargetOpcode::IMPLICIT_DEF:
3000b57cec5SDimitry Andric break;
3010b57cec5SDimitry Andric }
3020b57cec5SDimitry Andric Packet.push_back(SU);
3030b57cec5SDimitry Andric }
3040b57cec5SDimitry Andric // Forcefully end packet for PseudoOps.
3050b57cec5SDimitry Andric else {
3060b57cec5SDimitry Andric ResourcesModel->clearResources();
3070b57cec5SDimitry Andric Packet.clear();
3080b57cec5SDimitry Andric }
3090b57cec5SDimitry Andric
3100b57cec5SDimitry Andric // If packet is now full, reset the state so in the next cycle
3110b57cec5SDimitry Andric // we start fresh.
3120b57cec5SDimitry Andric if (Packet.size() >= InstrItins->SchedModel.IssueWidth) {
3130b57cec5SDimitry Andric ResourcesModel->clearResources();
3140b57cec5SDimitry Andric Packet.clear();
3150b57cec5SDimitry Andric }
3160b57cec5SDimitry Andric }
3170b57cec5SDimitry Andric
rawRegPressureDelta(SUnit * SU,unsigned RCId)3180b57cec5SDimitry Andric int ResourcePriorityQueue::rawRegPressureDelta(SUnit *SU, unsigned RCId) {
3190b57cec5SDimitry Andric int RegBalance = 0;
3200b57cec5SDimitry Andric
3210b57cec5SDimitry Andric if (!SU || !SU->getNode() || !SU->getNode()->isMachineOpcode())
3220b57cec5SDimitry Andric return RegBalance;
3230b57cec5SDimitry Andric
3240b57cec5SDimitry Andric // Gen estimate.
3250b57cec5SDimitry Andric for (unsigned i = 0, e = SU->getNode()->getNumValues(); i != e; ++i) {
3260b57cec5SDimitry Andric MVT VT = SU->getNode()->getSimpleValueType(i);
3270b57cec5SDimitry Andric if (TLI->isTypeLegal(VT)
3280b57cec5SDimitry Andric && TLI->getRegClassFor(VT)
3290b57cec5SDimitry Andric && TLI->getRegClassFor(VT)->getID() == RCId)
3300b57cec5SDimitry Andric RegBalance += numberRCValSuccInSU(SU, RCId);
3310b57cec5SDimitry Andric }
3320b57cec5SDimitry Andric // Kill estimate.
3330b57cec5SDimitry Andric for (unsigned i = 0, e = SU->getNode()->getNumOperands(); i != e; ++i) {
3340b57cec5SDimitry Andric const SDValue &Op = SU->getNode()->getOperand(i);
3350b57cec5SDimitry Andric MVT VT = Op.getNode()->getSimpleValueType(Op.getResNo());
3360b57cec5SDimitry Andric if (isa<ConstantSDNode>(Op.getNode()))
3370b57cec5SDimitry Andric continue;
3380b57cec5SDimitry Andric
3390b57cec5SDimitry Andric if (TLI->isTypeLegal(VT) && TLI->getRegClassFor(VT)
3400b57cec5SDimitry Andric && TLI->getRegClassFor(VT)->getID() == RCId)
3410b57cec5SDimitry Andric RegBalance -= numberRCValPredInSU(SU, RCId);
3420b57cec5SDimitry Andric }
3430b57cec5SDimitry Andric return RegBalance;
3440b57cec5SDimitry Andric }
3450b57cec5SDimitry Andric
3460b57cec5SDimitry Andric /// Estimates change in reg pressure from this SU.
3470b57cec5SDimitry Andric /// It is achieved by trivial tracking of defined
3480b57cec5SDimitry Andric /// and used vregs in dependent instructions.
3490b57cec5SDimitry Andric /// The RawPressure flag makes this function to ignore
3500b57cec5SDimitry Andric /// existing reg file sizes, and report raw def/use
3510b57cec5SDimitry Andric /// balance.
regPressureDelta(SUnit * SU,bool RawPressure)3520b57cec5SDimitry Andric int ResourcePriorityQueue::regPressureDelta(SUnit *SU, bool RawPressure) {
3530b57cec5SDimitry Andric int RegBalance = 0;
3540b57cec5SDimitry Andric
3550b57cec5SDimitry Andric if (!SU || !SU->getNode() || !SU->getNode()->isMachineOpcode())
3560b57cec5SDimitry Andric return RegBalance;
3570b57cec5SDimitry Andric
3580b57cec5SDimitry Andric if (RawPressure) {
3590b57cec5SDimitry Andric for (const TargetRegisterClass *RC : TRI->regclasses())
3600b57cec5SDimitry Andric RegBalance += rawRegPressureDelta(SU, RC->getID());
3610b57cec5SDimitry Andric }
3620b57cec5SDimitry Andric else {
3630b57cec5SDimitry Andric for (const TargetRegisterClass *RC : TRI->regclasses()) {
3640b57cec5SDimitry Andric if ((RegPressure[RC->getID()] +
3650b57cec5SDimitry Andric rawRegPressureDelta(SU, RC->getID()) > 0) &&
3660b57cec5SDimitry Andric (RegPressure[RC->getID()] +
3670b57cec5SDimitry Andric rawRegPressureDelta(SU, RC->getID()) >= RegLimit[RC->getID()]))
3680b57cec5SDimitry Andric RegBalance += rawRegPressureDelta(SU, RC->getID());
3690b57cec5SDimitry Andric }
3700b57cec5SDimitry Andric }
3710b57cec5SDimitry Andric
3720b57cec5SDimitry Andric return RegBalance;
3730b57cec5SDimitry Andric }
3740b57cec5SDimitry Andric
3750b57cec5SDimitry Andric // Constants used to denote relative importance of
3760b57cec5SDimitry Andric // heuristic components for cost computation.
3770b57cec5SDimitry Andric static const unsigned PriorityOne = 200;
3780b57cec5SDimitry Andric static const unsigned PriorityTwo = 50;
3790b57cec5SDimitry Andric static const unsigned PriorityThree = 15;
3800b57cec5SDimitry Andric static const unsigned PriorityFour = 5;
3810b57cec5SDimitry Andric static const unsigned ScaleOne = 20;
3820b57cec5SDimitry Andric static const unsigned ScaleTwo = 10;
3830b57cec5SDimitry Andric static const unsigned ScaleThree = 5;
3840b57cec5SDimitry Andric static const unsigned FactorOne = 2;
3850b57cec5SDimitry Andric
3860b57cec5SDimitry Andric /// Returns single number reflecting benefit of scheduling SU
3870b57cec5SDimitry Andric /// in the current cycle.
SUSchedulingCost(SUnit * SU)3880b57cec5SDimitry Andric int ResourcePriorityQueue::SUSchedulingCost(SUnit *SU) {
3890b57cec5SDimitry Andric // Initial trivial priority.
3900b57cec5SDimitry Andric int ResCount = 1;
3910b57cec5SDimitry Andric
3920b57cec5SDimitry Andric // Do not waste time on a node that is already scheduled.
3930b57cec5SDimitry Andric if (SU->isScheduled)
3940b57cec5SDimitry Andric return ResCount;
3950b57cec5SDimitry Andric
3960b57cec5SDimitry Andric // Forced priority is high.
3970b57cec5SDimitry Andric if (SU->isScheduleHigh)
3980b57cec5SDimitry Andric ResCount += PriorityOne;
3990b57cec5SDimitry Andric
4000b57cec5SDimitry Andric // Adaptable scheduling
4010b57cec5SDimitry Andric // A small, but very parallel
4020b57cec5SDimitry Andric // region, where reg pressure is an issue.
4030b57cec5SDimitry Andric if (HorizontalVerticalBalance > RegPressureThreshold) {
4040b57cec5SDimitry Andric // Critical path first
4050b57cec5SDimitry Andric ResCount += (SU->getHeight() * ScaleTwo);
4060b57cec5SDimitry Andric // If resources are available for it, multiply the
4070b57cec5SDimitry Andric // chance of scheduling.
4080b57cec5SDimitry Andric if (isResourceAvailable(SU))
4090b57cec5SDimitry Andric ResCount <<= FactorOne;
4100b57cec5SDimitry Andric
4110b57cec5SDimitry Andric // Consider change to reg pressure from scheduling
4120b57cec5SDimitry Andric // this SU.
4130b57cec5SDimitry Andric ResCount -= (regPressureDelta(SU,true) * ScaleOne);
4140b57cec5SDimitry Andric }
4150b57cec5SDimitry Andric // Default heuristic, greeady and
4160b57cec5SDimitry Andric // critical path driven.
4170b57cec5SDimitry Andric else {
4180b57cec5SDimitry Andric // Critical path first.
4190b57cec5SDimitry Andric ResCount += (SU->getHeight() * ScaleTwo);
4200b57cec5SDimitry Andric // Now see how many instructions is blocked by this SU.
4210b57cec5SDimitry Andric ResCount += (NumNodesSolelyBlocking[SU->NodeNum] * ScaleTwo);
4220b57cec5SDimitry Andric // If resources are available for it, multiply the
4230b57cec5SDimitry Andric // chance of scheduling.
4240b57cec5SDimitry Andric if (isResourceAvailable(SU))
4250b57cec5SDimitry Andric ResCount <<= FactorOne;
4260b57cec5SDimitry Andric
4270b57cec5SDimitry Andric ResCount -= (regPressureDelta(SU) * ScaleTwo);
4280b57cec5SDimitry Andric }
4290b57cec5SDimitry Andric
4300b57cec5SDimitry Andric // These are platform-specific things.
4310b57cec5SDimitry Andric // Will need to go into the back end
4320b57cec5SDimitry Andric // and accessed from here via a hook.
4330b57cec5SDimitry Andric for (SDNode *N = SU->getNode(); N; N = N->getGluedNode()) {
4340b57cec5SDimitry Andric if (N->isMachineOpcode()) {
4350b57cec5SDimitry Andric const MCInstrDesc &TID = TII->get(N->getMachineOpcode());
4360b57cec5SDimitry Andric if (TID.isCall())
4370b57cec5SDimitry Andric ResCount += (PriorityTwo + (ScaleThree*N->getNumValues()));
4380b57cec5SDimitry Andric }
4390b57cec5SDimitry Andric else
4400b57cec5SDimitry Andric switch (N->getOpcode()) {
4410b57cec5SDimitry Andric default: break;
4420b57cec5SDimitry Andric case ISD::TokenFactor:
4430b57cec5SDimitry Andric case ISD::CopyFromReg:
4440b57cec5SDimitry Andric case ISD::CopyToReg:
4450b57cec5SDimitry Andric ResCount += PriorityFour;
4460b57cec5SDimitry Andric break;
4470b57cec5SDimitry Andric
4480b57cec5SDimitry Andric case ISD::INLINEASM:
4490b57cec5SDimitry Andric case ISD::INLINEASM_BR:
4500b57cec5SDimitry Andric ResCount += PriorityThree;
4510b57cec5SDimitry Andric break;
4520b57cec5SDimitry Andric }
4530b57cec5SDimitry Andric }
4540b57cec5SDimitry Andric return ResCount;
4550b57cec5SDimitry Andric }
4560b57cec5SDimitry Andric
4570b57cec5SDimitry Andric
4580b57cec5SDimitry Andric /// Main resource tracking point.
scheduledNode(SUnit * SU)4590b57cec5SDimitry Andric void ResourcePriorityQueue::scheduledNode(SUnit *SU) {
4600b57cec5SDimitry Andric // Use NULL entry as an event marker to reset
4610b57cec5SDimitry Andric // the DFA state.
4620b57cec5SDimitry Andric if (!SU) {
4630b57cec5SDimitry Andric ResourcesModel->clearResources();
4640b57cec5SDimitry Andric Packet.clear();
4650b57cec5SDimitry Andric return;
4660b57cec5SDimitry Andric }
4670b57cec5SDimitry Andric
4680b57cec5SDimitry Andric const SDNode *ScegN = SU->getNode();
4690b57cec5SDimitry Andric // Update reg pressure tracking.
4700b57cec5SDimitry Andric // First update current node.
4710b57cec5SDimitry Andric if (ScegN->isMachineOpcode()) {
4720b57cec5SDimitry Andric // Estimate generated regs.
4730b57cec5SDimitry Andric for (unsigned i = 0, e = ScegN->getNumValues(); i != e; ++i) {
4740b57cec5SDimitry Andric MVT VT = ScegN->getSimpleValueType(i);
4750b57cec5SDimitry Andric
4760b57cec5SDimitry Andric if (TLI->isTypeLegal(VT)) {
4770b57cec5SDimitry Andric const TargetRegisterClass *RC = TLI->getRegClassFor(VT);
4780b57cec5SDimitry Andric if (RC)
4790b57cec5SDimitry Andric RegPressure[RC->getID()] += numberRCValSuccInSU(SU, RC->getID());
4800b57cec5SDimitry Andric }
4810b57cec5SDimitry Andric }
4820b57cec5SDimitry Andric // Estimate killed regs.
4830b57cec5SDimitry Andric for (unsigned i = 0, e = ScegN->getNumOperands(); i != e; ++i) {
4840b57cec5SDimitry Andric const SDValue &Op = ScegN->getOperand(i);
4850b57cec5SDimitry Andric MVT VT = Op.getNode()->getSimpleValueType(Op.getResNo());
4860b57cec5SDimitry Andric
4870b57cec5SDimitry Andric if (TLI->isTypeLegal(VT)) {
4880b57cec5SDimitry Andric const TargetRegisterClass *RC = TLI->getRegClassFor(VT);
4890b57cec5SDimitry Andric if (RC) {
4900b57cec5SDimitry Andric if (RegPressure[RC->getID()] >
4910b57cec5SDimitry Andric (numberRCValPredInSU(SU, RC->getID())))
4920b57cec5SDimitry Andric RegPressure[RC->getID()] -= numberRCValPredInSU(SU, RC->getID());
4930b57cec5SDimitry Andric else RegPressure[RC->getID()] = 0;
4940b57cec5SDimitry Andric }
4950b57cec5SDimitry Andric }
4960b57cec5SDimitry Andric }
4970b57cec5SDimitry Andric for (SDep &Pred : SU->Preds) {
4980b57cec5SDimitry Andric if (Pred.isCtrl() || (Pred.getSUnit()->NumRegDefsLeft == 0))
4990b57cec5SDimitry Andric continue;
5000b57cec5SDimitry Andric --Pred.getSUnit()->NumRegDefsLeft;
5010b57cec5SDimitry Andric }
5020b57cec5SDimitry Andric }
5030b57cec5SDimitry Andric
5040b57cec5SDimitry Andric // Reserve resources for this SU.
5050b57cec5SDimitry Andric reserveResources(SU);
5060b57cec5SDimitry Andric
5070b57cec5SDimitry Andric // Adjust number of parallel live ranges.
5080b57cec5SDimitry Andric // Heuristic is simple - node with no data successors reduces
5090b57cec5SDimitry Andric // number of live ranges. All others, increase it.
5100b57cec5SDimitry Andric unsigned NumberNonControlDeps = 0;
5110b57cec5SDimitry Andric
5120b57cec5SDimitry Andric for (const SDep &Succ : SU->Succs) {
5130b57cec5SDimitry Andric adjustPriorityOfUnscheduledPreds(Succ.getSUnit());
5140b57cec5SDimitry Andric if (!Succ.isCtrl())
5150b57cec5SDimitry Andric NumberNonControlDeps++;
5160b57cec5SDimitry Andric }
5170b57cec5SDimitry Andric
5180b57cec5SDimitry Andric if (!NumberNonControlDeps) {
5190b57cec5SDimitry Andric if (ParallelLiveRanges >= SU->NumPreds)
5200b57cec5SDimitry Andric ParallelLiveRanges -= SU->NumPreds;
5210b57cec5SDimitry Andric else
5220b57cec5SDimitry Andric ParallelLiveRanges = 0;
5230b57cec5SDimitry Andric
5240b57cec5SDimitry Andric }
5250b57cec5SDimitry Andric else
5260b57cec5SDimitry Andric ParallelLiveRanges += SU->NumRegDefsLeft;
5270b57cec5SDimitry Andric
5280b57cec5SDimitry Andric // Track parallel live chains.
5290b57cec5SDimitry Andric HorizontalVerticalBalance += (SU->Succs.size() - numberCtrlDepsInSU(SU));
5300b57cec5SDimitry Andric HorizontalVerticalBalance -= (SU->Preds.size() - numberCtrlPredInSU(SU));
5310b57cec5SDimitry Andric }
5320b57cec5SDimitry Andric
initNumRegDefsLeft(SUnit * SU)5330b57cec5SDimitry Andric void ResourcePriorityQueue::initNumRegDefsLeft(SUnit *SU) {
5340b57cec5SDimitry Andric unsigned NodeNumDefs = 0;
5350b57cec5SDimitry Andric for (SDNode *N = SU->getNode(); N; N = N->getGluedNode())
5360b57cec5SDimitry Andric if (N->isMachineOpcode()) {
5370b57cec5SDimitry Andric const MCInstrDesc &TID = TII->get(N->getMachineOpcode());
5380b57cec5SDimitry Andric // No register need be allocated for this.
5390b57cec5SDimitry Andric if (N->getMachineOpcode() == TargetOpcode::IMPLICIT_DEF) {
5400b57cec5SDimitry Andric NodeNumDefs = 0;
5410b57cec5SDimitry Andric break;
5420b57cec5SDimitry Andric }
5430b57cec5SDimitry Andric NodeNumDefs = std::min(N->getNumValues(), TID.getNumDefs());
5440b57cec5SDimitry Andric }
5450b57cec5SDimitry Andric else
5460b57cec5SDimitry Andric switch(N->getOpcode()) {
5470b57cec5SDimitry Andric default: break;
5480b57cec5SDimitry Andric case ISD::CopyFromReg:
5490b57cec5SDimitry Andric NodeNumDefs++;
5500b57cec5SDimitry Andric break;
5510b57cec5SDimitry Andric case ISD::INLINEASM:
5520b57cec5SDimitry Andric case ISD::INLINEASM_BR:
5530b57cec5SDimitry Andric NodeNumDefs++;
5540b57cec5SDimitry Andric break;
5550b57cec5SDimitry Andric }
5560b57cec5SDimitry Andric
5570b57cec5SDimitry Andric SU->NumRegDefsLeft = NodeNumDefs;
5580b57cec5SDimitry Andric }
5590b57cec5SDimitry Andric
5600b57cec5SDimitry Andric /// adjustPriorityOfUnscheduledPreds - One of the predecessors of SU was just
5610b57cec5SDimitry Andric /// scheduled. If SU is not itself available, then there is at least one
5620b57cec5SDimitry Andric /// predecessor node that has not been scheduled yet. If SU has exactly ONE
5630b57cec5SDimitry Andric /// unscheduled predecessor, we want to increase its priority: it getting
5640b57cec5SDimitry Andric /// scheduled will make this node available, so it is better than some other
5650b57cec5SDimitry Andric /// node of the same priority that will not make a node available.
adjustPriorityOfUnscheduledPreds(SUnit * SU)5660b57cec5SDimitry Andric void ResourcePriorityQueue::adjustPriorityOfUnscheduledPreds(SUnit *SU) {
5670b57cec5SDimitry Andric if (SU->isAvailable) return; // All preds scheduled.
5680b57cec5SDimitry Andric
5690b57cec5SDimitry Andric SUnit *OnlyAvailablePred = getSingleUnscheduledPred(SU);
5700b57cec5SDimitry Andric if (!OnlyAvailablePred || !OnlyAvailablePred->isAvailable)
5710b57cec5SDimitry Andric return;
5720b57cec5SDimitry Andric
5730b57cec5SDimitry Andric // Okay, we found a single predecessor that is available, but not scheduled.
5740b57cec5SDimitry Andric // Since it is available, it must be in the priority queue. First remove it.
5750b57cec5SDimitry Andric remove(OnlyAvailablePred);
5760b57cec5SDimitry Andric
5770b57cec5SDimitry Andric // Reinsert the node into the priority queue, which recomputes its
5780b57cec5SDimitry Andric // NumNodesSolelyBlocking value.
5790b57cec5SDimitry Andric push(OnlyAvailablePred);
5800b57cec5SDimitry Andric }
5810b57cec5SDimitry Andric
5820b57cec5SDimitry Andric
5830b57cec5SDimitry Andric /// Main access point - returns next instructions
5840b57cec5SDimitry Andric /// to be placed in scheduling sequence.
pop()5850b57cec5SDimitry Andric SUnit *ResourcePriorityQueue::pop() {
5860b57cec5SDimitry Andric if (empty())
5870b57cec5SDimitry Andric return nullptr;
5880b57cec5SDimitry Andric
5890b57cec5SDimitry Andric std::vector<SUnit *>::iterator Best = Queue.begin();
5900b57cec5SDimitry Andric if (!DisableDFASched) {
5910b57cec5SDimitry Andric int BestCost = SUSchedulingCost(*Best);
5920b57cec5SDimitry Andric for (auto I = std::next(Queue.begin()), E = Queue.end(); I != E; ++I) {
5930b57cec5SDimitry Andric
5940b57cec5SDimitry Andric if (SUSchedulingCost(*I) > BestCost) {
5950b57cec5SDimitry Andric BestCost = SUSchedulingCost(*I);
5960b57cec5SDimitry Andric Best = I;
5970b57cec5SDimitry Andric }
5980b57cec5SDimitry Andric }
5990b57cec5SDimitry Andric }
6000b57cec5SDimitry Andric // Use default TD scheduling mechanism.
6010b57cec5SDimitry Andric else {
6020b57cec5SDimitry Andric for (auto I = std::next(Queue.begin()), E = Queue.end(); I != E; ++I)
6030b57cec5SDimitry Andric if (Picker(*Best, *I))
6040b57cec5SDimitry Andric Best = I;
6050b57cec5SDimitry Andric }
6060b57cec5SDimitry Andric
6070b57cec5SDimitry Andric SUnit *V = *Best;
6080b57cec5SDimitry Andric if (Best != std::prev(Queue.end()))
6090b57cec5SDimitry Andric std::swap(*Best, Queue.back());
6100b57cec5SDimitry Andric
6110b57cec5SDimitry Andric Queue.pop_back();
6120b57cec5SDimitry Andric
6130b57cec5SDimitry Andric return V;
6140b57cec5SDimitry Andric }
6150b57cec5SDimitry Andric
6160b57cec5SDimitry Andric
remove(SUnit * SU)6170b57cec5SDimitry Andric void ResourcePriorityQueue::remove(SUnit *SU) {
6180b57cec5SDimitry Andric assert(!Queue.empty() && "Queue is empty!");
6190b57cec5SDimitry Andric std::vector<SUnit *>::iterator I = find(Queue, SU);
6200b57cec5SDimitry Andric if (I != std::prev(Queue.end()))
6210b57cec5SDimitry Andric std::swap(*I, Queue.back());
6220b57cec5SDimitry Andric
6230b57cec5SDimitry Andric Queue.pop_back();
6240b57cec5SDimitry Andric }
625