ScheduleDAGSDNodes.cpp revision 87896d9368e08d93493427ce7bf8272d1e5cca35
1343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman//===--- ScheduleDAGSDNodes.cpp - Implement the ScheduleDAGSDNodes class --===// 2343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman// 3343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman// The LLVM Compiler Infrastructure 4343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman// 5343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman// This file is distributed under the University of Illinois Open Source 6343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman// License. See LICENSE.TXT for details. 7343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman// 8343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman//===----------------------------------------------------------------------===// 9343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman// 10343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman// This implements the ScheduleDAG class, which is a base class used by 11343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman// scheduling implementation classes. 12343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman// 13343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman//===----------------------------------------------------------------------===// 14343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman 15343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman#define DEBUG_TYPE "pre-RA-sched" 16a8efe28a44996978faa42a387f1a6087a7b942c7Evan Cheng#include "SDNodeDbgValue.h" 1784fbac580941548a6ab1121ed3b0ffdc4e2bc080Dan Gohman#include "ScheduleDAGSDNodes.h" 18bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman#include "InstrEmitter.h" 19343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman#include "llvm/CodeGen/SelectionDAG.h" 20343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman#include "llvm/Target/TargetMachine.h" 21343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman#include "llvm/Target/TargetInstrInfo.h" 221cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng#include "llvm/Target/TargetLowering.h" 23343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman#include "llvm/Target/TargetRegisterInfo.h" 24710461688bba935f0ad5c75da7fec2ad0f225c00David Goodwin#include "llvm/Target/TargetSubtarget.h" 25c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng#include "llvm/ADT/DenseMap.h" 26c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng#include "llvm/ADT/SmallPtrSet.h" 27bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng#include "llvm/ADT/SmallSet.h" 28c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng#include "llvm/ADT/SmallVector.h" 29c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng#include "llvm/ADT/Statistic.h" 30e0ef509aeb47b396cf1bdc170ca4f468f799719fAndrew Trick#include "llvm/Support/CommandLine.h" 31343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman#include "llvm/Support/Debug.h" 32343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman#include "llvm/Support/raw_ostream.h" 33343f0c046702831a4a6aec951b6a297a23241a55Dan Gohmanusing namespace llvm; 34343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman 35c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan ChengSTATISTIC(LoadsClustered, "Number of loads clustered together"); 36c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng 37e0ef509aeb47b396cf1bdc170ca4f468f799719fAndrew Trick// This allows latency based scheduler to notice high latency instructions 38e0ef509aeb47b396cf1bdc170ca4f468f799719fAndrew Trick// without a target itinerary. The choise if number here has more to do with 39e0ef509aeb47b396cf1bdc170ca4f468f799719fAndrew Trick// balancing scheduler heursitics than with the actual machine latency. 40e0ef509aeb47b396cf1bdc170ca4f468f799719fAndrew Trickstatic cl::opt<int> HighLatencyCycles( 41e0ef509aeb47b396cf1bdc170ca4f468f799719fAndrew Trick "sched-high-latency-cycles", cl::Hidden, cl::init(10), 42e0ef509aeb47b396cf1bdc170ca4f468f799719fAndrew Trick cl::desc("Roughly estimate the number of cycles that 'long latency'" 43e0ef509aeb47b396cf1bdc170ca4f468f799719fAndrew Trick "instructions take for targets with no itinerary")); 44e0ef509aeb47b396cf1bdc170ca4f468f799719fAndrew Trick 4579ce276083ced01256a0eb7d80731e4948ca6e87Dan GohmanScheduleDAGSDNodes::ScheduleDAGSDNodes(MachineFunction &mf) 463ef1c8759a20167457eb7fd82ebcaffe7ccaa1d1Evan Cheng : ScheduleDAG(mf), 473ef1c8759a20167457eb7fd82ebcaffe7ccaa1d1Evan Cheng InstrItins(mf.getTarget().getInstrItineraryData()) {} 48343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman 4947ac0f0c7c39289f5970688154e385be22b7f293Dan Gohman/// Run - perform scheduling. 5047ac0f0c7c39289f5970688154e385be22b7f293Dan Gohman/// 5147ac0f0c7c39289f5970688154e385be22b7f293Dan Gohmanvoid ScheduleDAGSDNodes::Run(SelectionDAG *dag, MachineBasicBlock *bb, 5247ac0f0c7c39289f5970688154e385be22b7f293Dan Gohman MachineBasicBlock::iterator insertPos) { 5347ac0f0c7c39289f5970688154e385be22b7f293Dan Gohman DAG = dag; 5447ac0f0c7c39289f5970688154e385be22b7f293Dan Gohman ScheduleDAG::Run(bb, insertPos); 5547ac0f0c7c39289f5970688154e385be22b7f293Dan Gohman} 5647ac0f0c7c39289f5970688154e385be22b7f293Dan Gohman 571cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng/// NewSUnit - Creates a new SUnit and return a ptr to it. 581cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng/// 591cc3984148be113c6e5e470f23c9ddbd37679c5fEvan ChengSUnit *ScheduleDAGSDNodes::NewSUnit(SDNode *N) { 601cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng#ifndef NDEBUG 611cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng const SUnit *Addr = 0; 621cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng if (!SUnits.empty()) 631cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng Addr = &SUnits[0]; 641cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng#endif 651cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng SUnits.push_back(SUnit(N, (unsigned)SUnits.size())); 661cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng assert((Addr == 0 || Addr == &SUnits[0]) && 671cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng "SUnits std::vector reallocated on the fly!"); 681cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng SUnits.back().OrigNode = &SUnits.back(); 691cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng SUnit *SU = &SUnits.back(); 701cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng const TargetLowering &TLI = DAG->getTargetLoweringInfo(); 71c120af45671c75fd1297ac6300c03a6a9e1264daEvan Cheng if (!N || 72c120af45671c75fd1297ac6300c03a6a9e1264daEvan Cheng (N->isMachineOpcode() && 73c120af45671c75fd1297ac6300c03a6a9e1264daEvan Cheng N->getMachineOpcode() == TargetOpcode::IMPLICIT_DEF)) 74046fa3f90a31ebfa10df89ae348f478d492709a9Evan Cheng SU->SchedulingPref = Sched::None; 75046fa3f90a31ebfa10df89ae348f478d492709a9Evan Cheng else 76046fa3f90a31ebfa10df89ae348f478d492709a9Evan Cheng SU->SchedulingPref = TLI.getSchedulingPreference(N); 771cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng return SU; 781cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng} 791cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng 80343f0c046702831a4a6aec951b6a297a23241a55Dan GohmanSUnit *ScheduleDAGSDNodes::Clone(SUnit *Old) { 81343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman SUnit *SU = NewSUnit(Old->getNode()); 82343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman SU->OrigNode = Old->OrigNode; 83343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman SU->Latency = Old->Latency; 8454699765064842fd08d1466adc93453660bc2a85Andrew Trick SU->isVRegCycle = Old->isVRegCycle; 858239daf7c83a65a189c352cce3191cdc3bbfe151Evan Cheng SU->isCall = Old->isCall; 86343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman SU->isTwoAddress = Old->isTwoAddress; 87343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman SU->isCommutable = Old->isCommutable; 88343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman SU->hasPhysRegDefs = Old->hasPhysRegDefs; 893974667c1a6d48686e92f85bc4463bb239af7442Dan Gohman SU->hasPhysRegClobbers = Old->hasPhysRegClobbers; 901cc3984148be113c6e5e470f23c9ddbd37679c5fEvan Cheng SU->SchedulingPref = Old->SchedulingPref; 91e57187cbe321a286f6a7f409a7badd1ae4e4642cEvan Cheng Old->isCloned = true; 92343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman return SU; 93343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman} 94343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman 95343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman/// CheckForPhysRegDependency - Check if the dependency between def and use of 96343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman/// a specified operand is a physical register dependency. If so, returns the 97c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng/// register and the cost of copying the register. 98343f0c046702831a4a6aec951b6a297a23241a55Dan Gohmanstatic void CheckForPhysRegDependency(SDNode *Def, SDNode *User, unsigned Op, 99cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick const TargetRegisterInfo *TRI, 100343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman const TargetInstrInfo *TII, 101c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng unsigned &PhysReg, int &Cost) { 102343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman if (Op != 2 || User->getOpcode() != ISD::CopyToReg) 103343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman return; 104343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman 105343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman unsigned Reg = cast<RegisterSDNode>(User->getOperand(1))->getReg(); 106343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman if (TargetRegisterInfo::isVirtualRegister(Reg)) 107343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman return; 108343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman 109343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman unsigned ResNo = User->getOperand(2).getResNo(); 110343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman if (Def->isMachineOpcode()) { 111343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman const TargetInstrDesc &II = TII->get(Def->getMachineOpcode()); 112343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman if (ResNo >= II.getNumDefs() && 113c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng II.ImplicitDefs[ResNo - II.getNumDefs()] == Reg) { 114343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman PhysReg = Reg; 115c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng const TargetRegisterClass *RC = 116d31f972bd33de85071c716f69bf5c6d735f730f2Rafael Espindola TRI->getMinimalPhysRegClass(Reg, Def->getValueType(ResNo)); 117c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng Cost = RC->getCopyCost(); 118c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng } 119343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman } 120343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman} 121343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman 12229d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattnerstatic void AddGlue(SDNode *N, SDValue Glue, bool AddGlue, SelectionDAG *DAG) { 123c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng SmallVector<EVT, 4> VTs; 12429d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner SDNode *GlueDestNode = Glue.getNode(); 125151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling 12629d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner // Don't add glue from a node to itself. 12729d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner if (GlueDestNode == N) return; 12810707f3b442aa5a6cc55b899d630871f06b8ebbcBill Wendling 12929d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner // Don't add glue to something which already has glue. 130f1b4eafbfec976f939ec0ea3e8acf91cef5363e3Chris Lattner if (N->getValueType(N->getNumValues() - 1) == MVT::Glue) return; 13110707f3b442aa5a6cc55b899d630871f06b8ebbcBill Wendling 13210707f3b442aa5a6cc55b899d630871f06b8ebbcBill Wendling for (unsigned I = 0, E = N->getNumValues(); I != E; ++I) 13310707f3b442aa5a6cc55b899d630871f06b8ebbcBill Wendling VTs.push_back(N->getValueType(I)); 134151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling 13529d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner if (AddGlue) 136f1b4eafbfec976f939ec0ea3e8acf91cef5363e3Chris Lattner VTs.push_back(MVT::Glue); 137151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling 138c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng SmallVector<SDValue, 4> Ops; 13910707f3b442aa5a6cc55b899d630871f06b8ebbcBill Wendling for (unsigned I = 0, E = N->getNumOperands(); I != E; ++I) 14010707f3b442aa5a6cc55b899d630871f06b8ebbcBill Wendling Ops.push_back(N->getOperand(I)); 141151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling 14229d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner if (GlueDestNode) 14329d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner Ops.push_back(Glue); 144151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling 145c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng SDVTList VTList = DAG->getVTList(&VTs[0], VTs.size()); 146151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling MachineSDNode::mmo_iterator Begin = 0, End = 0; 147151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling MachineSDNode *MN = dyn_cast<MachineSDNode>(N); 148151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling 149151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling // Store memory references. 150151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling if (MN) { 151151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling Begin = MN->memoperands_begin(); 152151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling End = MN->memoperands_end(); 153151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling } 154151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling 155c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng DAG->MorphNodeTo(N, N->getOpcode(), VTList, &Ops[0], Ops.size()); 156151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling 157151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling // Reset the memory references 158151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling if (MN) 159151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling MN->setMemRefs(Begin, End); 160c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng} 161c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng 16229d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner/// ClusterNeighboringLoads - Force nearby loads together by "gluing" them. 163c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng/// This function finds loads of the same base and different offsets. If the 164f1b4eafbfec976f939ec0ea3e8acf91cef5363e3Chris Lattner/// offsets are not far apart (target specific), it add MVT::Glue inputs and 165c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng/// outputs to ensure they are scheduled together and in order. This 166c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng/// optimization may benefit some targets by improving cache locality. 167302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Chengvoid ScheduleDAGSDNodes::ClusterNeighboringLoads(SDNode *Node) { 168302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng SDNode *Chain = 0; 169302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng unsigned NumOps = Node->getNumOperands(); 170302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng if (Node->getOperand(NumOps-1).getValueType() == MVT::Other) 171302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng Chain = Node->getOperand(NumOps-1).getNode(); 172302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng if (!Chain) 173302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng return; 174302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng 175302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng // Look for other loads of the same chain. Find loads that are loading from 176302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng // the same base pointer and different offsets. 177c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng SmallPtrSet<SDNode*, 16> Visited; 178c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng SmallVector<int64_t, 4> Offsets; 179c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng DenseMap<long long, SDNode*> O2SMap; // Map from offset to SDNode. 180302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng bool Cluster = false; 181302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng SDNode *Base = Node; 182302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng for (SDNode::use_iterator I = Chain->use_begin(), E = Chain->use_end(); 183302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng I != E; ++I) { 184302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng SDNode *User = *I; 185302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng if (User == Node || !Visited.insert(User)) 186c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng continue; 187302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng int64_t Offset1, Offset2; 188302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng if (!TII->areLoadsFromSameBasePtr(Base, User, Offset1, Offset2) || 189302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng Offset1 == Offset2) 190302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng // FIXME: Should be ok if they addresses are identical. But earlier 191302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng // optimizations really should have eliminated one of the loads. 192c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng continue; 193302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng if (O2SMap.insert(std::make_pair(Offset1, Base)).second) 194302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng Offsets.push_back(Offset1); 195302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng O2SMap.insert(std::make_pair(Offset2, User)); 196302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng Offsets.push_back(Offset2); 197b447c4e65b5f6d39db16cb8fc338133965291972Duncan Sands if (Offset2 < Offset1) 198302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng Base = User; 199302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng Cluster = true; 200302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng } 201c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng 202302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng if (!Cluster) 203302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng return; 204c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng 205302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng // Sort them in increasing order. 206302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng std::sort(Offsets.begin(), Offsets.end()); 207c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng 208302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng // Check if the loads are close enough. 209302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng SmallVector<SDNode*, 4> Loads; 210302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng unsigned NumLoads = 0; 211302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng int64_t BaseOff = Offsets[0]; 212302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng SDNode *BaseLoad = O2SMap[BaseOff]; 213302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng Loads.push_back(BaseLoad); 214302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng for (unsigned i = 1, e = Offsets.size(); i != e; ++i) { 215302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng int64_t Offset = Offsets[i]; 216302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng SDNode *Load = O2SMap[Offset]; 217302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng if (!TII->shouldScheduleLoadsNear(BaseLoad, Load, BaseOff, Offset,NumLoads)) 218302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng break; // Stop right here. Ignore loads that are further away. 219302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng Loads.push_back(Load); 220302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng ++NumLoads; 221302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng } 222c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng 223302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng if (NumLoads == 0) 224302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng return; 225c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng 226f1b4eafbfec976f939ec0ea3e8acf91cef5363e3Chris Lattner // Cluster loads by adding MVT::Glue outputs and inputs. This also 227302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng // ensure they are scheduled in order of increasing addresses. 228302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng SDNode *Lead = Loads[0]; 22929d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner AddGlue(Lead, SDValue(0, 0), true, DAG); 23010707f3b442aa5a6cc55b899d630871f06b8ebbcBill Wendling 23129d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner SDValue InGlue = SDValue(Lead, Lead->getNumValues() - 1); 23210707f3b442aa5a6cc55b899d630871f06b8ebbcBill Wendling for (unsigned I = 1, E = Loads.size(); I != E; ++I) { 23329d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner bool OutGlue = I < E - 1; 23410707f3b442aa5a6cc55b899d630871f06b8ebbcBill Wendling SDNode *Load = Loads[I]; 235151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling 23629d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner AddGlue(Load, InGlue, OutGlue, DAG); 237151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling 23829d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner if (OutGlue) 23929d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner InGlue = SDValue(Load, Load->getNumValues() - 1); 240151d26d15dc6fe89329d7cccb0638c324c58f485Bill Wendling 241302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng ++LoadsClustered; 242302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng } 243302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng} 244c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng 245302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng/// ClusterNodes - Cluster certain nodes which should be scheduled together. 246302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng/// 247302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Chengvoid ScheduleDAGSDNodes::ClusterNodes() { 248302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng for (SelectionDAG::allnodes_iterator NI = DAG->allnodes_begin(), 249302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng E = DAG->allnodes_end(); NI != E; ++NI) { 250302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng SDNode *Node = &*NI; 251302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng if (!Node || !Node->isMachineOpcode()) 252c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng continue; 253c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng 254302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng unsigned Opc = Node->getMachineOpcode(); 255302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng const TargetInstrDesc &TID = TII->get(Opc); 256302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng if (TID.mayLoad()) 257302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng // Cluster loads from "near" addresses into combined SUnits. 258302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng ClusterNeighboringLoads(Node); 259c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng } 260c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng} 261c589e03865bb31da70e0037d5c32fdaaa5f79f24Evan Cheng 262343f0c046702831a4a6aec951b6a297a23241a55Dan Gohmanvoid ScheduleDAGSDNodes::BuildSchedUnits() { 263343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman // During scheduling, the NodeId field of SDNode is used to map SDNodes 264343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman // to their associated SUnits by holding SUnits table indices. A value 265343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman // of -1 means the SDNode does not yet have an associated SUnit. 266e1dfc7da8991270db5094aa736fde273bfab6061Dan Gohman unsigned NumNodes = 0; 267343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman for (SelectionDAG::allnodes_iterator NI = DAG->allnodes_begin(), 268e1dfc7da8991270db5094aa736fde273bfab6061Dan Gohman E = DAG->allnodes_end(); NI != E; ++NI) { 269343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman NI->setNodeId(-1); 270e1dfc7da8991270db5094aa736fde273bfab6061Dan Gohman ++NumNodes; 271e1dfc7da8991270db5094aa736fde273bfab6061Dan Gohman } 272343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman 273e1dfc7da8991270db5094aa736fde273bfab6061Dan Gohman // Reserve entries in the vector for each of the SUnits we are creating. This 274e1dfc7da8991270db5094aa736fde273bfab6061Dan Gohman // ensure that reallocation of the vector won't happen, so SUnit*'s won't get 275e1dfc7da8991270db5094aa736fde273bfab6061Dan Gohman // invalidated. 276e1dfc7da8991270db5094aa736fde273bfab6061Dan Gohman // FIXME: Multiply by 2 because we may clone nodes during scheduling. 277e1dfc7da8991270db5094aa736fde273bfab6061Dan Gohman // This is a temporary workaround. 278e1dfc7da8991270db5094aa736fde273bfab6061Dan Gohman SUnits.reserve(NumNodes * 2); 279cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick 280736a6ea3a2a5322db0e09d97651a1acc07502e41Chris Lattner // Add all nodes in depth first order. 281736a6ea3a2a5322db0e09d97651a1acc07502e41Chris Lattner SmallVector<SDNode*, 64> Worklist; 282736a6ea3a2a5322db0e09d97651a1acc07502e41Chris Lattner SmallPtrSet<SDNode*, 64> Visited; 283736a6ea3a2a5322db0e09d97651a1acc07502e41Chris Lattner Worklist.push_back(DAG->getRoot().getNode()); 284736a6ea3a2a5322db0e09d97651a1acc07502e41Chris Lattner Visited.insert(DAG->getRoot().getNode()); 285cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick 286736a6ea3a2a5322db0e09d97651a1acc07502e41Chris Lattner while (!Worklist.empty()) { 287736a6ea3a2a5322db0e09d97651a1acc07502e41Chris Lattner SDNode *NI = Worklist.pop_back_val(); 288cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick 289736a6ea3a2a5322db0e09d97651a1acc07502e41Chris Lattner // Add all operands to the worklist unless they've already been added. 290736a6ea3a2a5322db0e09d97651a1acc07502e41Chris Lattner for (unsigned i = 0, e = NI->getNumOperands(); i != e; ++i) 291736a6ea3a2a5322db0e09d97651a1acc07502e41Chris Lattner if (Visited.insert(NI->getOperand(i).getNode())) 292736a6ea3a2a5322db0e09d97651a1acc07502e41Chris Lattner Worklist.push_back(NI->getOperand(i).getNode()); 293cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick 294343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman if (isPassiveNode(NI)) // Leaf node, e.g. a TargetImmediate. 295343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman continue; 296cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick 297343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman // If this node has already been processed, stop now. 298343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman if (NI->getNodeId() != -1) continue; 299cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick 300343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman SUnit *NodeSUnit = NewSUnit(NI); 301cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick 30229d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner // See if anything is glued to this node, if so, add them to glued 30329d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner // nodes. Nodes can have at most one glue input and one glue output. Glue 30429d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner // is required to be the last operand and result of a node. 305cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick 30629d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner // Scan up to find glued preds. 307343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman SDNode *N = NI; 308db95fa131a229652f925794ca7a5b84e9490050bDan Gohman while (N->getNumOperands() && 309f1b4eafbfec976f939ec0ea3e8acf91cef5363e3Chris Lattner N->getOperand(N->getNumOperands()-1).getValueType() == MVT::Glue) { 310db95fa131a229652f925794ca7a5b84e9490050bDan Gohman N = N->getOperand(N->getNumOperands()-1).getNode(); 311db95fa131a229652f925794ca7a5b84e9490050bDan Gohman assert(N->getNodeId() == -1 && "Node already inserted!"); 312db95fa131a229652f925794ca7a5b84e9490050bDan Gohman N->setNodeId(NodeSUnit->NodeNum); 3138239daf7c83a65a189c352cce3191cdc3bbfe151Evan Cheng if (N->isMachineOpcode() && TII->get(N->getMachineOpcode()).isCall()) 3148239daf7c83a65a189c352cce3191cdc3bbfe151Evan Cheng NodeSUnit->isCall = true; 315343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman } 316cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick 31729d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner // Scan down to find any glued succs. 318343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman N = NI; 319f1b4eafbfec976f939ec0ea3e8acf91cef5363e3Chris Lattner while (N->getValueType(N->getNumValues()-1) == MVT::Glue) { 32029d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner SDValue GlueVal(N, N->getNumValues()-1); 321cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick 32229d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner // There are either zero or one users of the Glue result. 32329d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner bool HasGlueUse = false; 324cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick for (SDNode::use_iterator UI = N->use_begin(), E = N->use_end(); 325343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman UI != E; ++UI) 32629d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner if (GlueVal.isOperandOf(*UI)) { 32729d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner HasGlueUse = true; 328343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman assert(N->getNodeId() == -1 && "Node already inserted!"); 329343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman N->setNodeId(NodeSUnit->NodeNum); 330343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman N = *UI; 3318239daf7c83a65a189c352cce3191cdc3bbfe151Evan Cheng if (N->isMachineOpcode() && TII->get(N->getMachineOpcode()).isCall()) 3328239daf7c83a65a189c352cce3191cdc3bbfe151Evan Cheng NodeSUnit->isCall = true; 333343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman break; 334343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman } 33529d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner if (!HasGlueUse) break; 336343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman } 337cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick 33829d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner // If there are glue operands involved, N is now the bottom-most node 33929d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner // of the sequence of nodes that are glued together. 340343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman // Update the SUnit. 341343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman NodeSUnit->setNode(N); 342343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman assert(N->getNodeId() == -1 && "Node already inserted!"); 343343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman N->setNodeId(NodeSUnit->NodeNum); 344343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman 34592e946630d5f9bb092853b93501387dd216899b9Andrew Trick // Compute NumRegDefsLeft. This must be done before AddSchedEdges. 34692e946630d5f9bb092853b93501387dd216899b9Andrew Trick InitNumRegDefsLeft(NodeSUnit); 34792e946630d5f9bb092853b93501387dd216899b9Andrew Trick 348787782f4ca0cca2523825131c24a6f78535a3eb8Dan Gohman // Assign the Latency field of NodeSUnit using target-provided information. 349e163168aab987dc3df0845b9e92310f764d8b158Evan Cheng ComputeLatency(NodeSUnit); 350343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman } 351c9a5b9e38b442c2ae6b115213a07df3fcd14708dDan Gohman} 352c9a5b9e38b442c2ae6b115213a07df3fcd14708dDan Gohman 353c9a5b9e38b442c2ae6b115213a07df3fcd14708dDan Gohmanvoid ScheduleDAGSDNodes::AddSchedEdges() { 354710461688bba935f0ad5c75da7fec2ad0f225c00David Goodwin const TargetSubtarget &ST = TM.getSubtarget<TargetSubtarget>(); 355710461688bba935f0ad5c75da7fec2ad0f225c00David Goodwin 356dc4bdcdef1c8dd1a28b82deb08df039e5c0ffc5aDavid Goodwin // Check to see if the scheduler cares about latencies. 357dc4bdcdef1c8dd1a28b82deb08df039e5c0ffc5aDavid Goodwin bool UnitLatencies = ForceUnitLatencies(); 358dc4bdcdef1c8dd1a28b82deb08df039e5c0ffc5aDavid Goodwin 359343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman // Pass 2: add the preds, succs, etc. 360343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman for (unsigned su = 0, e = SUnits.size(); su != e; ++su) { 361343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman SUnit *SU = &SUnits[su]; 362343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman SDNode *MainNode = SU->getNode(); 363cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick 364343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman if (MainNode->isMachineOpcode()) { 365343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman unsigned Opc = MainNode->getMachineOpcode(); 366343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman const TargetInstrDesc &TID = TII->get(Opc); 367343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman for (unsigned i = 0; i != TID.getNumOperands(); ++i) { 368343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman if (TID.getOperandConstraint(i, TOI::TIED_TO) != -1) { 369343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman SU->isTwoAddress = true; 370343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman break; 371343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman } 372343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman } 373343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman if (TID.isCommutable()) 374343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman SU->isCommutable = true; 375343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman } 376cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick 377343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman // Find all predecessors and successors of the group. 37829d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner for (SDNode *N = SU->getNode(); N; N = N->getGluedNode()) { 379343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman if (N->isMachineOpcode() && 3803974667c1a6d48686e92f85bc4463bb239af7442Dan Gohman TII->get(N->getMachineOpcode()).getImplicitDefs()) { 3813974667c1a6d48686e92f85bc4463bb239af7442Dan Gohman SU->hasPhysRegClobbers = true; 382bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman unsigned NumUsed = InstrEmitter::CountResults(N); 3838cccf0ef0ced7f4d75ca574b596036a9b6cd4315Dan Gohman while (NumUsed != 0 && !N->hasAnyUseOfValue(NumUsed - 1)) 3848cccf0ef0ced7f4d75ca574b596036a9b6cd4315Dan Gohman --NumUsed; // Skip over unused values at the end. 3858cccf0ef0ced7f4d75ca574b596036a9b6cd4315Dan Gohman if (NumUsed > TII->get(N->getMachineOpcode()).getNumDefs()) 3863974667c1a6d48686e92f85bc4463bb239af7442Dan Gohman SU->hasPhysRegDefs = true; 3873974667c1a6d48686e92f85bc4463bb239af7442Dan Gohman } 388cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick 389343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) { 390343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman SDNode *OpN = N->getOperand(i).getNode(); 391343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman if (isPassiveNode(OpN)) continue; // Not scheduled. 392343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman SUnit *OpSU = &SUnits[OpN->getNodeId()]; 393343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman assert(OpSU && "Node has no SUnit!"); 394343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman if (OpSU == SU) continue; // In the same group. 395343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman 396e50ed30282bb5b4a9ed952580523f2dda16215acOwen Anderson EVT OpVT = N->getOperand(i).getValueType(); 39729d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner assert(OpVT != MVT::Glue && "Glued nodes should be in same sunit!"); 398825b72b0571821bf2d378749f69d6c4cfb52d2f9Owen Anderson bool isChain = OpVT == MVT::Other; 399343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman 400343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman unsigned PhysReg = 0; 401c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng int Cost = 1; 402343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman // Determine if this is a physical register dependency. 403c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng CheckForPhysRegDependency(OpN, N, i, TRI, TII, PhysReg, Cost); 40454e4c36a7349e94a84773afb56eccd4ca65b49e9Dan Gohman assert((PhysReg == 0 || !isChain) && 40554e4c36a7349e94a84773afb56eccd4ca65b49e9Dan Gohman "Chain dependence via physreg data?"); 406c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng // FIXME: See ScheduleDAGSDNodes::EmitCopyFromReg. For now, scheduler 407c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng // emits a copy from the physical register to a virtual register unless 408c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng // it requires a cross class copy (cost < 0). That means we are only 409c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng // treating "expensive to copy" register dependency as physical register 410c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng // dependency. This may change in the future though. 411c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng if (Cost >= 0) 412c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng PhysReg = 0; 413710461688bba935f0ad5c75da7fec2ad0f225c00David Goodwin 414046fa3f90a31ebfa10df89ae348f478d492709a9Evan Cheng // If this is a ctrl dep, latency is 1. 415c558bf397257f5ef902bdb45a28e622ee2b5b4f2Andrew Trick unsigned OpLatency = isChain ? 1 : OpSU->Latency; 41687896d9368e08d93493427ce7bf8272d1e5cca35Andrew Trick // Special-case TokenFactor chains as zero-latency. 41787896d9368e08d93493427ce7bf8272d1e5cca35Andrew Trick if(isChain && OpN->getOpcode() == ISD::TokenFactor) 41887896d9368e08d93493427ce7bf8272d1e5cca35Andrew Trick OpLatency = 0; 41987896d9368e08d93493427ce7bf8272d1e5cca35Andrew Trick 420046fa3f90a31ebfa10df89ae348f478d492709a9Evan Cheng const SDep &dep = SDep(OpSU, isChain ? SDep::Order : SDep::Data, 421046fa3f90a31ebfa10df89ae348f478d492709a9Evan Cheng OpLatency, PhysReg); 422dc4bdcdef1c8dd1a28b82deb08df039e5c0ffc5aDavid Goodwin if (!isChain && !UnitLatencies) { 42315a16def6e70c8f7df1023da80ceb89887203b40Evan Cheng ComputeOperandLatency(OpN, N, i, const_cast<SDep &>(dep)); 4243fb150a9024a38872ec4abbc3300e08a8bfc1812Dan Gohman ST.adjustSchedDependency(OpSU, SU, const_cast<SDep &>(dep)); 425dc4bdcdef1c8dd1a28b82deb08df039e5c0ffc5aDavid Goodwin } 426710461688bba935f0ad5c75da7fec2ad0f225c00David Goodwin 4274bbf4678e341e9bf899c0faa3e3bcfe134db81ebAndrew Trick if (!SU->addPred(dep) && !dep.isCtrl() && OpSU->NumRegDefsLeft > 1) { 42892e946630d5f9bb092853b93501387dd216899b9Andrew Trick // Multiple register uses are combined in the same SUnit. For example, 42992e946630d5f9bb092853b93501387dd216899b9Andrew Trick // we could have a set of glued nodes with all their defs consumed by 43092e946630d5f9bb092853b93501387dd216899b9Andrew Trick // another set of glued nodes. Register pressure tracking sees this as 43192e946630d5f9bb092853b93501387dd216899b9Andrew Trick // a single use, so to keep pressure balanced we reduce the defs. 4324bbf4678e341e9bf899c0faa3e3bcfe134db81ebAndrew Trick // 4334bbf4678e341e9bf899c0faa3e3bcfe134db81ebAndrew Trick // We can't tell (without more book-keeping) if this results from 4344bbf4678e341e9bf899c0faa3e3bcfe134db81ebAndrew Trick // glued nodes or duplicate operands. As long as we don't reduce 4354bbf4678e341e9bf899c0faa3e3bcfe134db81ebAndrew Trick // NumRegDefsLeft to zero, we handle the common cases well. 43692e946630d5f9bb092853b93501387dd216899b9Andrew Trick --OpSU->NumRegDefsLeft; 43792e946630d5f9bb092853b93501387dd216899b9Andrew Trick } 438343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman } 439343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman } 440343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman } 441343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman} 442343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman 443c9a5b9e38b442c2ae6b115213a07df3fcd14708dDan Gohman/// BuildSchedGraph - Build the SUnit graph from the selection dag that we 444c9a5b9e38b442c2ae6b115213a07df3fcd14708dDan Gohman/// are input. This SUnit graph is similar to the SelectionDAG, but 445c9a5b9e38b442c2ae6b115213a07df3fcd14708dDan Gohman/// excludes nodes that aren't interesting to scheduling, and represents 44629d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner/// glued together nodes with a single SUnit. 44798976e4dcd18adbbe676048c0069e67346eb4adeDan Gohmanvoid ScheduleDAGSDNodes::BuildSchedGraph(AliasAnalysis *AA) { 448302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng // Cluster certain nodes which should be scheduled together. 449302ef834e0a2fd03e4b435079a9fa6c1e1cdc23bEvan Cheng ClusterNodes(); 450c9a5b9e38b442c2ae6b115213a07df3fcd14708dDan Gohman // Populate the SUnits array. 451c9a5b9e38b442c2ae6b115213a07df3fcd14708dDan Gohman BuildSchedUnits(); 452c9a5b9e38b442c2ae6b115213a07df3fcd14708dDan Gohman // Compute all the scheduling dependencies between nodes. 453c9a5b9e38b442c2ae6b115213a07df3fcd14708dDan Gohman AddSchedEdges(); 454c9a5b9e38b442c2ae6b115213a07df3fcd14708dDan Gohman} 455c9a5b9e38b442c2ae6b115213a07df3fcd14708dDan Gohman 45692e946630d5f9bb092853b93501387dd216899b9Andrew Trick// Initialize NumNodeDefs for the current Node's opcode. 45792e946630d5f9bb092853b93501387dd216899b9Andrew Trickvoid ScheduleDAGSDNodes::RegDefIter::InitNodeNumDefs() { 45829449448b0f0420dfcf52e278fc01adbf1690d70Eric Christopher // Check for phys reg copy. 45929449448b0f0420dfcf52e278fc01adbf1690d70Eric Christopher if (!Node) 46029449448b0f0420dfcf52e278fc01adbf1690d70Eric Christopher return; 46129449448b0f0420dfcf52e278fc01adbf1690d70Eric Christopher 46292e946630d5f9bb092853b93501387dd216899b9Andrew Trick if (!Node->isMachineOpcode()) { 46392e946630d5f9bb092853b93501387dd216899b9Andrew Trick if (Node->getOpcode() == ISD::CopyFromReg) 46492e946630d5f9bb092853b93501387dd216899b9Andrew Trick NodeNumDefs = 1; 46592e946630d5f9bb092853b93501387dd216899b9Andrew Trick else 46692e946630d5f9bb092853b93501387dd216899b9Andrew Trick NodeNumDefs = 0; 46792e946630d5f9bb092853b93501387dd216899b9Andrew Trick return; 46892e946630d5f9bb092853b93501387dd216899b9Andrew Trick } 46992e946630d5f9bb092853b93501387dd216899b9Andrew Trick unsigned POpc = Node->getMachineOpcode(); 47092e946630d5f9bb092853b93501387dd216899b9Andrew Trick if (POpc == TargetOpcode::IMPLICIT_DEF) { 47192e946630d5f9bb092853b93501387dd216899b9Andrew Trick // No register need be allocated for this. 47292e946630d5f9bb092853b93501387dd216899b9Andrew Trick NodeNumDefs = 0; 47392e946630d5f9bb092853b93501387dd216899b9Andrew Trick return; 47492e946630d5f9bb092853b93501387dd216899b9Andrew Trick } 47592e946630d5f9bb092853b93501387dd216899b9Andrew Trick unsigned NRegDefs = SchedDAG->TII->get(Node->getMachineOpcode()).getNumDefs(); 47692e946630d5f9bb092853b93501387dd216899b9Andrew Trick // Some instructions define regs that are not represented in the selection DAG 47792e946630d5f9bb092853b93501387dd216899b9Andrew Trick // (e.g. unused flags). See tMOVi8. Make sure we don't access past NumValues. 47892e946630d5f9bb092853b93501387dd216899b9Andrew Trick NodeNumDefs = std::min(Node->getNumValues(), NRegDefs); 47992e946630d5f9bb092853b93501387dd216899b9Andrew Trick DefIdx = 0; 48092e946630d5f9bb092853b93501387dd216899b9Andrew Trick} 48192e946630d5f9bb092853b93501387dd216899b9Andrew Trick 48292e946630d5f9bb092853b93501387dd216899b9Andrew Trick// Construct a RegDefIter for this SUnit and find the first valid value. 48392e946630d5f9bb092853b93501387dd216899b9Andrew TrickScheduleDAGSDNodes::RegDefIter::RegDefIter(const SUnit *SU, 48492e946630d5f9bb092853b93501387dd216899b9Andrew Trick const ScheduleDAGSDNodes *SD) 48592e946630d5f9bb092853b93501387dd216899b9Andrew Trick : SchedDAG(SD), Node(SU->getNode()), DefIdx(0), NodeNumDefs(0) { 48692e946630d5f9bb092853b93501387dd216899b9Andrew Trick InitNodeNumDefs(); 48792e946630d5f9bb092853b93501387dd216899b9Andrew Trick Advance(); 48892e946630d5f9bb092853b93501387dd216899b9Andrew Trick} 48992e946630d5f9bb092853b93501387dd216899b9Andrew Trick 49092e946630d5f9bb092853b93501387dd216899b9Andrew Trick// Advance to the next valid value defined by the SUnit. 49192e946630d5f9bb092853b93501387dd216899b9Andrew Trickvoid ScheduleDAGSDNodes::RegDefIter::Advance() { 49292e946630d5f9bb092853b93501387dd216899b9Andrew Trick for (;Node;) { // Visit all glued nodes. 49392e946630d5f9bb092853b93501387dd216899b9Andrew Trick for (;DefIdx < NodeNumDefs; ++DefIdx) { 49492e946630d5f9bb092853b93501387dd216899b9Andrew Trick if (!Node->hasAnyUseOfValue(DefIdx)) 49592e946630d5f9bb092853b93501387dd216899b9Andrew Trick continue; 49692e946630d5f9bb092853b93501387dd216899b9Andrew Trick if (Node->isMachineOpcode() && 49792e946630d5f9bb092853b93501387dd216899b9Andrew Trick Node->getMachineOpcode() == TargetOpcode::EXTRACT_SUBREG) { 49892e946630d5f9bb092853b93501387dd216899b9Andrew Trick // Propagate the incoming (full-register) type. I doubt it's needed. 49992e946630d5f9bb092853b93501387dd216899b9Andrew Trick ValueType = Node->getOperand(0).getValueType(); 50092e946630d5f9bb092853b93501387dd216899b9Andrew Trick } 50192e946630d5f9bb092853b93501387dd216899b9Andrew Trick else { 50292e946630d5f9bb092853b93501387dd216899b9Andrew Trick ValueType = Node->getValueType(DefIdx); 50392e946630d5f9bb092853b93501387dd216899b9Andrew Trick } 50492e946630d5f9bb092853b93501387dd216899b9Andrew Trick ++DefIdx; 50592e946630d5f9bb092853b93501387dd216899b9Andrew Trick return; // Found a normal regdef. 50692e946630d5f9bb092853b93501387dd216899b9Andrew Trick } 50792e946630d5f9bb092853b93501387dd216899b9Andrew Trick Node = Node->getGluedNode(); 50892e946630d5f9bb092853b93501387dd216899b9Andrew Trick if (Node == NULL) { 50992e946630d5f9bb092853b93501387dd216899b9Andrew Trick return; // No values left to visit. 51092e946630d5f9bb092853b93501387dd216899b9Andrew Trick } 51192e946630d5f9bb092853b93501387dd216899b9Andrew Trick InitNodeNumDefs(); 51292e946630d5f9bb092853b93501387dd216899b9Andrew Trick } 51392e946630d5f9bb092853b93501387dd216899b9Andrew Trick} 51492e946630d5f9bb092853b93501387dd216899b9Andrew Trick 51592e946630d5f9bb092853b93501387dd216899b9Andrew Trickvoid ScheduleDAGSDNodes::InitNumRegDefsLeft(SUnit *SU) { 51692e946630d5f9bb092853b93501387dd216899b9Andrew Trick assert(SU->NumRegDefsLeft == 0 && "expect a new node"); 51792e946630d5f9bb092853b93501387dd216899b9Andrew Trick for (RegDefIter I(SU, this); I.IsValid(); I.Advance()) { 51892e946630d5f9bb092853b93501387dd216899b9Andrew Trick assert(SU->NumRegDefsLeft < USHRT_MAX && "overflow is ok but unexpected"); 51992e946630d5f9bb092853b93501387dd216899b9Andrew Trick ++SU->NumRegDefsLeft; 52092e946630d5f9bb092853b93501387dd216899b9Andrew Trick } 52192e946630d5f9bb092853b93501387dd216899b9Andrew Trick} 52292e946630d5f9bb092853b93501387dd216899b9Andrew Trick 523343f0c046702831a4a6aec951b6a297a23241a55Dan Gohmanvoid ScheduleDAGSDNodes::ComputeLatency(SUnit *SU) { 52487896d9368e08d93493427ce7bf8272d1e5cca35Andrew Trick SDNode *N = SU->getNode(); 52587896d9368e08d93493427ce7bf8272d1e5cca35Andrew Trick 52687896d9368e08d93493427ce7bf8272d1e5cca35Andrew Trick // TokenFactor operands are considered zero latency, and some schedulers 52787896d9368e08d93493427ce7bf8272d1e5cca35Andrew Trick // (e.g. Top-Down list) may rely on the fact that operand latency is nonzero 52887896d9368e08d93493427ce7bf8272d1e5cca35Andrew Trick // whenever node latency is nonzero. 52987896d9368e08d93493427ce7bf8272d1e5cca35Andrew Trick if (N && N->getOpcode() == ISD::TokenFactor) { 53087896d9368e08d93493427ce7bf8272d1e5cca35Andrew Trick SU->Latency = 0; 53187896d9368e08d93493427ce7bf8272d1e5cca35Andrew Trick return; 53287896d9368e08d93493427ce7bf8272d1e5cca35Andrew Trick } 53387896d9368e08d93493427ce7bf8272d1e5cca35Andrew Trick 534e163168aab987dc3df0845b9e92310f764d8b158Evan Cheng // Check to see if the scheduler cares about latencies. 535e163168aab987dc3df0845b9e92310f764d8b158Evan Cheng if (ForceUnitLatencies()) { 536e163168aab987dc3df0845b9e92310f764d8b158Evan Cheng SU->Latency = 1; 537e163168aab987dc3df0845b9e92310f764d8b158Evan Cheng return; 538e163168aab987dc3df0845b9e92310f764d8b158Evan Cheng } 539e163168aab987dc3df0845b9e92310f764d8b158Evan Cheng 5403ef1c8759a20167457eb7fd82ebcaffe7ccaa1d1Evan Cheng if (!InstrItins || InstrItins->isEmpty()) { 5415e84e3ccaa555bd48ecca384e93e55abd76fb40aAndrew Trick if (N && N->isMachineOpcode() && 5425e84e3ccaa555bd48ecca384e93e55abd76fb40aAndrew Trick TII->isHighLatencyDef(N->getMachineOpcode())) 543e0ef509aeb47b396cf1bdc170ca4f468f799719fAndrew Trick SU->Latency = HighLatencyCycles; 544e0ef509aeb47b396cf1bdc170ca4f468f799719fAndrew Trick else 545e0ef509aeb47b396cf1bdc170ca4f468f799719fAndrew Trick SU->Latency = 1; 54615a16def6e70c8f7df1023da80ceb89887203b40Evan Cheng return; 54715a16def6e70c8f7df1023da80ceb89887203b40Evan Cheng } 548cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trick 549343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman // Compute the latency for the node. We use the sum of the latencies for 55029d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner // all nodes glued together into this SUnit. 551343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman SU->Latency = 0; 55229d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner for (SDNode *N = SU->getNode(); N; N = N->getGluedNode()) 5538239daf7c83a65a189c352cce3191cdc3bbfe151Evan Cheng if (N->isMachineOpcode()) 5548239daf7c83a65a189c352cce3191cdc3bbfe151Evan Cheng SU->Latency += TII->getInstrLatency(InstrItins, N); 555343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman} 556343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman 55715a16def6e70c8f7df1023da80ceb89887203b40Evan Chengvoid ScheduleDAGSDNodes::ComputeOperandLatency(SDNode *Def, SDNode *Use, 55815a16def6e70c8f7df1023da80ceb89887203b40Evan Cheng unsigned OpIdx, SDep& dep) const{ 55915a16def6e70c8f7df1023da80ceb89887203b40Evan Cheng // Check to see if the scheduler cares about latencies. 56015a16def6e70c8f7df1023da80ceb89887203b40Evan Cheng if (ForceUnitLatencies()) 56115a16def6e70c8f7df1023da80ceb89887203b40Evan Cheng return; 56215a16def6e70c8f7df1023da80ceb89887203b40Evan Cheng 56315a16def6e70c8f7df1023da80ceb89887203b40Evan Cheng if (dep.getKind() != SDep::Data) 56415a16def6e70c8f7df1023da80ceb89887203b40Evan Cheng return; 56515a16def6e70c8f7df1023da80ceb89887203b40Evan Cheng 56615a16def6e70c8f7df1023da80ceb89887203b40Evan Cheng unsigned DefIdx = Use->getOperand(OpIdx).getResNo(); 5677e2fe9150f905167f6685c9730911c2abc08293cEvan Cheng if (Use->isMachineOpcode()) 5687e2fe9150f905167f6685c9730911c2abc08293cEvan Cheng // Adjust the use operand index by num of defs. 5697e2fe9150f905167f6685c9730911c2abc08293cEvan Cheng OpIdx += TII->get(Use->getMachineOpcode()).getNumDefs(); 570a0792de66c8364d47b0a688c7f408efb7b10f31bEvan Cheng int Latency = TII->getOperandLatency(InstrItins, Def, DefIdx, Use, OpIdx); 571089751535d6e9adf65842e2ca5867bf9a70e1e95Evan Cheng if (Latency > 1 && Use->getOpcode() == ISD::CopyToReg && 572089751535d6e9adf65842e2ca5867bf9a70e1e95Evan Cheng !BB->succ_empty()) { 573089751535d6e9adf65842e2ca5867bf9a70e1e95Evan Cheng unsigned Reg = cast<RegisterSDNode>(Use->getOperand(1))->getReg(); 574089751535d6e9adf65842e2ca5867bf9a70e1e95Evan Cheng if (TargetRegisterInfo::isVirtualRegister(Reg)) 575089751535d6e9adf65842e2ca5867bf9a70e1e95Evan Cheng // This copy is a liveout value. It is likely coalesced, so reduce the 576089751535d6e9adf65842e2ca5867bf9a70e1e95Evan Cheng // latency so not to penalize the def. 577089751535d6e9adf65842e2ca5867bf9a70e1e95Evan Cheng // FIXME: need target specific adjustment here? 578089751535d6e9adf65842e2ca5867bf9a70e1e95Evan Cheng Latency = (Latency > 1) ? Latency - 1 : 1; 579089751535d6e9adf65842e2ca5867bf9a70e1e95Evan Cheng } 5803881cb7a5d54c0011b40997adcd742e1c7b91abdEvan Cheng if (Latency >= 0) 5813881cb7a5d54c0011b40997adcd742e1c7b91abdEvan Cheng dep.setLatency(Latency); 58215a16def6e70c8f7df1023da80ceb89887203b40Evan Cheng} 58315a16def6e70c8f7df1023da80ceb89887203b40Evan Cheng 584343f0c046702831a4a6aec951b6a297a23241a55Dan Gohmanvoid ScheduleDAGSDNodes::dumpNode(const SUnit *SU) const { 585c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng if (!SU->getNode()) { 58684fa8229bbd3813505b7e8d6555fb2e522104e30David Greene dbgs() << "PHYS REG COPY\n"; 587c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng return; 588c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng } 589c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng 590c29a56dedbe4297dad94b9bf2e19035c5903fd1fEvan Cheng SU->getNode()->dump(DAG); 59184fa8229bbd3813505b7e8d6555fb2e522104e30David Greene dbgs() << "\n"; 59229d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner SmallVector<SDNode *, 4> GluedNodes; 59329d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner for (SDNode *N = SU->getNode()->getGluedNode(); N; N = N->getGluedNode()) 59429d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner GluedNodes.push_back(N); 59529d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner while (!GluedNodes.empty()) { 59684fa8229bbd3813505b7e8d6555fb2e522104e30David Greene dbgs() << " "; 59729d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner GluedNodes.back()->dump(DAG); 59884fa8229bbd3813505b7e8d6555fb2e522104e30David Greene dbgs() << "\n"; 59929d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner GluedNodes.pop_back(); 600343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman } 601343f0c046702831a4a6aec951b6a297a23241a55Dan Gohman} 602bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman 603bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Chengnamespace { 604bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng struct OrderSorter { 605bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng bool operator()(const std::pair<unsigned, MachineInstr*> &A, 606bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng const std::pair<unsigned, MachineInstr*> &B) { 607bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng return A.first < B.first; 608bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng } 609bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng }; 610bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng} 611bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng 61255d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel/// ProcessSDDbgValues - Process SDDbgValues assoicated with this node. 613cd5af07c4573c6b1270d6737e76ef3219091a733Andrew Trickstatic void ProcessSDDbgValues(SDNode *N, SelectionDAG *DAG, 61455d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel InstrEmitter &Emitter, 61555d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel SmallVector<std::pair<unsigned, MachineInstr*>, 32> &Orders, 61655d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel DenseMap<SDValue, unsigned> &VRBaseMap, 61755d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel unsigned Order) { 61855d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel if (!N->getHasDebugValue()) 61955d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel return; 62055d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel 62155d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel // Opportunistically insert immediate dbg_value uses, i.e. those with source 62255d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel // order number right after the N. 62355d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel MachineBasicBlock *BB = Emitter.getBlock(); 62455d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel MachineBasicBlock::iterator InsertPos = Emitter.getInsertPos(); 62555d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel SmallVector<SDDbgValue*,2> &DVs = DAG->GetDbgValues(N); 62655d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel for (unsigned i = 0, e = DVs.size(); i != e; ++i) { 62755d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel if (DVs[i]->isInvalidated()) 62855d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel continue; 62955d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel unsigned DVOrder = DVs[i]->getOrder(); 63055d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel if (!Order || DVOrder == ++Order) { 63155d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel MachineInstr *DbgMI = Emitter.EmitDbgValue(DVs[i], VRBaseMap); 63255d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel if (DbgMI) { 63355d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel Orders.push_back(std::make_pair(DVOrder, DbgMI)); 63455d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel BB->insert(InsertPos, DbgMI); 63555d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel } 63655d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel DVs[i]->setIsInvalidated(); 63755d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel } 63855d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel } 63955d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel} 64055d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel 641bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng// ProcessSourceNode - Process nodes with source order numbers. These are added 642d27946d1d4272d7e2bbee00fac020dc8147dfd25Jim Grosbach// to a vector which EmitSchedule uses to determine how to insert dbg_value 643bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng// instructions in the right order. 644bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Chengstatic void ProcessSourceNode(SDNode *N, SelectionDAG *DAG, 645bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng InstrEmitter &Emitter, 646bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng DenseMap<SDValue, unsigned> &VRBaseMap, 647bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng SmallVector<std::pair<unsigned, MachineInstr*>, 32> &Orders, 648bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng SmallSet<unsigned, 8> &Seen) { 649bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng unsigned Order = DAG->GetOrdering(N); 65039078a8bde256ee22e981713a4d2ff8235dc7706Devang Patel if (!Order || !Seen.insert(Order)) { 65139078a8bde256ee22e981713a4d2ff8235dc7706Devang Patel // Process any valid SDDbgValues even if node does not have any order 65239078a8bde256ee22e981713a4d2ff8235dc7706Devang Patel // assigned. 65339078a8bde256ee22e981713a4d2ff8235dc7706Devang Patel ProcessSDDbgValues(N, DAG, Emitter, Orders, VRBaseMap, 0); 654bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng return; 65539078a8bde256ee22e981713a4d2ff8235dc7706Devang Patel } 656bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng 657bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng MachineBasicBlock *BB = Emitter.getBlock(); 65884023e0fbefc406a4c611d3d64a10df5d3a97dd7Dan Gohman if (Emitter.getInsertPos() == BB->begin() || BB->back().isPHI()) { 659bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng // Did not insert any instruction. 660bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng Orders.push_back(std::make_pair(Order, (MachineInstr*)0)); 661bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng return; 662bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng } 663bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng 66484023e0fbefc406a4c611d3d64a10df5d3a97dd7Dan Gohman Orders.push_back(std::make_pair(Order, prior(Emitter.getInsertPos()))); 66555d20e8ff1e458f177302386d14f1a4dbdd86028Devang Patel ProcessSDDbgValues(N, DAG, Emitter, Orders, VRBaseMap, Order); 666bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng} 667bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng 668bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng 669bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman/// EmitSchedule - Emit the machine code in scheduled order. 670af1d8ca44a18f304f207e209b3bdb94b590f86ffDan GohmanMachineBasicBlock *ScheduleDAGSDNodes::EmitSchedule() { 671bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman InstrEmitter Emitter(BB, InsertPos); 672bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman DenseMap<SDValue, unsigned> VRBaseMap; 673bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman DenseMap<SUnit*, unsigned> CopyVRBaseMap; 674bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng SmallVector<std::pair<unsigned, MachineInstr*>, 32> Orders; 675bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng SmallSet<unsigned, 8> Seen; 676bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng bool HasDbg = DAG->hasDebugValues(); 677bfdf7f38523bd38ae0538861a2bfd8bdc46e5c33Dale Johannesen 678fdb42fa5fe794cc2c89e2ed7f57a89ed24d9952aDale Johannesen // If this is the first BB, emit byval parameter dbg_value's. 679fdb42fa5fe794cc2c89e2ed7f57a89ed24d9952aDale Johannesen if (HasDbg && BB->getParent()->begin() == MachineFunction::iterator(BB)) { 680fdb42fa5fe794cc2c89e2ed7f57a89ed24d9952aDale Johannesen SDDbgInfo::DbgIterator PDI = DAG->ByvalParmDbgBegin(); 681fdb42fa5fe794cc2c89e2ed7f57a89ed24d9952aDale Johannesen SDDbgInfo::DbgIterator PDE = DAG->ByvalParmDbgEnd(); 682fdb42fa5fe794cc2c89e2ed7f57a89ed24d9952aDale Johannesen for (; PDI != PDE; ++PDI) { 683891ff8fbd61a06ef8ea57461fa377ebbb663ed09Dan Gohman MachineInstr *DbgMI= Emitter.EmitDbgValue(*PDI, VRBaseMap); 684fdb42fa5fe794cc2c89e2ed7f57a89ed24d9952aDale Johannesen if (DbgMI) 68584023e0fbefc406a4c611d3d64a10df5d3a97dd7Dan Gohman BB->insert(InsertPos, DbgMI); 686fdb42fa5fe794cc2c89e2ed7f57a89ed24d9952aDale Johannesen } 687fdb42fa5fe794cc2c89e2ed7f57a89ed24d9952aDale Johannesen } 688fdb42fa5fe794cc2c89e2ed7f57a89ed24d9952aDale Johannesen 689bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman for (unsigned i = 0, e = Sequence.size(); i != e; i++) { 690bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman SUnit *SU = Sequence[i]; 691bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman if (!SU) { 692bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman // Null SUnit* is a noop. 693bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman EmitNoop(); 694bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman continue; 695bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman } 696bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman 697bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman // For pre-regalloc scheduling, create instructions corresponding to the 69829d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner // SDNode and any glued SDNodes and append them to the block. 699bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman if (!SU->getNode()) { 700bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman // Emit a copy. 701bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman EmitPhysRegCopy(SU, CopyVRBaseMap); 702bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman continue; 703bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman } 704bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman 70529d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner SmallVector<SDNode *, 4> GluedNodes; 70629d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner for (SDNode *N = SU->getNode()->getGluedNode(); N; 70729d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner N = N->getGluedNode()) 70829d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner GluedNodes.push_back(N); 70929d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner while (!GluedNodes.empty()) { 71029d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner SDNode *N = GluedNodes.back(); 71129d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner Emitter.EmitNode(GluedNodes.back(), SU->OrigNode != SU, SU->isCloned, 712af1d8ca44a18f304f207e209b3bdb94b590f86ffDan Gohman VRBaseMap); 713fdb42fa5fe794cc2c89e2ed7f57a89ed24d9952aDale Johannesen // Remember the source order of the inserted instruction. 714bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng if (HasDbg) 715891ff8fbd61a06ef8ea57461fa377ebbb663ed09Dan Gohman ProcessSourceNode(N, DAG, Emitter, VRBaseMap, Orders, Seen); 71629d8f0cae425f1bba583565227eaebf58f26ce73Chris Lattner GluedNodes.pop_back(); 717bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman } 718bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman Emitter.EmitNode(SU->getNode(), SU->OrigNode != SU, SU->isCloned, 719af1d8ca44a18f304f207e209b3bdb94b590f86ffDan Gohman VRBaseMap); 720fdb42fa5fe794cc2c89e2ed7f57a89ed24d9952aDale Johannesen // Remember the source order of the inserted instruction. 721bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng if (HasDbg) 722891ff8fbd61a06ef8ea57461fa377ebbb663ed09Dan Gohman ProcessSourceNode(SU->getNode(), DAG, Emitter, VRBaseMap, Orders, 723bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng Seen); 724bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng } 725bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng 726fdb42fa5fe794cc2c89e2ed7f57a89ed24d9952aDale Johannesen // Insert all the dbg_values which have not already been inserted in source 727bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng // order sequence. 728bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng if (HasDbg) { 72984023e0fbefc406a4c611d3d64a10df5d3a97dd7Dan Gohman MachineBasicBlock::iterator BBBegin = BB->getFirstNonPHI(); 730bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng 731bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng // Sort the source order instructions and use the order to insert debug 732bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng // values. 733bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng std::sort(Orders.begin(), Orders.end(), OrderSorter()); 734bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng 735bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng SDDbgInfo::DbgIterator DI = DAG->DbgBegin(); 736bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng SDDbgInfo::DbgIterator DE = DAG->DbgEnd(); 737bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng // Now emit the rest according to source order. 738bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng unsigned LastOrder = 0; 739bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng for (unsigned i = 0, e = Orders.size(); i != e && DI != DE; ++i) { 740bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng unsigned Order = Orders[i].first; 741bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng MachineInstr *MI = Orders[i].second; 742bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng // Insert all SDDbgValue's whose order(s) are before "Order". 743bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng if (!MI) 744bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng continue; 745bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng for (; DI != DE && 746bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng (*DI)->getOrder() >= LastOrder && (*DI)->getOrder() < Order; ++DI) { 747bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng if ((*DI)->isInvalidated()) 748bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng continue; 749891ff8fbd61a06ef8ea57461fa377ebbb663ed09Dan Gohman MachineInstr *DbgMI = Emitter.EmitDbgValue(*DI, VRBaseMap); 750962021bc7f6721c20c7dfe8ca809e2d98b1c554aEvan Cheng if (DbgMI) { 751962021bc7f6721c20c7dfe8ca809e2d98b1c554aEvan Cheng if (!LastOrder) 752962021bc7f6721c20c7dfe8ca809e2d98b1c554aEvan Cheng // Insert to start of the BB (after PHIs). 753962021bc7f6721c20c7dfe8ca809e2d98b1c554aEvan Cheng BB->insert(BBBegin, DbgMI); 754962021bc7f6721c20c7dfe8ca809e2d98b1c554aEvan Cheng else { 755a8dab36f3dfdfcd3f74224afa4ffb32776674c93Dan Gohman // Insert at the instruction, which may be in a different 756a8dab36f3dfdfcd3f74224afa4ffb32776674c93Dan Gohman // block, if the block was split by a custom inserter. 757962021bc7f6721c20c7dfe8ca809e2d98b1c554aEvan Cheng MachineBasicBlock::iterator Pos = MI; 758a8dab36f3dfdfcd3f74224afa4ffb32776674c93Dan Gohman MI->getParent()->insert(llvm::next(Pos), DbgMI); 759962021bc7f6721c20c7dfe8ca809e2d98b1c554aEvan Cheng } 760bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng } 761bfdf7f38523bd38ae0538861a2bfd8bdc46e5c33Dale Johannesen } 762bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng LastOrder = Order; 763bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng } 764bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng // Add trailing DbgValue's before the terminator. FIXME: May want to add 765bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng // some of them before one or more conditional branches? 766bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng while (DI != DE) { 767bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng MachineBasicBlock *InsertBB = Emitter.getBlock(); 768bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng MachineBasicBlock::iterator Pos= Emitter.getBlock()->getFirstTerminator(); 769bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng if (!(*DI)->isInvalidated()) { 770891ff8fbd61a06ef8ea57461fa377ebbb663ed09Dan Gohman MachineInstr *DbgMI= Emitter.EmitDbgValue(*DI, VRBaseMap); 771962021bc7f6721c20c7dfe8ca809e2d98b1c554aEvan Cheng if (DbgMI) 772962021bc7f6721c20c7dfe8ca809e2d98b1c554aEvan Cheng InsertBB->insert(Pos, DbgMI); 773bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng } 774bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng ++DI; 775bfcb3051899b7141a946d769fcf6e8a8453bc530Evan Cheng } 776bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman } 777bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman 778bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman BB = Emitter.getBlock(); 779bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman InsertPos = Emitter.getInsertPos(); 780bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman return BB; 781bcea859fc1dd1af9ac66ec93ea04ce9a19c8451cDan Gohman} 782