1*9880d681SAndroid Build Coastguard Worker //===-- R600MachineScheduler.cpp - R600 Scheduler Interface -*- C++ -*-----===//
2*9880d681SAndroid Build Coastguard Worker //
3*9880d681SAndroid Build Coastguard Worker // The LLVM Compiler Infrastructure
4*9880d681SAndroid Build Coastguard Worker //
5*9880d681SAndroid Build Coastguard Worker // This file is distributed under the University of Illinois Open Source
6*9880d681SAndroid Build Coastguard Worker // License. See LICENSE.TXT for details.
7*9880d681SAndroid Build Coastguard Worker //
8*9880d681SAndroid Build Coastguard Worker //===----------------------------------------------------------------------===//
9*9880d681SAndroid Build Coastguard Worker //
10*9880d681SAndroid Build Coastguard Worker /// \file
11*9880d681SAndroid Build Coastguard Worker /// \brief R600 Machine Scheduler interface
12*9880d681SAndroid Build Coastguard Worker //
13*9880d681SAndroid Build Coastguard Worker //===----------------------------------------------------------------------===//
14*9880d681SAndroid Build Coastguard Worker
15*9880d681SAndroid Build Coastguard Worker #include "R600MachineScheduler.h"
16*9880d681SAndroid Build Coastguard Worker #include "R600InstrInfo.h"
17*9880d681SAndroid Build Coastguard Worker #include "AMDGPUSubtarget.h"
18*9880d681SAndroid Build Coastguard Worker #include "llvm/CodeGen/MachineRegisterInfo.h"
19*9880d681SAndroid Build Coastguard Worker #include "llvm/Pass.h"
20*9880d681SAndroid Build Coastguard Worker #include "llvm/IR/LegacyPassManager.h"
21*9880d681SAndroid Build Coastguard Worker #include "llvm/Support/raw_ostream.h"
22*9880d681SAndroid Build Coastguard Worker
23*9880d681SAndroid Build Coastguard Worker using namespace llvm;
24*9880d681SAndroid Build Coastguard Worker
25*9880d681SAndroid Build Coastguard Worker #define DEBUG_TYPE "misched"
26*9880d681SAndroid Build Coastguard Worker
initialize(ScheduleDAGMI * dag)27*9880d681SAndroid Build Coastguard Worker void R600SchedStrategy::initialize(ScheduleDAGMI *dag) {
28*9880d681SAndroid Build Coastguard Worker assert(dag->hasVRegLiveness() && "R600SchedStrategy needs vreg liveness");
29*9880d681SAndroid Build Coastguard Worker DAG = static_cast<ScheduleDAGMILive*>(dag);
30*9880d681SAndroid Build Coastguard Worker const R600Subtarget &ST = DAG->MF.getSubtarget<R600Subtarget>();
31*9880d681SAndroid Build Coastguard Worker TII = static_cast<const R600InstrInfo*>(DAG->TII);
32*9880d681SAndroid Build Coastguard Worker TRI = static_cast<const R600RegisterInfo*>(DAG->TRI);
33*9880d681SAndroid Build Coastguard Worker VLIW5 = !ST.hasCaymanISA();
34*9880d681SAndroid Build Coastguard Worker MRI = &DAG->MRI;
35*9880d681SAndroid Build Coastguard Worker CurInstKind = IDOther;
36*9880d681SAndroid Build Coastguard Worker CurEmitted = 0;
37*9880d681SAndroid Build Coastguard Worker OccupedSlotsMask = 31;
38*9880d681SAndroid Build Coastguard Worker InstKindLimit[IDAlu] = TII->getMaxAlusPerClause();
39*9880d681SAndroid Build Coastguard Worker InstKindLimit[IDOther] = 32;
40*9880d681SAndroid Build Coastguard Worker InstKindLimit[IDFetch] = ST.getTexVTXClauseSize();
41*9880d681SAndroid Build Coastguard Worker AluInstCount = 0;
42*9880d681SAndroid Build Coastguard Worker FetchInstCount = 0;
43*9880d681SAndroid Build Coastguard Worker }
44*9880d681SAndroid Build Coastguard Worker
MoveUnits(std::vector<SUnit * > & QSrc,std::vector<SUnit * > & QDst)45*9880d681SAndroid Build Coastguard Worker void R600SchedStrategy::MoveUnits(std::vector<SUnit *> &QSrc,
46*9880d681SAndroid Build Coastguard Worker std::vector<SUnit *> &QDst)
47*9880d681SAndroid Build Coastguard Worker {
48*9880d681SAndroid Build Coastguard Worker QDst.insert(QDst.end(), QSrc.begin(), QSrc.end());
49*9880d681SAndroid Build Coastguard Worker QSrc.clear();
50*9880d681SAndroid Build Coastguard Worker }
51*9880d681SAndroid Build Coastguard Worker
getWFCountLimitedByGPR(unsigned GPRCount)52*9880d681SAndroid Build Coastguard Worker static unsigned getWFCountLimitedByGPR(unsigned GPRCount) {
53*9880d681SAndroid Build Coastguard Worker assert (GPRCount && "GPRCount cannot be 0");
54*9880d681SAndroid Build Coastguard Worker return 248 / GPRCount;
55*9880d681SAndroid Build Coastguard Worker }
56*9880d681SAndroid Build Coastguard Worker
pickNode(bool & IsTopNode)57*9880d681SAndroid Build Coastguard Worker SUnit* R600SchedStrategy::pickNode(bool &IsTopNode) {
58*9880d681SAndroid Build Coastguard Worker SUnit *SU = nullptr;
59*9880d681SAndroid Build Coastguard Worker NextInstKind = IDOther;
60*9880d681SAndroid Build Coastguard Worker
61*9880d681SAndroid Build Coastguard Worker IsTopNode = false;
62*9880d681SAndroid Build Coastguard Worker
63*9880d681SAndroid Build Coastguard Worker // check if we might want to switch current clause type
64*9880d681SAndroid Build Coastguard Worker bool AllowSwitchToAlu = (CurEmitted >= InstKindLimit[CurInstKind]) ||
65*9880d681SAndroid Build Coastguard Worker (Available[CurInstKind].empty());
66*9880d681SAndroid Build Coastguard Worker bool AllowSwitchFromAlu = (CurEmitted >= InstKindLimit[CurInstKind]) &&
67*9880d681SAndroid Build Coastguard Worker (!Available[IDFetch].empty() || !Available[IDOther].empty());
68*9880d681SAndroid Build Coastguard Worker
69*9880d681SAndroid Build Coastguard Worker if (CurInstKind == IDAlu && !Available[IDFetch].empty()) {
70*9880d681SAndroid Build Coastguard Worker // We use the heuristic provided by AMD Accelerated Parallel Processing
71*9880d681SAndroid Build Coastguard Worker // OpenCL Programming Guide :
72*9880d681SAndroid Build Coastguard Worker // The approx. number of WF that allows TEX inst to hide ALU inst is :
73*9880d681SAndroid Build Coastguard Worker // 500 (cycles for TEX) / (AluFetchRatio * 8 (cycles for ALU))
74*9880d681SAndroid Build Coastguard Worker float ALUFetchRationEstimate =
75*9880d681SAndroid Build Coastguard Worker (AluInstCount + AvailablesAluCount() + Pending[IDAlu].size()) /
76*9880d681SAndroid Build Coastguard Worker (FetchInstCount + Available[IDFetch].size());
77*9880d681SAndroid Build Coastguard Worker if (ALUFetchRationEstimate == 0) {
78*9880d681SAndroid Build Coastguard Worker AllowSwitchFromAlu = true;
79*9880d681SAndroid Build Coastguard Worker } else {
80*9880d681SAndroid Build Coastguard Worker unsigned NeededWF = 62.5f / ALUFetchRationEstimate;
81*9880d681SAndroid Build Coastguard Worker DEBUG( dbgs() << NeededWF << " approx. Wavefronts Required\n" );
82*9880d681SAndroid Build Coastguard Worker // We assume the local GPR requirements to be "dominated" by the requirement
83*9880d681SAndroid Build Coastguard Worker // of the TEX clause (which consumes 128 bits regs) ; ALU inst before and
84*9880d681SAndroid Build Coastguard Worker // after TEX are indeed likely to consume or generate values from/for the
85*9880d681SAndroid Build Coastguard Worker // TEX clause.
86*9880d681SAndroid Build Coastguard Worker // Available[IDFetch].size() * 2 : GPRs required in the Fetch clause
87*9880d681SAndroid Build Coastguard Worker // We assume that fetch instructions are either TnXYZW = TEX TnXYZW (need
88*9880d681SAndroid Build Coastguard Worker // one GPR) or TmXYZW = TnXYZW (need 2 GPR).
89*9880d681SAndroid Build Coastguard Worker // (TODO : use RegisterPressure)
90*9880d681SAndroid Build Coastguard Worker // If we are going too use too many GPR, we flush Fetch instruction to lower
91*9880d681SAndroid Build Coastguard Worker // register pressure on 128 bits regs.
92*9880d681SAndroid Build Coastguard Worker unsigned NearRegisterRequirement = 2 * Available[IDFetch].size();
93*9880d681SAndroid Build Coastguard Worker if (NeededWF > getWFCountLimitedByGPR(NearRegisterRequirement))
94*9880d681SAndroid Build Coastguard Worker AllowSwitchFromAlu = true;
95*9880d681SAndroid Build Coastguard Worker }
96*9880d681SAndroid Build Coastguard Worker }
97*9880d681SAndroid Build Coastguard Worker
98*9880d681SAndroid Build Coastguard Worker if (!SU && ((AllowSwitchToAlu && CurInstKind != IDAlu) ||
99*9880d681SAndroid Build Coastguard Worker (!AllowSwitchFromAlu && CurInstKind == IDAlu))) {
100*9880d681SAndroid Build Coastguard Worker // try to pick ALU
101*9880d681SAndroid Build Coastguard Worker SU = pickAlu();
102*9880d681SAndroid Build Coastguard Worker if (!SU && !PhysicalRegCopy.empty()) {
103*9880d681SAndroid Build Coastguard Worker SU = PhysicalRegCopy.front();
104*9880d681SAndroid Build Coastguard Worker PhysicalRegCopy.erase(PhysicalRegCopy.begin());
105*9880d681SAndroid Build Coastguard Worker }
106*9880d681SAndroid Build Coastguard Worker if (SU) {
107*9880d681SAndroid Build Coastguard Worker if (CurEmitted >= InstKindLimit[IDAlu])
108*9880d681SAndroid Build Coastguard Worker CurEmitted = 0;
109*9880d681SAndroid Build Coastguard Worker NextInstKind = IDAlu;
110*9880d681SAndroid Build Coastguard Worker }
111*9880d681SAndroid Build Coastguard Worker }
112*9880d681SAndroid Build Coastguard Worker
113*9880d681SAndroid Build Coastguard Worker if (!SU) {
114*9880d681SAndroid Build Coastguard Worker // try to pick FETCH
115*9880d681SAndroid Build Coastguard Worker SU = pickOther(IDFetch);
116*9880d681SAndroid Build Coastguard Worker if (SU)
117*9880d681SAndroid Build Coastguard Worker NextInstKind = IDFetch;
118*9880d681SAndroid Build Coastguard Worker }
119*9880d681SAndroid Build Coastguard Worker
120*9880d681SAndroid Build Coastguard Worker // try to pick other
121*9880d681SAndroid Build Coastguard Worker if (!SU) {
122*9880d681SAndroid Build Coastguard Worker SU = pickOther(IDOther);
123*9880d681SAndroid Build Coastguard Worker if (SU)
124*9880d681SAndroid Build Coastguard Worker NextInstKind = IDOther;
125*9880d681SAndroid Build Coastguard Worker }
126*9880d681SAndroid Build Coastguard Worker
127*9880d681SAndroid Build Coastguard Worker DEBUG(
128*9880d681SAndroid Build Coastguard Worker if (SU) {
129*9880d681SAndroid Build Coastguard Worker dbgs() << " ** Pick node **\n";
130*9880d681SAndroid Build Coastguard Worker SU->dump(DAG);
131*9880d681SAndroid Build Coastguard Worker } else {
132*9880d681SAndroid Build Coastguard Worker dbgs() << "NO NODE \n";
133*9880d681SAndroid Build Coastguard Worker for (unsigned i = 0; i < DAG->SUnits.size(); i++) {
134*9880d681SAndroid Build Coastguard Worker const SUnit &S = DAG->SUnits[i];
135*9880d681SAndroid Build Coastguard Worker if (!S.isScheduled)
136*9880d681SAndroid Build Coastguard Worker S.dump(DAG);
137*9880d681SAndroid Build Coastguard Worker }
138*9880d681SAndroid Build Coastguard Worker }
139*9880d681SAndroid Build Coastguard Worker );
140*9880d681SAndroid Build Coastguard Worker
141*9880d681SAndroid Build Coastguard Worker return SU;
142*9880d681SAndroid Build Coastguard Worker }
143*9880d681SAndroid Build Coastguard Worker
schedNode(SUnit * SU,bool IsTopNode)144*9880d681SAndroid Build Coastguard Worker void R600SchedStrategy::schedNode(SUnit *SU, bool IsTopNode) {
145*9880d681SAndroid Build Coastguard Worker if (NextInstKind != CurInstKind) {
146*9880d681SAndroid Build Coastguard Worker DEBUG(dbgs() << "Instruction Type Switch\n");
147*9880d681SAndroid Build Coastguard Worker if (NextInstKind != IDAlu)
148*9880d681SAndroid Build Coastguard Worker OccupedSlotsMask |= 31;
149*9880d681SAndroid Build Coastguard Worker CurEmitted = 0;
150*9880d681SAndroid Build Coastguard Worker CurInstKind = NextInstKind;
151*9880d681SAndroid Build Coastguard Worker }
152*9880d681SAndroid Build Coastguard Worker
153*9880d681SAndroid Build Coastguard Worker if (CurInstKind == IDAlu) {
154*9880d681SAndroid Build Coastguard Worker AluInstCount ++;
155*9880d681SAndroid Build Coastguard Worker switch (getAluKind(SU)) {
156*9880d681SAndroid Build Coastguard Worker case AluT_XYZW:
157*9880d681SAndroid Build Coastguard Worker CurEmitted += 4;
158*9880d681SAndroid Build Coastguard Worker break;
159*9880d681SAndroid Build Coastguard Worker case AluDiscarded:
160*9880d681SAndroid Build Coastguard Worker break;
161*9880d681SAndroid Build Coastguard Worker default: {
162*9880d681SAndroid Build Coastguard Worker ++CurEmitted;
163*9880d681SAndroid Build Coastguard Worker for (MachineInstr::mop_iterator It = SU->getInstr()->operands_begin(),
164*9880d681SAndroid Build Coastguard Worker E = SU->getInstr()->operands_end(); It != E; ++It) {
165*9880d681SAndroid Build Coastguard Worker MachineOperand &MO = *It;
166*9880d681SAndroid Build Coastguard Worker if (MO.isReg() && MO.getReg() == AMDGPU::ALU_LITERAL_X)
167*9880d681SAndroid Build Coastguard Worker ++CurEmitted;
168*9880d681SAndroid Build Coastguard Worker }
169*9880d681SAndroid Build Coastguard Worker }
170*9880d681SAndroid Build Coastguard Worker }
171*9880d681SAndroid Build Coastguard Worker } else {
172*9880d681SAndroid Build Coastguard Worker ++CurEmitted;
173*9880d681SAndroid Build Coastguard Worker }
174*9880d681SAndroid Build Coastguard Worker
175*9880d681SAndroid Build Coastguard Worker
176*9880d681SAndroid Build Coastguard Worker DEBUG(dbgs() << CurEmitted << " Instructions Emitted in this clause\n");
177*9880d681SAndroid Build Coastguard Worker
178*9880d681SAndroid Build Coastguard Worker if (CurInstKind != IDFetch) {
179*9880d681SAndroid Build Coastguard Worker MoveUnits(Pending[IDFetch], Available[IDFetch]);
180*9880d681SAndroid Build Coastguard Worker } else
181*9880d681SAndroid Build Coastguard Worker FetchInstCount++;
182*9880d681SAndroid Build Coastguard Worker }
183*9880d681SAndroid Build Coastguard Worker
184*9880d681SAndroid Build Coastguard Worker static bool
isPhysicalRegCopy(MachineInstr * MI)185*9880d681SAndroid Build Coastguard Worker isPhysicalRegCopy(MachineInstr *MI) {
186*9880d681SAndroid Build Coastguard Worker if (MI->getOpcode() != AMDGPU::COPY)
187*9880d681SAndroid Build Coastguard Worker return false;
188*9880d681SAndroid Build Coastguard Worker
189*9880d681SAndroid Build Coastguard Worker return !TargetRegisterInfo::isVirtualRegister(MI->getOperand(1).getReg());
190*9880d681SAndroid Build Coastguard Worker }
191*9880d681SAndroid Build Coastguard Worker
releaseTopNode(SUnit * SU)192*9880d681SAndroid Build Coastguard Worker void R600SchedStrategy::releaseTopNode(SUnit *SU) {
193*9880d681SAndroid Build Coastguard Worker DEBUG(dbgs() << "Top Releasing ";SU->dump(DAG););
194*9880d681SAndroid Build Coastguard Worker }
195*9880d681SAndroid Build Coastguard Worker
releaseBottomNode(SUnit * SU)196*9880d681SAndroid Build Coastguard Worker void R600SchedStrategy::releaseBottomNode(SUnit *SU) {
197*9880d681SAndroid Build Coastguard Worker DEBUG(dbgs() << "Bottom Releasing ";SU->dump(DAG););
198*9880d681SAndroid Build Coastguard Worker if (isPhysicalRegCopy(SU->getInstr())) {
199*9880d681SAndroid Build Coastguard Worker PhysicalRegCopy.push_back(SU);
200*9880d681SAndroid Build Coastguard Worker return;
201*9880d681SAndroid Build Coastguard Worker }
202*9880d681SAndroid Build Coastguard Worker
203*9880d681SAndroid Build Coastguard Worker int IK = getInstKind(SU);
204*9880d681SAndroid Build Coastguard Worker
205*9880d681SAndroid Build Coastguard Worker // There is no export clause, we can schedule one as soon as its ready
206*9880d681SAndroid Build Coastguard Worker if (IK == IDOther)
207*9880d681SAndroid Build Coastguard Worker Available[IDOther].push_back(SU);
208*9880d681SAndroid Build Coastguard Worker else
209*9880d681SAndroid Build Coastguard Worker Pending[IK].push_back(SU);
210*9880d681SAndroid Build Coastguard Worker
211*9880d681SAndroid Build Coastguard Worker }
212*9880d681SAndroid Build Coastguard Worker
regBelongsToClass(unsigned Reg,const TargetRegisterClass * RC) const213*9880d681SAndroid Build Coastguard Worker bool R600SchedStrategy::regBelongsToClass(unsigned Reg,
214*9880d681SAndroid Build Coastguard Worker const TargetRegisterClass *RC) const {
215*9880d681SAndroid Build Coastguard Worker if (!TargetRegisterInfo::isVirtualRegister(Reg)) {
216*9880d681SAndroid Build Coastguard Worker return RC->contains(Reg);
217*9880d681SAndroid Build Coastguard Worker } else {
218*9880d681SAndroid Build Coastguard Worker return MRI->getRegClass(Reg) == RC;
219*9880d681SAndroid Build Coastguard Worker }
220*9880d681SAndroid Build Coastguard Worker }
221*9880d681SAndroid Build Coastguard Worker
getAluKind(SUnit * SU) const222*9880d681SAndroid Build Coastguard Worker R600SchedStrategy::AluKind R600SchedStrategy::getAluKind(SUnit *SU) const {
223*9880d681SAndroid Build Coastguard Worker MachineInstr *MI = SU->getInstr();
224*9880d681SAndroid Build Coastguard Worker
225*9880d681SAndroid Build Coastguard Worker if (TII->isTransOnly(*MI))
226*9880d681SAndroid Build Coastguard Worker return AluTrans;
227*9880d681SAndroid Build Coastguard Worker
228*9880d681SAndroid Build Coastguard Worker switch (MI->getOpcode()) {
229*9880d681SAndroid Build Coastguard Worker case AMDGPU::PRED_X:
230*9880d681SAndroid Build Coastguard Worker return AluPredX;
231*9880d681SAndroid Build Coastguard Worker case AMDGPU::INTERP_PAIR_XY:
232*9880d681SAndroid Build Coastguard Worker case AMDGPU::INTERP_PAIR_ZW:
233*9880d681SAndroid Build Coastguard Worker case AMDGPU::INTERP_VEC_LOAD:
234*9880d681SAndroid Build Coastguard Worker case AMDGPU::DOT_4:
235*9880d681SAndroid Build Coastguard Worker return AluT_XYZW;
236*9880d681SAndroid Build Coastguard Worker case AMDGPU::COPY:
237*9880d681SAndroid Build Coastguard Worker if (MI->getOperand(1).isUndef()) {
238*9880d681SAndroid Build Coastguard Worker // MI will become a KILL, don't considers it in scheduling
239*9880d681SAndroid Build Coastguard Worker return AluDiscarded;
240*9880d681SAndroid Build Coastguard Worker }
241*9880d681SAndroid Build Coastguard Worker default:
242*9880d681SAndroid Build Coastguard Worker break;
243*9880d681SAndroid Build Coastguard Worker }
244*9880d681SAndroid Build Coastguard Worker
245*9880d681SAndroid Build Coastguard Worker // Does the instruction take a whole IG ?
246*9880d681SAndroid Build Coastguard Worker // XXX: Is it possible to add a helper function in R600InstrInfo that can
247*9880d681SAndroid Build Coastguard Worker // be used here and in R600PacketizerList::isSoloInstruction() ?
248*9880d681SAndroid Build Coastguard Worker if(TII->isVector(*MI) ||
249*9880d681SAndroid Build Coastguard Worker TII->isCubeOp(MI->getOpcode()) ||
250*9880d681SAndroid Build Coastguard Worker TII->isReductionOp(MI->getOpcode()) ||
251*9880d681SAndroid Build Coastguard Worker MI->getOpcode() == AMDGPU::GROUP_BARRIER) {
252*9880d681SAndroid Build Coastguard Worker return AluT_XYZW;
253*9880d681SAndroid Build Coastguard Worker }
254*9880d681SAndroid Build Coastguard Worker
255*9880d681SAndroid Build Coastguard Worker if (TII->isLDSInstr(MI->getOpcode())) {
256*9880d681SAndroid Build Coastguard Worker return AluT_X;
257*9880d681SAndroid Build Coastguard Worker }
258*9880d681SAndroid Build Coastguard Worker
259*9880d681SAndroid Build Coastguard Worker // Is the result already assigned to a channel ?
260*9880d681SAndroid Build Coastguard Worker unsigned DestSubReg = MI->getOperand(0).getSubReg();
261*9880d681SAndroid Build Coastguard Worker switch (DestSubReg) {
262*9880d681SAndroid Build Coastguard Worker case AMDGPU::sub0:
263*9880d681SAndroid Build Coastguard Worker return AluT_X;
264*9880d681SAndroid Build Coastguard Worker case AMDGPU::sub1:
265*9880d681SAndroid Build Coastguard Worker return AluT_Y;
266*9880d681SAndroid Build Coastguard Worker case AMDGPU::sub2:
267*9880d681SAndroid Build Coastguard Worker return AluT_Z;
268*9880d681SAndroid Build Coastguard Worker case AMDGPU::sub3:
269*9880d681SAndroid Build Coastguard Worker return AluT_W;
270*9880d681SAndroid Build Coastguard Worker default:
271*9880d681SAndroid Build Coastguard Worker break;
272*9880d681SAndroid Build Coastguard Worker }
273*9880d681SAndroid Build Coastguard Worker
274*9880d681SAndroid Build Coastguard Worker // Is the result already member of a X/Y/Z/W class ?
275*9880d681SAndroid Build Coastguard Worker unsigned DestReg = MI->getOperand(0).getReg();
276*9880d681SAndroid Build Coastguard Worker if (regBelongsToClass(DestReg, &AMDGPU::R600_TReg32_XRegClass) ||
277*9880d681SAndroid Build Coastguard Worker regBelongsToClass(DestReg, &AMDGPU::R600_AddrRegClass))
278*9880d681SAndroid Build Coastguard Worker return AluT_X;
279*9880d681SAndroid Build Coastguard Worker if (regBelongsToClass(DestReg, &AMDGPU::R600_TReg32_YRegClass))
280*9880d681SAndroid Build Coastguard Worker return AluT_Y;
281*9880d681SAndroid Build Coastguard Worker if (regBelongsToClass(DestReg, &AMDGPU::R600_TReg32_ZRegClass))
282*9880d681SAndroid Build Coastguard Worker return AluT_Z;
283*9880d681SAndroid Build Coastguard Worker if (regBelongsToClass(DestReg, &AMDGPU::R600_TReg32_WRegClass))
284*9880d681SAndroid Build Coastguard Worker return AluT_W;
285*9880d681SAndroid Build Coastguard Worker if (regBelongsToClass(DestReg, &AMDGPU::R600_Reg128RegClass))
286*9880d681SAndroid Build Coastguard Worker return AluT_XYZW;
287*9880d681SAndroid Build Coastguard Worker
288*9880d681SAndroid Build Coastguard Worker // LDS src registers cannot be used in the Trans slot.
289*9880d681SAndroid Build Coastguard Worker if (TII->readsLDSSrcReg(*MI))
290*9880d681SAndroid Build Coastguard Worker return AluT_XYZW;
291*9880d681SAndroid Build Coastguard Worker
292*9880d681SAndroid Build Coastguard Worker return AluAny;
293*9880d681SAndroid Build Coastguard Worker }
294*9880d681SAndroid Build Coastguard Worker
getInstKind(SUnit * SU)295*9880d681SAndroid Build Coastguard Worker int R600SchedStrategy::getInstKind(SUnit* SU) {
296*9880d681SAndroid Build Coastguard Worker int Opcode = SU->getInstr()->getOpcode();
297*9880d681SAndroid Build Coastguard Worker
298*9880d681SAndroid Build Coastguard Worker if (TII->usesTextureCache(Opcode) || TII->usesVertexCache(Opcode))
299*9880d681SAndroid Build Coastguard Worker return IDFetch;
300*9880d681SAndroid Build Coastguard Worker
301*9880d681SAndroid Build Coastguard Worker if (TII->isALUInstr(Opcode)) {
302*9880d681SAndroid Build Coastguard Worker return IDAlu;
303*9880d681SAndroid Build Coastguard Worker }
304*9880d681SAndroid Build Coastguard Worker
305*9880d681SAndroid Build Coastguard Worker switch (Opcode) {
306*9880d681SAndroid Build Coastguard Worker case AMDGPU::PRED_X:
307*9880d681SAndroid Build Coastguard Worker case AMDGPU::COPY:
308*9880d681SAndroid Build Coastguard Worker case AMDGPU::CONST_COPY:
309*9880d681SAndroid Build Coastguard Worker case AMDGPU::INTERP_PAIR_XY:
310*9880d681SAndroid Build Coastguard Worker case AMDGPU::INTERP_PAIR_ZW:
311*9880d681SAndroid Build Coastguard Worker case AMDGPU::INTERP_VEC_LOAD:
312*9880d681SAndroid Build Coastguard Worker case AMDGPU::DOT_4:
313*9880d681SAndroid Build Coastguard Worker return IDAlu;
314*9880d681SAndroid Build Coastguard Worker default:
315*9880d681SAndroid Build Coastguard Worker return IDOther;
316*9880d681SAndroid Build Coastguard Worker }
317*9880d681SAndroid Build Coastguard Worker }
318*9880d681SAndroid Build Coastguard Worker
PopInst(std::vector<SUnit * > & Q,bool AnyALU)319*9880d681SAndroid Build Coastguard Worker SUnit *R600SchedStrategy::PopInst(std::vector<SUnit *> &Q, bool AnyALU) {
320*9880d681SAndroid Build Coastguard Worker if (Q.empty())
321*9880d681SAndroid Build Coastguard Worker return nullptr;
322*9880d681SAndroid Build Coastguard Worker for (std::vector<SUnit *>::reverse_iterator It = Q.rbegin(), E = Q.rend();
323*9880d681SAndroid Build Coastguard Worker It != E; ++It) {
324*9880d681SAndroid Build Coastguard Worker SUnit *SU = *It;
325*9880d681SAndroid Build Coastguard Worker InstructionsGroupCandidate.push_back(SU->getInstr());
326*9880d681SAndroid Build Coastguard Worker if (TII->fitsConstReadLimitations(InstructionsGroupCandidate) &&
327*9880d681SAndroid Build Coastguard Worker (!AnyALU || !TII->isVectorOnly(*SU->getInstr()))) {
328*9880d681SAndroid Build Coastguard Worker InstructionsGroupCandidate.pop_back();
329*9880d681SAndroid Build Coastguard Worker Q.erase((It + 1).base());
330*9880d681SAndroid Build Coastguard Worker return SU;
331*9880d681SAndroid Build Coastguard Worker } else {
332*9880d681SAndroid Build Coastguard Worker InstructionsGroupCandidate.pop_back();
333*9880d681SAndroid Build Coastguard Worker }
334*9880d681SAndroid Build Coastguard Worker }
335*9880d681SAndroid Build Coastguard Worker return nullptr;
336*9880d681SAndroid Build Coastguard Worker }
337*9880d681SAndroid Build Coastguard Worker
LoadAlu()338*9880d681SAndroid Build Coastguard Worker void R600SchedStrategy::LoadAlu() {
339*9880d681SAndroid Build Coastguard Worker std::vector<SUnit *> &QSrc = Pending[IDAlu];
340*9880d681SAndroid Build Coastguard Worker for (unsigned i = 0, e = QSrc.size(); i < e; ++i) {
341*9880d681SAndroid Build Coastguard Worker AluKind AK = getAluKind(QSrc[i]);
342*9880d681SAndroid Build Coastguard Worker AvailableAlus[AK].push_back(QSrc[i]);
343*9880d681SAndroid Build Coastguard Worker }
344*9880d681SAndroid Build Coastguard Worker QSrc.clear();
345*9880d681SAndroid Build Coastguard Worker }
346*9880d681SAndroid Build Coastguard Worker
PrepareNextSlot()347*9880d681SAndroid Build Coastguard Worker void R600SchedStrategy::PrepareNextSlot() {
348*9880d681SAndroid Build Coastguard Worker DEBUG(dbgs() << "New Slot\n");
349*9880d681SAndroid Build Coastguard Worker assert (OccupedSlotsMask && "Slot wasn't filled");
350*9880d681SAndroid Build Coastguard Worker OccupedSlotsMask = 0;
351*9880d681SAndroid Build Coastguard Worker // if (HwGen == R600Subtarget::NORTHERN_ISLANDS)
352*9880d681SAndroid Build Coastguard Worker // OccupedSlotsMask |= 16;
353*9880d681SAndroid Build Coastguard Worker InstructionsGroupCandidate.clear();
354*9880d681SAndroid Build Coastguard Worker LoadAlu();
355*9880d681SAndroid Build Coastguard Worker }
356*9880d681SAndroid Build Coastguard Worker
AssignSlot(MachineInstr * MI,unsigned Slot)357*9880d681SAndroid Build Coastguard Worker void R600SchedStrategy::AssignSlot(MachineInstr* MI, unsigned Slot) {
358*9880d681SAndroid Build Coastguard Worker int DstIndex = TII->getOperandIdx(MI->getOpcode(), AMDGPU::OpName::dst);
359*9880d681SAndroid Build Coastguard Worker if (DstIndex == -1) {
360*9880d681SAndroid Build Coastguard Worker return;
361*9880d681SAndroid Build Coastguard Worker }
362*9880d681SAndroid Build Coastguard Worker unsigned DestReg = MI->getOperand(DstIndex).getReg();
363*9880d681SAndroid Build Coastguard Worker // PressureRegister crashes if an operand is def and used in the same inst
364*9880d681SAndroid Build Coastguard Worker // and we try to constraint its regclass
365*9880d681SAndroid Build Coastguard Worker for (MachineInstr::mop_iterator It = MI->operands_begin(),
366*9880d681SAndroid Build Coastguard Worker E = MI->operands_end(); It != E; ++It) {
367*9880d681SAndroid Build Coastguard Worker MachineOperand &MO = *It;
368*9880d681SAndroid Build Coastguard Worker if (MO.isReg() && !MO.isDef() &&
369*9880d681SAndroid Build Coastguard Worker MO.getReg() == DestReg)
370*9880d681SAndroid Build Coastguard Worker return;
371*9880d681SAndroid Build Coastguard Worker }
372*9880d681SAndroid Build Coastguard Worker // Constrains the regclass of DestReg to assign it to Slot
373*9880d681SAndroid Build Coastguard Worker switch (Slot) {
374*9880d681SAndroid Build Coastguard Worker case 0:
375*9880d681SAndroid Build Coastguard Worker MRI->constrainRegClass(DestReg, &AMDGPU::R600_TReg32_XRegClass);
376*9880d681SAndroid Build Coastguard Worker break;
377*9880d681SAndroid Build Coastguard Worker case 1:
378*9880d681SAndroid Build Coastguard Worker MRI->constrainRegClass(DestReg, &AMDGPU::R600_TReg32_YRegClass);
379*9880d681SAndroid Build Coastguard Worker break;
380*9880d681SAndroid Build Coastguard Worker case 2:
381*9880d681SAndroid Build Coastguard Worker MRI->constrainRegClass(DestReg, &AMDGPU::R600_TReg32_ZRegClass);
382*9880d681SAndroid Build Coastguard Worker break;
383*9880d681SAndroid Build Coastguard Worker case 3:
384*9880d681SAndroid Build Coastguard Worker MRI->constrainRegClass(DestReg, &AMDGPU::R600_TReg32_WRegClass);
385*9880d681SAndroid Build Coastguard Worker break;
386*9880d681SAndroid Build Coastguard Worker }
387*9880d681SAndroid Build Coastguard Worker }
388*9880d681SAndroid Build Coastguard Worker
AttemptFillSlot(unsigned Slot,bool AnyAlu)389*9880d681SAndroid Build Coastguard Worker SUnit *R600SchedStrategy::AttemptFillSlot(unsigned Slot, bool AnyAlu) {
390*9880d681SAndroid Build Coastguard Worker static const AluKind IndexToID[] = {AluT_X, AluT_Y, AluT_Z, AluT_W};
391*9880d681SAndroid Build Coastguard Worker SUnit *SlotedSU = PopInst(AvailableAlus[IndexToID[Slot]], AnyAlu);
392*9880d681SAndroid Build Coastguard Worker if (SlotedSU)
393*9880d681SAndroid Build Coastguard Worker return SlotedSU;
394*9880d681SAndroid Build Coastguard Worker SUnit *UnslotedSU = PopInst(AvailableAlus[AluAny], AnyAlu);
395*9880d681SAndroid Build Coastguard Worker if (UnslotedSU)
396*9880d681SAndroid Build Coastguard Worker AssignSlot(UnslotedSU->getInstr(), Slot);
397*9880d681SAndroid Build Coastguard Worker return UnslotedSU;
398*9880d681SAndroid Build Coastguard Worker }
399*9880d681SAndroid Build Coastguard Worker
AvailablesAluCount() const400*9880d681SAndroid Build Coastguard Worker unsigned R600SchedStrategy::AvailablesAluCount() const {
401*9880d681SAndroid Build Coastguard Worker return AvailableAlus[AluAny].size() + AvailableAlus[AluT_XYZW].size() +
402*9880d681SAndroid Build Coastguard Worker AvailableAlus[AluT_X].size() + AvailableAlus[AluT_Y].size() +
403*9880d681SAndroid Build Coastguard Worker AvailableAlus[AluT_Z].size() + AvailableAlus[AluT_W].size() +
404*9880d681SAndroid Build Coastguard Worker AvailableAlus[AluTrans].size() + AvailableAlus[AluDiscarded].size() +
405*9880d681SAndroid Build Coastguard Worker AvailableAlus[AluPredX].size();
406*9880d681SAndroid Build Coastguard Worker }
407*9880d681SAndroid Build Coastguard Worker
pickAlu()408*9880d681SAndroid Build Coastguard Worker SUnit* R600SchedStrategy::pickAlu() {
409*9880d681SAndroid Build Coastguard Worker while (AvailablesAluCount() || !Pending[IDAlu].empty()) {
410*9880d681SAndroid Build Coastguard Worker if (!OccupedSlotsMask) {
411*9880d681SAndroid Build Coastguard Worker // Bottom up scheduling : predX must comes first
412*9880d681SAndroid Build Coastguard Worker if (!AvailableAlus[AluPredX].empty()) {
413*9880d681SAndroid Build Coastguard Worker OccupedSlotsMask |= 31;
414*9880d681SAndroid Build Coastguard Worker return PopInst(AvailableAlus[AluPredX], false);
415*9880d681SAndroid Build Coastguard Worker }
416*9880d681SAndroid Build Coastguard Worker // Flush physical reg copies (RA will discard them)
417*9880d681SAndroid Build Coastguard Worker if (!AvailableAlus[AluDiscarded].empty()) {
418*9880d681SAndroid Build Coastguard Worker OccupedSlotsMask |= 31;
419*9880d681SAndroid Build Coastguard Worker return PopInst(AvailableAlus[AluDiscarded], false);
420*9880d681SAndroid Build Coastguard Worker }
421*9880d681SAndroid Build Coastguard Worker // If there is a T_XYZW alu available, use it
422*9880d681SAndroid Build Coastguard Worker if (!AvailableAlus[AluT_XYZW].empty()) {
423*9880d681SAndroid Build Coastguard Worker OccupedSlotsMask |= 15;
424*9880d681SAndroid Build Coastguard Worker return PopInst(AvailableAlus[AluT_XYZW], false);
425*9880d681SAndroid Build Coastguard Worker }
426*9880d681SAndroid Build Coastguard Worker }
427*9880d681SAndroid Build Coastguard Worker bool TransSlotOccuped = OccupedSlotsMask & 16;
428*9880d681SAndroid Build Coastguard Worker if (!TransSlotOccuped && VLIW5) {
429*9880d681SAndroid Build Coastguard Worker if (!AvailableAlus[AluTrans].empty()) {
430*9880d681SAndroid Build Coastguard Worker OccupedSlotsMask |= 16;
431*9880d681SAndroid Build Coastguard Worker return PopInst(AvailableAlus[AluTrans], false);
432*9880d681SAndroid Build Coastguard Worker }
433*9880d681SAndroid Build Coastguard Worker SUnit *SU = AttemptFillSlot(3, true);
434*9880d681SAndroid Build Coastguard Worker if (SU) {
435*9880d681SAndroid Build Coastguard Worker OccupedSlotsMask |= 16;
436*9880d681SAndroid Build Coastguard Worker return SU;
437*9880d681SAndroid Build Coastguard Worker }
438*9880d681SAndroid Build Coastguard Worker }
439*9880d681SAndroid Build Coastguard Worker for (int Chan = 3; Chan > -1; --Chan) {
440*9880d681SAndroid Build Coastguard Worker bool isOccupied = OccupedSlotsMask & (1 << Chan);
441*9880d681SAndroid Build Coastguard Worker if (!isOccupied) {
442*9880d681SAndroid Build Coastguard Worker SUnit *SU = AttemptFillSlot(Chan, false);
443*9880d681SAndroid Build Coastguard Worker if (SU) {
444*9880d681SAndroid Build Coastguard Worker OccupedSlotsMask |= (1 << Chan);
445*9880d681SAndroid Build Coastguard Worker InstructionsGroupCandidate.push_back(SU->getInstr());
446*9880d681SAndroid Build Coastguard Worker return SU;
447*9880d681SAndroid Build Coastguard Worker }
448*9880d681SAndroid Build Coastguard Worker }
449*9880d681SAndroid Build Coastguard Worker }
450*9880d681SAndroid Build Coastguard Worker PrepareNextSlot();
451*9880d681SAndroid Build Coastguard Worker }
452*9880d681SAndroid Build Coastguard Worker return nullptr;
453*9880d681SAndroid Build Coastguard Worker }
454*9880d681SAndroid Build Coastguard Worker
pickOther(int QID)455*9880d681SAndroid Build Coastguard Worker SUnit* R600SchedStrategy::pickOther(int QID) {
456*9880d681SAndroid Build Coastguard Worker SUnit *SU = nullptr;
457*9880d681SAndroid Build Coastguard Worker std::vector<SUnit *> &AQ = Available[QID];
458*9880d681SAndroid Build Coastguard Worker
459*9880d681SAndroid Build Coastguard Worker if (AQ.empty()) {
460*9880d681SAndroid Build Coastguard Worker MoveUnits(Pending[QID], AQ);
461*9880d681SAndroid Build Coastguard Worker }
462*9880d681SAndroid Build Coastguard Worker if (!AQ.empty()) {
463*9880d681SAndroid Build Coastguard Worker SU = AQ.back();
464*9880d681SAndroid Build Coastguard Worker AQ.resize(AQ.size() - 1);
465*9880d681SAndroid Build Coastguard Worker }
466*9880d681SAndroid Build Coastguard Worker return SU;
467*9880d681SAndroid Build Coastguard Worker }
468