xref: /aosp_15_r20/external/llvm/lib/Target/AArch64/AArch64PBQPRegAlloc.cpp (revision 9880d6810fe72a1726cb53787c6711e909410d58)
1*9880d681SAndroid Build Coastguard Worker //===-- AArch64PBQPRegAlloc.cpp - AArch64 specific PBQP constraints -------===//
2*9880d681SAndroid Build Coastguard Worker //
3*9880d681SAndroid Build Coastguard Worker //                     The LLVM Compiler Infrastructure
4*9880d681SAndroid Build Coastguard Worker //
5*9880d681SAndroid Build Coastguard Worker // This file is distributed under the University of Illinois Open Source
6*9880d681SAndroid Build Coastguard Worker // License. See LICENSE.TXT for details.
7*9880d681SAndroid Build Coastguard Worker //
8*9880d681SAndroid Build Coastguard Worker //===----------------------------------------------------------------------===//
9*9880d681SAndroid Build Coastguard Worker // This file contains the AArch64 / Cortex-A57 specific register allocation
10*9880d681SAndroid Build Coastguard Worker // constraints for use by the PBQP register allocator.
11*9880d681SAndroid Build Coastguard Worker //
12*9880d681SAndroid Build Coastguard Worker // It is essentially a transcription of what is contained in
13*9880d681SAndroid Build Coastguard Worker // AArch64A57FPLoadBalancing, which tries to use a balanced
14*9880d681SAndroid Build Coastguard Worker // mix of odd and even D-registers when performing a critical sequence of
15*9880d681SAndroid Build Coastguard Worker // independent, non-quadword FP/ASIMD floating-point multiply-accumulates.
16*9880d681SAndroid Build Coastguard Worker //===----------------------------------------------------------------------===//
17*9880d681SAndroid Build Coastguard Worker 
18*9880d681SAndroid Build Coastguard Worker #define DEBUG_TYPE "aarch64-pbqp"
19*9880d681SAndroid Build Coastguard Worker 
20*9880d681SAndroid Build Coastguard Worker #include "AArch64.h"
21*9880d681SAndroid Build Coastguard Worker #include "AArch64PBQPRegAlloc.h"
22*9880d681SAndroid Build Coastguard Worker #include "AArch64RegisterInfo.h"
23*9880d681SAndroid Build Coastguard Worker #include "llvm/CodeGen/LiveIntervalAnalysis.h"
24*9880d681SAndroid Build Coastguard Worker #include "llvm/CodeGen/MachineBasicBlock.h"
25*9880d681SAndroid Build Coastguard Worker #include "llvm/CodeGen/MachineFunction.h"
26*9880d681SAndroid Build Coastguard Worker #include "llvm/CodeGen/MachineRegisterInfo.h"
27*9880d681SAndroid Build Coastguard Worker #include "llvm/CodeGen/RegAllocPBQP.h"
28*9880d681SAndroid Build Coastguard Worker #include "llvm/Support/Debug.h"
29*9880d681SAndroid Build Coastguard Worker #include "llvm/Support/ErrorHandling.h"
30*9880d681SAndroid Build Coastguard Worker #include "llvm/Support/raw_ostream.h"
31*9880d681SAndroid Build Coastguard Worker 
32*9880d681SAndroid Build Coastguard Worker using namespace llvm;
33*9880d681SAndroid Build Coastguard Worker 
34*9880d681SAndroid Build Coastguard Worker namespace {
35*9880d681SAndroid Build Coastguard Worker 
36*9880d681SAndroid Build Coastguard Worker #ifndef NDEBUG
isFPReg(unsigned reg)37*9880d681SAndroid Build Coastguard Worker bool isFPReg(unsigned reg) {
38*9880d681SAndroid Build Coastguard Worker   return AArch64::FPR32RegClass.contains(reg) ||
39*9880d681SAndroid Build Coastguard Worker          AArch64::FPR64RegClass.contains(reg) ||
40*9880d681SAndroid Build Coastguard Worker          AArch64::FPR128RegClass.contains(reg);
41*9880d681SAndroid Build Coastguard Worker }
42*9880d681SAndroid Build Coastguard Worker #endif
43*9880d681SAndroid Build Coastguard Worker 
isOdd(unsigned reg)44*9880d681SAndroid Build Coastguard Worker bool isOdd(unsigned reg) {
45*9880d681SAndroid Build Coastguard Worker   switch (reg) {
46*9880d681SAndroid Build Coastguard Worker   default:
47*9880d681SAndroid Build Coastguard Worker     llvm_unreachable("Register is not from the expected class !");
48*9880d681SAndroid Build Coastguard Worker   case AArch64::S1:
49*9880d681SAndroid Build Coastguard Worker   case AArch64::S3:
50*9880d681SAndroid Build Coastguard Worker   case AArch64::S5:
51*9880d681SAndroid Build Coastguard Worker   case AArch64::S7:
52*9880d681SAndroid Build Coastguard Worker   case AArch64::S9:
53*9880d681SAndroid Build Coastguard Worker   case AArch64::S11:
54*9880d681SAndroid Build Coastguard Worker   case AArch64::S13:
55*9880d681SAndroid Build Coastguard Worker   case AArch64::S15:
56*9880d681SAndroid Build Coastguard Worker   case AArch64::S17:
57*9880d681SAndroid Build Coastguard Worker   case AArch64::S19:
58*9880d681SAndroid Build Coastguard Worker   case AArch64::S21:
59*9880d681SAndroid Build Coastguard Worker   case AArch64::S23:
60*9880d681SAndroid Build Coastguard Worker   case AArch64::S25:
61*9880d681SAndroid Build Coastguard Worker   case AArch64::S27:
62*9880d681SAndroid Build Coastguard Worker   case AArch64::S29:
63*9880d681SAndroid Build Coastguard Worker   case AArch64::S31:
64*9880d681SAndroid Build Coastguard Worker   case AArch64::D1:
65*9880d681SAndroid Build Coastguard Worker   case AArch64::D3:
66*9880d681SAndroid Build Coastguard Worker   case AArch64::D5:
67*9880d681SAndroid Build Coastguard Worker   case AArch64::D7:
68*9880d681SAndroid Build Coastguard Worker   case AArch64::D9:
69*9880d681SAndroid Build Coastguard Worker   case AArch64::D11:
70*9880d681SAndroid Build Coastguard Worker   case AArch64::D13:
71*9880d681SAndroid Build Coastguard Worker   case AArch64::D15:
72*9880d681SAndroid Build Coastguard Worker   case AArch64::D17:
73*9880d681SAndroid Build Coastguard Worker   case AArch64::D19:
74*9880d681SAndroid Build Coastguard Worker   case AArch64::D21:
75*9880d681SAndroid Build Coastguard Worker   case AArch64::D23:
76*9880d681SAndroid Build Coastguard Worker   case AArch64::D25:
77*9880d681SAndroid Build Coastguard Worker   case AArch64::D27:
78*9880d681SAndroid Build Coastguard Worker   case AArch64::D29:
79*9880d681SAndroid Build Coastguard Worker   case AArch64::D31:
80*9880d681SAndroid Build Coastguard Worker   case AArch64::Q1:
81*9880d681SAndroid Build Coastguard Worker   case AArch64::Q3:
82*9880d681SAndroid Build Coastguard Worker   case AArch64::Q5:
83*9880d681SAndroid Build Coastguard Worker   case AArch64::Q7:
84*9880d681SAndroid Build Coastguard Worker   case AArch64::Q9:
85*9880d681SAndroid Build Coastguard Worker   case AArch64::Q11:
86*9880d681SAndroid Build Coastguard Worker   case AArch64::Q13:
87*9880d681SAndroid Build Coastguard Worker   case AArch64::Q15:
88*9880d681SAndroid Build Coastguard Worker   case AArch64::Q17:
89*9880d681SAndroid Build Coastguard Worker   case AArch64::Q19:
90*9880d681SAndroid Build Coastguard Worker   case AArch64::Q21:
91*9880d681SAndroid Build Coastguard Worker   case AArch64::Q23:
92*9880d681SAndroid Build Coastguard Worker   case AArch64::Q25:
93*9880d681SAndroid Build Coastguard Worker   case AArch64::Q27:
94*9880d681SAndroid Build Coastguard Worker   case AArch64::Q29:
95*9880d681SAndroid Build Coastguard Worker   case AArch64::Q31:
96*9880d681SAndroid Build Coastguard Worker     return true;
97*9880d681SAndroid Build Coastguard Worker   case AArch64::S0:
98*9880d681SAndroid Build Coastguard Worker   case AArch64::S2:
99*9880d681SAndroid Build Coastguard Worker   case AArch64::S4:
100*9880d681SAndroid Build Coastguard Worker   case AArch64::S6:
101*9880d681SAndroid Build Coastguard Worker   case AArch64::S8:
102*9880d681SAndroid Build Coastguard Worker   case AArch64::S10:
103*9880d681SAndroid Build Coastguard Worker   case AArch64::S12:
104*9880d681SAndroid Build Coastguard Worker   case AArch64::S14:
105*9880d681SAndroid Build Coastguard Worker   case AArch64::S16:
106*9880d681SAndroid Build Coastguard Worker   case AArch64::S18:
107*9880d681SAndroid Build Coastguard Worker   case AArch64::S20:
108*9880d681SAndroid Build Coastguard Worker   case AArch64::S22:
109*9880d681SAndroid Build Coastguard Worker   case AArch64::S24:
110*9880d681SAndroid Build Coastguard Worker   case AArch64::S26:
111*9880d681SAndroid Build Coastguard Worker   case AArch64::S28:
112*9880d681SAndroid Build Coastguard Worker   case AArch64::S30:
113*9880d681SAndroid Build Coastguard Worker   case AArch64::D0:
114*9880d681SAndroid Build Coastguard Worker   case AArch64::D2:
115*9880d681SAndroid Build Coastguard Worker   case AArch64::D4:
116*9880d681SAndroid Build Coastguard Worker   case AArch64::D6:
117*9880d681SAndroid Build Coastguard Worker   case AArch64::D8:
118*9880d681SAndroid Build Coastguard Worker   case AArch64::D10:
119*9880d681SAndroid Build Coastguard Worker   case AArch64::D12:
120*9880d681SAndroid Build Coastguard Worker   case AArch64::D14:
121*9880d681SAndroid Build Coastguard Worker   case AArch64::D16:
122*9880d681SAndroid Build Coastguard Worker   case AArch64::D18:
123*9880d681SAndroid Build Coastguard Worker   case AArch64::D20:
124*9880d681SAndroid Build Coastguard Worker   case AArch64::D22:
125*9880d681SAndroid Build Coastguard Worker   case AArch64::D24:
126*9880d681SAndroid Build Coastguard Worker   case AArch64::D26:
127*9880d681SAndroid Build Coastguard Worker   case AArch64::D28:
128*9880d681SAndroid Build Coastguard Worker   case AArch64::D30:
129*9880d681SAndroid Build Coastguard Worker   case AArch64::Q0:
130*9880d681SAndroid Build Coastguard Worker   case AArch64::Q2:
131*9880d681SAndroid Build Coastguard Worker   case AArch64::Q4:
132*9880d681SAndroid Build Coastguard Worker   case AArch64::Q6:
133*9880d681SAndroid Build Coastguard Worker   case AArch64::Q8:
134*9880d681SAndroid Build Coastguard Worker   case AArch64::Q10:
135*9880d681SAndroid Build Coastguard Worker   case AArch64::Q12:
136*9880d681SAndroid Build Coastguard Worker   case AArch64::Q14:
137*9880d681SAndroid Build Coastguard Worker   case AArch64::Q16:
138*9880d681SAndroid Build Coastguard Worker   case AArch64::Q18:
139*9880d681SAndroid Build Coastguard Worker   case AArch64::Q20:
140*9880d681SAndroid Build Coastguard Worker   case AArch64::Q22:
141*9880d681SAndroid Build Coastguard Worker   case AArch64::Q24:
142*9880d681SAndroid Build Coastguard Worker   case AArch64::Q26:
143*9880d681SAndroid Build Coastguard Worker   case AArch64::Q28:
144*9880d681SAndroid Build Coastguard Worker   case AArch64::Q30:
145*9880d681SAndroid Build Coastguard Worker     return false;
146*9880d681SAndroid Build Coastguard Worker 
147*9880d681SAndroid Build Coastguard Worker   }
148*9880d681SAndroid Build Coastguard Worker }
149*9880d681SAndroid Build Coastguard Worker 
haveSameParity(unsigned reg1,unsigned reg2)150*9880d681SAndroid Build Coastguard Worker bool haveSameParity(unsigned reg1, unsigned reg2) {
151*9880d681SAndroid Build Coastguard Worker   assert(isFPReg(reg1) && "Expecting an FP register for reg1");
152*9880d681SAndroid Build Coastguard Worker   assert(isFPReg(reg2) && "Expecting an FP register for reg2");
153*9880d681SAndroid Build Coastguard Worker 
154*9880d681SAndroid Build Coastguard Worker   return isOdd(reg1) == isOdd(reg2);
155*9880d681SAndroid Build Coastguard Worker }
156*9880d681SAndroid Build Coastguard Worker 
157*9880d681SAndroid Build Coastguard Worker }
158*9880d681SAndroid Build Coastguard Worker 
addIntraChainConstraint(PBQPRAGraph & G,unsigned Rd,unsigned Ra)159*9880d681SAndroid Build Coastguard Worker bool A57ChainingConstraint::addIntraChainConstraint(PBQPRAGraph &G, unsigned Rd,
160*9880d681SAndroid Build Coastguard Worker                                                  unsigned Ra) {
161*9880d681SAndroid Build Coastguard Worker   if (Rd == Ra)
162*9880d681SAndroid Build Coastguard Worker     return false;
163*9880d681SAndroid Build Coastguard Worker 
164*9880d681SAndroid Build Coastguard Worker   LiveIntervals &LIs = G.getMetadata().LIS;
165*9880d681SAndroid Build Coastguard Worker 
166*9880d681SAndroid Build Coastguard Worker   if (TRI->isPhysicalRegister(Rd) || TRI->isPhysicalRegister(Ra)) {
167*9880d681SAndroid Build Coastguard Worker     DEBUG(dbgs() << "Rd is a physical reg:" << TRI->isPhysicalRegister(Rd)
168*9880d681SAndroid Build Coastguard Worker           << '\n');
169*9880d681SAndroid Build Coastguard Worker     DEBUG(dbgs() << "Ra is a physical reg:" << TRI->isPhysicalRegister(Ra)
170*9880d681SAndroid Build Coastguard Worker           << '\n');
171*9880d681SAndroid Build Coastguard Worker     return false;
172*9880d681SAndroid Build Coastguard Worker   }
173*9880d681SAndroid Build Coastguard Worker 
174*9880d681SAndroid Build Coastguard Worker   PBQPRAGraph::NodeId node1 = G.getMetadata().getNodeIdForVReg(Rd);
175*9880d681SAndroid Build Coastguard Worker   PBQPRAGraph::NodeId node2 = G.getMetadata().getNodeIdForVReg(Ra);
176*9880d681SAndroid Build Coastguard Worker 
177*9880d681SAndroid Build Coastguard Worker   const PBQPRAGraph::NodeMetadata::AllowedRegVector *vRdAllowed =
178*9880d681SAndroid Build Coastguard Worker     &G.getNodeMetadata(node1).getAllowedRegs();
179*9880d681SAndroid Build Coastguard Worker   const PBQPRAGraph::NodeMetadata::AllowedRegVector *vRaAllowed =
180*9880d681SAndroid Build Coastguard Worker     &G.getNodeMetadata(node2).getAllowedRegs();
181*9880d681SAndroid Build Coastguard Worker 
182*9880d681SAndroid Build Coastguard Worker   PBQPRAGraph::EdgeId edge = G.findEdge(node1, node2);
183*9880d681SAndroid Build Coastguard Worker 
184*9880d681SAndroid Build Coastguard Worker   // The edge does not exist. Create one with the appropriate interference
185*9880d681SAndroid Build Coastguard Worker   // costs.
186*9880d681SAndroid Build Coastguard Worker   if (edge == G.invalidEdgeId()) {
187*9880d681SAndroid Build Coastguard Worker     const LiveInterval &ld = LIs.getInterval(Rd);
188*9880d681SAndroid Build Coastguard Worker     const LiveInterval &la = LIs.getInterval(Ra);
189*9880d681SAndroid Build Coastguard Worker     bool livesOverlap = ld.overlaps(la);
190*9880d681SAndroid Build Coastguard Worker 
191*9880d681SAndroid Build Coastguard Worker     PBQPRAGraph::RawMatrix costs(vRdAllowed->size() + 1,
192*9880d681SAndroid Build Coastguard Worker                                  vRaAllowed->size() + 1, 0);
193*9880d681SAndroid Build Coastguard Worker     for (unsigned i = 0, ie = vRdAllowed->size(); i != ie; ++i) {
194*9880d681SAndroid Build Coastguard Worker       unsigned pRd = (*vRdAllowed)[i];
195*9880d681SAndroid Build Coastguard Worker       for (unsigned j = 0, je = vRaAllowed->size(); j != je; ++j) {
196*9880d681SAndroid Build Coastguard Worker         unsigned pRa = (*vRaAllowed)[j];
197*9880d681SAndroid Build Coastguard Worker         if (livesOverlap && TRI->regsOverlap(pRd, pRa))
198*9880d681SAndroid Build Coastguard Worker           costs[i + 1][j + 1] = std::numeric_limits<PBQP::PBQPNum>::infinity();
199*9880d681SAndroid Build Coastguard Worker         else
200*9880d681SAndroid Build Coastguard Worker           costs[i + 1][j + 1] = haveSameParity(pRd, pRa) ? 0.0 : 1.0;
201*9880d681SAndroid Build Coastguard Worker       }
202*9880d681SAndroid Build Coastguard Worker     }
203*9880d681SAndroid Build Coastguard Worker     G.addEdge(node1, node2, std::move(costs));
204*9880d681SAndroid Build Coastguard Worker     return true;
205*9880d681SAndroid Build Coastguard Worker   }
206*9880d681SAndroid Build Coastguard Worker 
207*9880d681SAndroid Build Coastguard Worker   if (G.getEdgeNode1Id(edge) == node2) {
208*9880d681SAndroid Build Coastguard Worker     std::swap(node1, node2);
209*9880d681SAndroid Build Coastguard Worker     std::swap(vRdAllowed, vRaAllowed);
210*9880d681SAndroid Build Coastguard Worker   }
211*9880d681SAndroid Build Coastguard Worker 
212*9880d681SAndroid Build Coastguard Worker   // Enforce minCost(sameParity(RaClass)) > maxCost(otherParity(RdClass))
213*9880d681SAndroid Build Coastguard Worker   PBQPRAGraph::RawMatrix costs(G.getEdgeCosts(edge));
214*9880d681SAndroid Build Coastguard Worker   for (unsigned i = 0, ie = vRdAllowed->size(); i != ie; ++i) {
215*9880d681SAndroid Build Coastguard Worker     unsigned pRd = (*vRdAllowed)[i];
216*9880d681SAndroid Build Coastguard Worker 
217*9880d681SAndroid Build Coastguard Worker     // Get the maximum cost (excluding unallocatable reg) for same parity
218*9880d681SAndroid Build Coastguard Worker     // registers
219*9880d681SAndroid Build Coastguard Worker     PBQP::PBQPNum sameParityMax = std::numeric_limits<PBQP::PBQPNum>::min();
220*9880d681SAndroid Build Coastguard Worker     for (unsigned j = 0, je = vRaAllowed->size(); j != je; ++j) {
221*9880d681SAndroid Build Coastguard Worker       unsigned pRa = (*vRaAllowed)[j];
222*9880d681SAndroid Build Coastguard Worker       if (haveSameParity(pRd, pRa))
223*9880d681SAndroid Build Coastguard Worker         if (costs[i + 1][j + 1] !=
224*9880d681SAndroid Build Coastguard Worker                 std::numeric_limits<PBQP::PBQPNum>::infinity() &&
225*9880d681SAndroid Build Coastguard Worker             costs[i + 1][j + 1] > sameParityMax)
226*9880d681SAndroid Build Coastguard Worker           sameParityMax = costs[i + 1][j + 1];
227*9880d681SAndroid Build Coastguard Worker     }
228*9880d681SAndroid Build Coastguard Worker 
229*9880d681SAndroid Build Coastguard Worker     // Ensure all registers with a different parity have a higher cost
230*9880d681SAndroid Build Coastguard Worker     // than sameParityMax
231*9880d681SAndroid Build Coastguard Worker     for (unsigned j = 0, je = vRaAllowed->size(); j != je; ++j) {
232*9880d681SAndroid Build Coastguard Worker       unsigned pRa = (*vRaAllowed)[j];
233*9880d681SAndroid Build Coastguard Worker       if (!haveSameParity(pRd, pRa))
234*9880d681SAndroid Build Coastguard Worker         if (sameParityMax > costs[i + 1][j + 1])
235*9880d681SAndroid Build Coastguard Worker           costs[i + 1][j + 1] = sameParityMax + 1.0;
236*9880d681SAndroid Build Coastguard Worker     }
237*9880d681SAndroid Build Coastguard Worker   }
238*9880d681SAndroid Build Coastguard Worker   G.updateEdgeCosts(edge, std::move(costs));
239*9880d681SAndroid Build Coastguard Worker 
240*9880d681SAndroid Build Coastguard Worker   return true;
241*9880d681SAndroid Build Coastguard Worker }
242*9880d681SAndroid Build Coastguard Worker 
addInterChainConstraint(PBQPRAGraph & G,unsigned Rd,unsigned Ra)243*9880d681SAndroid Build Coastguard Worker void A57ChainingConstraint::addInterChainConstraint(PBQPRAGraph &G, unsigned Rd,
244*9880d681SAndroid Build Coastguard Worker                                                  unsigned Ra) {
245*9880d681SAndroid Build Coastguard Worker   LiveIntervals &LIs = G.getMetadata().LIS;
246*9880d681SAndroid Build Coastguard Worker 
247*9880d681SAndroid Build Coastguard Worker   // Do some Chain management
248*9880d681SAndroid Build Coastguard Worker   if (Chains.count(Ra)) {
249*9880d681SAndroid Build Coastguard Worker     if (Rd != Ra) {
250*9880d681SAndroid Build Coastguard Worker       DEBUG(dbgs() << "Moving acc chain from " << PrintReg(Ra, TRI) << " to "
251*9880d681SAndroid Build Coastguard Worker                    << PrintReg(Rd, TRI) << '\n';);
252*9880d681SAndroid Build Coastguard Worker       Chains.remove(Ra);
253*9880d681SAndroid Build Coastguard Worker       Chains.insert(Rd);
254*9880d681SAndroid Build Coastguard Worker     }
255*9880d681SAndroid Build Coastguard Worker   } else {
256*9880d681SAndroid Build Coastguard Worker     DEBUG(dbgs() << "Creating new acc chain for " << PrintReg(Rd, TRI)
257*9880d681SAndroid Build Coastguard Worker                  << '\n';);
258*9880d681SAndroid Build Coastguard Worker     Chains.insert(Rd);
259*9880d681SAndroid Build Coastguard Worker   }
260*9880d681SAndroid Build Coastguard Worker 
261*9880d681SAndroid Build Coastguard Worker   PBQPRAGraph::NodeId node1 = G.getMetadata().getNodeIdForVReg(Rd);
262*9880d681SAndroid Build Coastguard Worker 
263*9880d681SAndroid Build Coastguard Worker   const LiveInterval &ld = LIs.getInterval(Rd);
264*9880d681SAndroid Build Coastguard Worker   for (auto r : Chains) {
265*9880d681SAndroid Build Coastguard Worker     // Skip self
266*9880d681SAndroid Build Coastguard Worker     if (r == Rd)
267*9880d681SAndroid Build Coastguard Worker       continue;
268*9880d681SAndroid Build Coastguard Worker 
269*9880d681SAndroid Build Coastguard Worker     const LiveInterval &lr = LIs.getInterval(r);
270*9880d681SAndroid Build Coastguard Worker     if (ld.overlaps(lr)) {
271*9880d681SAndroid Build Coastguard Worker       const PBQPRAGraph::NodeMetadata::AllowedRegVector *vRdAllowed =
272*9880d681SAndroid Build Coastguard Worker         &G.getNodeMetadata(node1).getAllowedRegs();
273*9880d681SAndroid Build Coastguard Worker 
274*9880d681SAndroid Build Coastguard Worker       PBQPRAGraph::NodeId node2 = G.getMetadata().getNodeIdForVReg(r);
275*9880d681SAndroid Build Coastguard Worker       const PBQPRAGraph::NodeMetadata::AllowedRegVector *vRrAllowed =
276*9880d681SAndroid Build Coastguard Worker         &G.getNodeMetadata(node2).getAllowedRegs();
277*9880d681SAndroid Build Coastguard Worker 
278*9880d681SAndroid Build Coastguard Worker       PBQPRAGraph::EdgeId edge = G.findEdge(node1, node2);
279*9880d681SAndroid Build Coastguard Worker       assert(edge != G.invalidEdgeId() &&
280*9880d681SAndroid Build Coastguard Worker              "PBQP error ! The edge should exist !");
281*9880d681SAndroid Build Coastguard Worker 
282*9880d681SAndroid Build Coastguard Worker       DEBUG(dbgs() << "Refining constraint !\n";);
283*9880d681SAndroid Build Coastguard Worker 
284*9880d681SAndroid Build Coastguard Worker       if (G.getEdgeNode1Id(edge) == node2) {
285*9880d681SAndroid Build Coastguard Worker         std::swap(node1, node2);
286*9880d681SAndroid Build Coastguard Worker         std::swap(vRdAllowed, vRrAllowed);
287*9880d681SAndroid Build Coastguard Worker       }
288*9880d681SAndroid Build Coastguard Worker 
289*9880d681SAndroid Build Coastguard Worker       // Enforce that cost is higher with all other Chains of the same parity
290*9880d681SAndroid Build Coastguard Worker       PBQP::Matrix costs(G.getEdgeCosts(edge));
291*9880d681SAndroid Build Coastguard Worker       for (unsigned i = 0, ie = vRdAllowed->size(); i != ie; ++i) {
292*9880d681SAndroid Build Coastguard Worker         unsigned pRd = (*vRdAllowed)[i];
293*9880d681SAndroid Build Coastguard Worker 
294*9880d681SAndroid Build Coastguard Worker         // Get the maximum cost (excluding unallocatable reg) for all other
295*9880d681SAndroid Build Coastguard Worker         // parity registers
296*9880d681SAndroid Build Coastguard Worker         PBQP::PBQPNum sameParityMax = std::numeric_limits<PBQP::PBQPNum>::min();
297*9880d681SAndroid Build Coastguard Worker         for (unsigned j = 0, je = vRrAllowed->size(); j != je; ++j) {
298*9880d681SAndroid Build Coastguard Worker           unsigned pRa = (*vRrAllowed)[j];
299*9880d681SAndroid Build Coastguard Worker           if (!haveSameParity(pRd, pRa))
300*9880d681SAndroid Build Coastguard Worker             if (costs[i + 1][j + 1] !=
301*9880d681SAndroid Build Coastguard Worker                     std::numeric_limits<PBQP::PBQPNum>::infinity() &&
302*9880d681SAndroid Build Coastguard Worker                 costs[i + 1][j + 1] > sameParityMax)
303*9880d681SAndroid Build Coastguard Worker               sameParityMax = costs[i + 1][j + 1];
304*9880d681SAndroid Build Coastguard Worker         }
305*9880d681SAndroid Build Coastguard Worker 
306*9880d681SAndroid Build Coastguard Worker         // Ensure all registers with same parity have a higher cost
307*9880d681SAndroid Build Coastguard Worker         // than sameParityMax
308*9880d681SAndroid Build Coastguard Worker         for (unsigned j = 0, je = vRrAllowed->size(); j != je; ++j) {
309*9880d681SAndroid Build Coastguard Worker           unsigned pRa = (*vRrAllowed)[j];
310*9880d681SAndroid Build Coastguard Worker           if (haveSameParity(pRd, pRa))
311*9880d681SAndroid Build Coastguard Worker             if (sameParityMax > costs[i + 1][j + 1])
312*9880d681SAndroid Build Coastguard Worker               costs[i + 1][j + 1] = sameParityMax + 1.0;
313*9880d681SAndroid Build Coastguard Worker         }
314*9880d681SAndroid Build Coastguard Worker       }
315*9880d681SAndroid Build Coastguard Worker       G.updateEdgeCosts(edge, std::move(costs));
316*9880d681SAndroid Build Coastguard Worker     }
317*9880d681SAndroid Build Coastguard Worker   }
318*9880d681SAndroid Build Coastguard Worker }
319*9880d681SAndroid Build Coastguard Worker 
regJustKilledBefore(const LiveIntervals & LIs,unsigned reg,const MachineInstr & MI)320*9880d681SAndroid Build Coastguard Worker static bool regJustKilledBefore(const LiveIntervals &LIs, unsigned reg,
321*9880d681SAndroid Build Coastguard Worker                                 const MachineInstr &MI) {
322*9880d681SAndroid Build Coastguard Worker   const LiveInterval &LI = LIs.getInterval(reg);
323*9880d681SAndroid Build Coastguard Worker   SlotIndex SI = LIs.getInstructionIndex(MI);
324*9880d681SAndroid Build Coastguard Worker   return LI.expiredAt(SI);
325*9880d681SAndroid Build Coastguard Worker }
326*9880d681SAndroid Build Coastguard Worker 
apply(PBQPRAGraph & G)327*9880d681SAndroid Build Coastguard Worker void A57ChainingConstraint::apply(PBQPRAGraph &G) {
328*9880d681SAndroid Build Coastguard Worker   const MachineFunction &MF = G.getMetadata().MF;
329*9880d681SAndroid Build Coastguard Worker   LiveIntervals &LIs = G.getMetadata().LIS;
330*9880d681SAndroid Build Coastguard Worker 
331*9880d681SAndroid Build Coastguard Worker   TRI = MF.getSubtarget().getRegisterInfo();
332*9880d681SAndroid Build Coastguard Worker   DEBUG(MF.dump());
333*9880d681SAndroid Build Coastguard Worker 
334*9880d681SAndroid Build Coastguard Worker   for (const auto &MBB: MF) {
335*9880d681SAndroid Build Coastguard Worker     Chains.clear(); // FIXME: really needed ? Could not work at MF level ?
336*9880d681SAndroid Build Coastguard Worker 
337*9880d681SAndroid Build Coastguard Worker     for (const auto &MI: MBB) {
338*9880d681SAndroid Build Coastguard Worker 
339*9880d681SAndroid Build Coastguard Worker       // Forget Chains which have expired
340*9880d681SAndroid Build Coastguard Worker       for (auto r : Chains) {
341*9880d681SAndroid Build Coastguard Worker         SmallVector<unsigned, 8> toDel;
342*9880d681SAndroid Build Coastguard Worker         if(regJustKilledBefore(LIs, r, MI)) {
343*9880d681SAndroid Build Coastguard Worker           DEBUG(dbgs() << "Killing chain " << PrintReg(r, TRI) << " at ";
344*9880d681SAndroid Build Coastguard Worker                 MI.print(dbgs()););
345*9880d681SAndroid Build Coastguard Worker           toDel.push_back(r);
346*9880d681SAndroid Build Coastguard Worker         }
347*9880d681SAndroid Build Coastguard Worker 
348*9880d681SAndroid Build Coastguard Worker         while (!toDel.empty()) {
349*9880d681SAndroid Build Coastguard Worker           Chains.remove(toDel.back());
350*9880d681SAndroid Build Coastguard Worker           toDel.pop_back();
351*9880d681SAndroid Build Coastguard Worker         }
352*9880d681SAndroid Build Coastguard Worker       }
353*9880d681SAndroid Build Coastguard Worker 
354*9880d681SAndroid Build Coastguard Worker       switch (MI.getOpcode()) {
355*9880d681SAndroid Build Coastguard Worker       case AArch64::FMSUBSrrr:
356*9880d681SAndroid Build Coastguard Worker       case AArch64::FMADDSrrr:
357*9880d681SAndroid Build Coastguard Worker       case AArch64::FNMSUBSrrr:
358*9880d681SAndroid Build Coastguard Worker       case AArch64::FNMADDSrrr:
359*9880d681SAndroid Build Coastguard Worker       case AArch64::FMSUBDrrr:
360*9880d681SAndroid Build Coastguard Worker       case AArch64::FMADDDrrr:
361*9880d681SAndroid Build Coastguard Worker       case AArch64::FNMSUBDrrr:
362*9880d681SAndroid Build Coastguard Worker       case AArch64::FNMADDDrrr: {
363*9880d681SAndroid Build Coastguard Worker         unsigned Rd = MI.getOperand(0).getReg();
364*9880d681SAndroid Build Coastguard Worker         unsigned Ra = MI.getOperand(3).getReg();
365*9880d681SAndroid Build Coastguard Worker 
366*9880d681SAndroid Build Coastguard Worker         if (addIntraChainConstraint(G, Rd, Ra))
367*9880d681SAndroid Build Coastguard Worker           addInterChainConstraint(G, Rd, Ra);
368*9880d681SAndroid Build Coastguard Worker         break;
369*9880d681SAndroid Build Coastguard Worker       }
370*9880d681SAndroid Build Coastguard Worker 
371*9880d681SAndroid Build Coastguard Worker       case AArch64::FMLAv2f32:
372*9880d681SAndroid Build Coastguard Worker       case AArch64::FMLSv2f32: {
373*9880d681SAndroid Build Coastguard Worker         unsigned Rd = MI.getOperand(0).getReg();
374*9880d681SAndroid Build Coastguard Worker         addInterChainConstraint(G, Rd, Rd);
375*9880d681SAndroid Build Coastguard Worker         break;
376*9880d681SAndroid Build Coastguard Worker       }
377*9880d681SAndroid Build Coastguard Worker 
378*9880d681SAndroid Build Coastguard Worker       default:
379*9880d681SAndroid Build Coastguard Worker         break;
380*9880d681SAndroid Build Coastguard Worker       }
381*9880d681SAndroid Build Coastguard Worker     }
382*9880d681SAndroid Build Coastguard Worker   }
383*9880d681SAndroid Build Coastguard Worker }
384