// xref: /XiangShan/src/main/scala/xiangshan/backend/Backend.scala (revision 8a1d27c4ec2c33952123718593e9478190b50880)
1package xiangshan.backend
2
3import bus.simplebus.SimpleBusUC
4import chisel3._
5import chisel3.util._
6import chisel3.util.experimental.BoringUtils
7import noop.MemMMUIO
8import xiangshan._
9import xiangshan.backend.decode.{DecodeBuffer, DecodeStage}
10import xiangshan.backend.rename.Rename
11import xiangshan.backend.brq.Brq
12import xiangshan.backend.dispatch.Dispatch
13import xiangshan.backend.exu._
14import xiangshan.backend.fu.FunctionUnit
15import xiangshan.backend.issue.{IssueQueue, ReservationStation}
16import xiangshan.backend.regfile.{Regfile, RfWritePort}
17import xiangshan.backend.roq.Roq
18import xiangshan.mem._
19import utils.ParallelOR
20
/** Backend Pipeline:
  * Decode -> Rename -> Dispatch-1 -> Dispatch-2 -> Issue -> Exe
  *
  * Top level of the backend. It instantiates the decode, rename, dispatch,
  * issue, execute and write-back modules together with the ROQ, the BRQ and
  * the register files, and wires them to the frontend (`io.frontend`) and to
  * the memory pipeline (`io.mem`).
  *
  * Statement order matters in several places below because of Chisel's
  * last-connect semantics; those places are commented.
  */
class Backend extends XSModule
  with NeedImpl {
  val io = IO(new Bundle {
    // val dmem = new SimpleBusUC(addrBits = VAddrBits)
    // NOTE(review): memMMU is not referenced anywhere else in this class;
    // presumably NeedImpl covers ports that are left unconnected -- confirm.
    val memMMU = Flipped(new MemMMUIO)
    val frontend = Flipped(new FrontendToBackendIO)
    val mem = Flipped(new MemToBackendIO)
  })


  // Execution units instantiated inside the backend. Load/store results do not
  // come from here; they arrive through io.mem.ldout / io.mem.stout.
  val aluExeUnits = Array.tabulate(exuParameters.AluCnt)(_ => Module(new AluExeUnit))
  val jmpExeUnit = Module(new JmpExeUnit)
  val mulExeUnits = Array.tabulate(exuParameters.MulCnt)(_ => Module(new MulExeUnit))
  val mduExeUnits = Array.tabulate(exuParameters.MduCnt)(_ => Module(new MulDivExeUnit))
  // val fmacExeUnits = Array.tabulate(exuParameters.FmacCnt)(_ => Module(new Fmac))
  // val fmiscExeUnits = Array.tabulate(exuParameters.FmiscCnt)(_ => Module(new Fmisc))
  // val fmiscDivSqrtExeUnits = Array.tabulate(exuParameters.FmiscDivSqrtCnt)(_ => Module(new FmiscDivSqrt))

  // Order: jump unit first, then ALUs, multipliers, mul/div units. The position
  // in this sequence is also the index used for the dispatch ports below.
  val exeUnits = jmpExeUnit +: (aluExeUnits ++ mulExeUnits ++ mduExeUnits)
  // Defaults only. jmpExeUnit.io.exception gets a real driver further down;
  // that later connection overrides this DontCare (last connect wins).
  exeUnits.foreach(_.io.exception := DontCare)
  exeUnits.foreach(_.io.dmem := DontCare)
  exeUnits.foreach(_.io.mcommit := DontCare)

  val decode = Module(new DecodeStage)
  val brq = Module(new Brq)
  val decBuf = Module(new DecodeBuffer)
  val rename = Module(new Rename)
  val dispatch = Module(new Dispatch())
  val roq = Module(new Roq)
  // `numWirtePorts` (sic) is the parameter name as spelled by Regfile.
  val intRf = Module(new Regfile(
    numReadPorts = NRIntReadPorts,
    numWirtePorts = NRIntWritePorts,
    hasZero = true
  ))
  val fpRf = Module(new Regfile(
    numReadPorts = NRFpReadPorts,
    numWirtePorts = NRFpWritePorts,
    hasZero = false
  ))
  // Separate register file read by the load/store issue queues. It receives
  // the same write ports as intRf (see `intRfWrite` below).
  val memRf = Module(new Regfile(
    numReadPorts = 2*exuParameters.StuCnt + exuParameters.LduCnt,
    numWirtePorts = NRIntWritePorts,
    hasZero = true,
    isMemRf = true
  ))

  // backend redirect, flush pipeline
  // Priority: ROQ redirect, then BRQ redirect, otherwise the memory replay.
  val redirect = Mux(
    roq.io.redirect.valid,
    roq.io.redirect,
    Mux(
      brq.io.redirect.valid,
      brq.io.redirect,
      io.mem.replayAll
    )
  )

  io.frontend.redirect := redirect
  // Must stay after the bulk assignment above: it overrides only `valid`, so
  // that a redirect flagged as a replay is not reported to the frontend.
  io.frontend.redirect.valid := redirect.valid && !redirect.bits.isReplay

  // Configurations of the load and store units, loads first.
  val memConfigs =
    Seq.fill(exuParameters.LduCnt)(Exu.ldExeUnitCfg) ++
    Seq.fill(exuParameters.StuCnt)(Exu.stExeUnitCfg)

  // All unit configurations: backend execution units followed by memory units.
  val exuConfigs = exeUnits.map(_.config) ++ memConfigs

  // Write-back requests in the same order as `exuConfigs`; the two sequences
  // are zipped below.
  // NOTE(review): this pairing assumes io.mem.ldout / io.mem.stout hold
  // LduCnt / StuCnt entries respectively -- confirm against MemToBackendIO.
  val exeWbReqs = exeUnits.map(_.io.out) ++ io.mem.ldout ++ io.mem.stout

  /** True when `cfg` both reads and writes the integer register file, or both
    * reads and writes the floating-point register file.
    *
    * Not called anywhere in this class.
    */
  def needWakeup(cfg: ExuConfig): Boolean =
    (cfg.readIntRf && cfg.writeIntRf) || (cfg.readFpRf && cfg.writeFpRf)

  /** True when consumer `a` reads a register file (int or fp) that producer
    * `b` writes.
    */
  def needData(a: ExuConfig, b: ExuConfig): Boolean =
    (a.readIntRf && b.writeIntRf) || (a.readFpRf && b.writeFpRf)

  // One reservation station per backend execution unit. `i` is the unit's
  // position in `exeUnits` and selects the matching dispatch ports.
  val reservedStations = exeUnits.
    zipWithIndex.
    map({ case (exu, i) =>

      val cfg = exu.config

      // Write-back ports of every unit whose result this unit may consume.
      val wakeUpDataVec = exuConfigs.zip(exeWbReqs).filter(x => needData(cfg, x._1)).map(_._2)
      // Number of those producers that have bypassing enabled.
      val bypassCnt = exuConfigs.count(c => c.enableBypass && needData(cfg, c))

      println(s"exu:${cfg.name} wakeupCnt:${wakeUpDataVec.length} bypassCnt:$bypassCnt")

      // NOTE(review): the meaning of the trailing `false` is defined by
      // ReservationStation's constructor, which is not visible here.
      val rs = Module(new ReservationStation(
        cfg, wakeUpDataVec.length, bypassCnt, cfg.enableBypass, false
      ))
      rs.io.redirect <> redirect
      rs.io.numExist <> dispatch.io.numExist(i)
      rs.io.enqCtrl <> dispatch.io.enqIQCtrl(i)
      rs.io.enqData <> dispatch.io.enqIQData(i)
      // Wake-up uses the raw `valid` of the producer here (the issue queues
      // below use `fire()` instead).
      for ((wakeUpPort, exuOut) <- rs.io.wakeUpPorts.zip(wakeUpDataVec)) {
        wakeUpPort.bits := exuOut.bits
        wakeUpPort.valid := exuOut.valid
      }

      exu.io.in <> rs.io.deq
      exu.io.redirect <> redirect
      rs
    })

  // Bypass wiring is done in a second pass because it needs the
  // `selectedUop` outputs of all reservation stations.
  for (rs <- reservedStations) {
    rs.io.bypassUops <> reservedStations.
      filter(x => x.enableBypass && needData(rs.exuCfg, x.exuCfg)).
      map(_.io.selectedUop)

    val bypassDataVec = exuConfigs.zip(exeWbReqs).
      filter(x => x._1.enableBypass && needData(rs.exuCfg, x._1)).map(_._2)

    // Fail with a readable message instead of an IndexOutOfBoundsException
    // if there are more bypass producers than bypass data ports.
    require(
      bypassDataVec.length <= rs.io.bypassData.length,
      s"exu:${rs.exuCfg.name} has ${bypassDataVec.length} bypass producers " +
        s"but only ${rs.io.bypassData.length} bypassData ports"
    )
    for (i <- bypassDataVec.indices) {
      rs.io.bypassData(i).valid := bypassDataVec(i).valid
      rs.io.bypassData(i).bits := bypassDataVec(i).bits
    }
  }

  // One issue queue per load/store unit. The memory configs are the last
  // LduCnt + StuCnt entries of `exuConfigs`; `i` is the index into the full
  // `exuConfigs` sequence, not an index among the memory units.
  val issueQueues = exuConfigs.
    zipWithIndex.
    takeRight(exuParameters.LduCnt + exuParameters.StuCnt).
    map({case (cfg, i) =>
      val wakeUpDataVec = exuConfigs.zip(exeWbReqs).filter(x => needData(cfg, x._1)).map(_._2)
      // Bypassed uops can only come from reservation stations; bypassed data
      // is selected from all write-back ports with the same predicate.
      val bypassUopVec = reservedStations.
        filter(r => r.exuCfg.enableBypass && needData(cfg, r.exuCfg)).map(_.io.selectedUop)
      val bypassDataVec = exuConfigs.zip(exeWbReqs).
        filter(x => x._1.enableBypass && needData(cfg, x._1)).map(_._2)

      val iq = Module(new IssueQueue(
        cfg, wakeUpDataVec.length, bypassUopVec.length
      ))
      println(s"exu:${cfg.name} wakeupCnt:${wakeUpDataVec.length} bypassCnt:${bypassUopVec.length}")
      iq.io.redirect <> redirect
      // NOTE(review): this index presumably maps `i` to a 0-based position
      // among the memory units, which requires exuParameters.ExuCnt to equal
      // exuConfigs.length -- confirm.
      iq.io.tlbFeedback := io.mem.tlbFeedback(i - exuParameters.ExuCnt + exuParameters.LduCnt + exuParameters.StuCnt)
      iq.io.enq <> dispatch.io.enqIQCtrl(i)
      dispatch.io.numExist(i) := iq.io.numExist
      for ((wakeUpPort, exuOut) <- iq.io.wakeUpPorts.zip(wakeUpDataVec)) {
        wakeUpPort.bits := exuOut.bits
        wakeUpPort.valid := exuOut.fire() // data after arbit
      }
      iq.io.bypassUops <> bypassUopVec

      // Fail with a readable message instead of an IndexOutOfBoundsException
      // if there are more bypass producers than bypass data ports.
      require(
        bypassDataVec.length <= iq.io.bypassData.length,
        s"exu:${cfg.name} has ${bypassDataVec.length} bypass producers " +
          s"but only ${iq.io.bypassData.length} bypassData ports"
      )
      // `j` (not `i`) so the exuConfigs index above is not shadowed.
      for (j <- bypassDataVec.indices) {
        iq.io.bypassData(j).valid := bypassDataVec(j).valid
        iq.io.bypassData(j).bits := bypassDataVec(j).bits
      }
      iq
    })

  io.mem.mcommit := roq.io.mcommit
  // Issue queues are routed to the load or store inputs by their config.
  io.mem.ldin <> issueQueues.filter(_.exuCfg == Exu.ldExeUnitCfg).map(_.io.deq)
  io.mem.stin <> issueQueues.filter(_.exuCfg == Exu.stExeUnitCfg).map(_.io.deq)
  // Overrides the DontCare default given to every execution unit above.
  jmpExeUnit.io.exception.valid := roq.io.redirect.valid
  jmpExeUnit.io.exception.bits := roq.io.exception

  io.frontend.outOfOrderBrInfo <> brq.io.outOfOrderBrInfo
  io.frontend.inOrderBrInfo <> brq.io.inOrderBrInfo

  decode.io.in <> io.frontend.cfVec
  brq.io.roqRedirect <> roq.io.redirect
  brq.io.memRedirect <> io.mem.replayAll
  brq.io.bcommit := roq.io.bcommit
  brq.io.enqReqs <> decode.io.toBrq
  // Only units whose config has `hasRedirect` feed the BRQ, and only when the
  // fired output carries a valid redirect.
  // NOTE(review): zip truncates silently; this assumes brq.io.exuRedirect has
  // exactly one port per redirect-capable unit -- confirm.
  for ((x, y) <- brq.io.exuRedirect.zip(exeUnits.filter(_.config.hasRedirect))) {
    x.bits := y.io.out.bits
    x.valid := y.io.out.fire() && y.io.out.bits.redirectValid
  }
  decode.io.brTags <> brq.io.brTags
  decBuf.io.isWalking := ParallelOR(roq.io.commits.map(c => c.valid && c.bits.isWalk)) // TODO: opt this
  decBuf.io.redirect <> redirect
  decBuf.io.in <> decode.io.out

  rename.io.redirect <> redirect
  rename.io.roqCommits <> roq.io.commits
  rename.io.in <> decBuf.io.out
  // `++` binds tighter than `<>`; the parentheses only make that explicit.
  rename.io.intRfReadAddr <> (dispatch.io.readIntRf.map(_.addr) ++ dispatch.io.intMemRegAddr)
  rename.io.intPregRdy <> (dispatch.io.intPregRdy ++ dispatch.io.intMemRegRdy)
  rename.io.fpRfReadAddr <> (dispatch.io.readFpRf.map(_.addr) ++ dispatch.io.fpMemRegAddr)
  rename.io.fpPregRdy <> (dispatch.io.fpPregRdy ++ dispatch.io.fpMemRegRdy)
  dispatch.io.redirect <> redirect
  dispatch.io.fromRename <> rename.io.out

  roq.io.brqRedirect <> brq.io.redirect
  roq.io.dp1Req <> dispatch.io.toRoq
  dispatch.io.roqIdxs <> roq.io.roqIdxs
  io.mem.dp1Req <> dispatch.io.toMoq
  dispatch.io.moqIdxs <> io.mem.moqIdxs
  dispatch.io.commits <> roq.io.commits

  // Register-file read ports: dispatch reads intRf and fpRf; the memory issue
  // queues read memRf for integer operands and share fpRf for fp operands.
  intRf.io.readPorts <> dispatch.io.readIntRf
  fpRf.io.readPorts <> (dispatch.io.readFpRf ++ issueQueues.flatMap(_.io.readFpRf))
  memRf.io.readPorts <> issueQueues.flatMap(_.io.readIntRf)

  io.mem.redirect <> redirect

  // Write-back unit: takes every write-back request and produces the
  // integer, floating-point and ROQ result streams.
  val wbu = Module(new Wbu(exuConfigs))
  wbu.io.in <> exeWbReqs

  val wbIntResults = wbu.io.toIntRf
  val wbFpResults = wbu.io.toFpRf

  /** Converts a write-back result into a register-file write port.
    *
    * @param x write-back result; its `valid` becomes the write enable
    * @return a new wire writing `x.bits.data` to physical register `x.bits.uop.pdest`
    */
  def exuOutToRfWrite(x: Valid[ExuOutput]): RfWritePort = {
    val rfWrite = Wire(new RfWritePort)
    rfWrite.wen := x.valid
    rfWrite.addr := x.bits.uop.pdest
    rfWrite.data := x.bits.data
    rfWrite
  }
  // The same integer write ports drive both intRf and memRf.
  val intRfWrite = wbIntResults.map(exuOutToRfWrite)
  intRf.io.writePorts <> intRfWrite
  memRf.io.writePorts <> intRfWrite
  fpRf.io.writePorts <> wbFpResults.map(exuOutToRfWrite)

  rename.io.wbIntResults <> wbIntResults
  rename.io.wbFpResults <> wbFpResults

  // The first exeWbReqs.length ROQ result ports come from the write-back
  // unit; the last port is driven by the BRQ.
  roq.io.exeWbResults.take(exeWbReqs.length).zip(wbu.io.toRoq).foreach {
    case (roqPort, wbResult) => roqPort := wbResult
  }
  roq.io.exeWbResults.last := brq.io.out


  // TODO: Remove sink and source
  // Every name below is attached as a BoringUtils sink to the same throw-away
  // wire; presumably this only exists so that sources declared elsewhere have
  // a matching sink -- confirm before removing.
  val tmp = WireInit(0.U)
  val sinks = Array[String](
    "DTLBFINISH",
    "DTLBPF",
    "DTLBENABLE",
    "perfCntCondMdcacheLoss",
    "perfCntCondMl2cacheLoss",
    "perfCntCondMdcacheHit",
    "lsuMMIO",
    "perfCntCondMl2cacheHit",
    "perfCntCondMl2cacheReq",
    "mtip",
    "perfCntCondMdcacheReq",
    "meip"
  )
  for (s <- sinks) {
    BoringUtils.addSink(tmp, s)
  }

  // Debug view of the architectural registers: 32 integer entries followed by
  // 32 floating-point entries, each XLEN bits wide and defaulting to zero.
  val debugIntReg, debugFpReg = WireInit(VecInit(Seq.fill(32)(0.U(XLEN.W))))
  BoringUtils.addSink(debugIntReg, "DEBUG_INT_ARCH_REG")
  BoringUtils.addSink(debugFpReg, "DEBUG_FP_ARCH_REG")
  val debugArchReg = WireInit(VecInit(debugIntReg ++ debugFpReg))
  // The combined vector is only exported when not building for FPGA.
  if (!env.FPGAPlatform) {
    BoringUtils.addSource(debugArchReg, "difftestRegs")
  }

}
275