xref: /XiangShan/src/main/scala/xiangshan/backend/CtrlBlock.scala (revision faf3cfa90dfe63bff51eb0b3139b22f3762be300)
18921b337SYinan Xupackage xiangshan.backend
28921b337SYinan Xu
38921b337SYinan Xuimport chisel3._
48921b337SYinan Xuimport chisel3.util._
521732575SYinan Xuimport utils._
68921b337SYinan Xuimport xiangshan._
7b424051cSYinan Xuimport xiangshan.backend.decode.DecodeStage
88926ac22SLinJiaweiimport xiangshan.backend.rename.{BusyTable, Rename}
98921b337SYinan Xuimport xiangshan.backend.dispatch.Dispatch
108921b337SYinan Xuimport xiangshan.backend.exu._
11694b0180SLinJiaweiimport xiangshan.backend.exu.Exu.exuConfigs
12884dbb3bSLinJiaweiimport xiangshan.backend.ftq.{Ftq, FtqRead, GetPcByFtq}
138921b337SYinan Xuimport xiangshan.backend.regfile.RfReadPort
148926ac22SLinJiaweiimport xiangshan.backend.roq.{Roq, RoqCSRIO, RoqPtr}
15780ade3fSYinan Xuimport xiangshan.mem.LsqEnqIO
168921b337SYinan Xu
178921b337SYinan Xuclass CtrlToIntBlockIO extends XSBundle {
188921b337SYinan Xu  val enqIqCtrl = Vec(exuParameters.IntExuCnt, DecoupledIO(new MicroOp))
19ebd10a1fSYinan Xu  val readRf = Vec(NRIntReadPorts, Flipped(new RfReadPort(XLEN)))
208926ac22SLinJiawei  val jumpPc = Output(UInt(VAddrBits.W))
2182f87dffSYikeZhou  // int block only uses port 0~7
2282f87dffSYikeZhou  val readPortIndex = Vec(exuParameters.IntExuCnt, Output(UInt(log2Ceil(8 / 2).W))) // TODO parameterize 8 here
2366bcc42fSYinan Xu  val redirect = ValidIO(new Redirect)
248921b337SYinan Xu}
258921b337SYinan Xu
268921b337SYinan Xuclass CtrlToFpBlockIO extends XSBundle {
278921b337SYinan Xu  val enqIqCtrl = Vec(exuParameters.FpExuCnt, DecoupledIO(new MicroOp))
28ebd10a1fSYinan Xu  val readRf = Vec(NRFpReadPorts, Flipped(new RfReadPort(XLEN + 1)))
2982f87dffSYikeZhou  // fp block uses port 0~11
3082f87dffSYikeZhou  val readPortIndex = Vec(exuParameters.FpExuCnt, Output(UInt(log2Ceil((NRFpReadPorts - exuParameters.StuCnt) / 3).W)))
3166bcc42fSYinan Xu  val redirect = ValidIO(new Redirect)
328921b337SYinan Xu}
338921b337SYinan Xu
348921b337SYinan Xuclass CtrlToLsBlockIO extends XSBundle {
358921b337SYinan Xu  val enqIqCtrl = Vec(exuParameters.LsExuCnt, DecoupledIO(new MicroOp))
36780ade3fSYinan Xu  val enqLsq = Flipped(new LsqEnqIO)
3766bcc42fSYinan Xu  val redirect = ValidIO(new Redirect)
388921b337SYinan Xu}
398921b337SYinan Xu
40*faf3cfa9SLinJiaweiclass RedirectGenerator extends XSModule with HasCircularQueuePtrHelper {
41884dbb3bSLinJiawei  val io = IO(new Bundle() {
42884dbb3bSLinJiawei    val loadRelay = Flipped(ValidIO(new Redirect))
43884dbb3bSLinJiawei    val exuMispredict = Vec(exuParameters.JmpCnt + exuParameters.AluCnt, Flipped(ValidIO(new ExuOutput)))
44884dbb3bSLinJiawei    val roqRedirect = Flipped(ValidIO(new Redirect))
4536d7aed5SLinJiawei    val stage2FtqRead = new FtqRead
46884dbb3bSLinJiawei    val stage2Redirect = ValidIO(new Redirect)
47*faf3cfa9SLinJiawei    val stage3Redirect = ValidIO(new Redirect)
48884dbb3bSLinJiawei  })
49884dbb3bSLinJiawei  /*
50884dbb3bSLinJiawei        LoadQueue  Jump  ALU0  ALU1  ALU2  ALU3   exception    Stage1
51884dbb3bSLinJiawei          |         |      |    |     |     |         |
52*faf3cfa9SLinJiawei          |============= reg & compare =====|         |       ========
5336d7aed5SLinJiawei                            |                         |
5436d7aed5SLinJiawei                            |                         |
5536d7aed5SLinJiawei                            |                         |        Stage2
56884dbb3bSLinJiawei                            |                         |
57884dbb3bSLinJiawei                    redirect (flush backend)          |
58884dbb3bSLinJiawei                    |                                 |
59884dbb3bSLinJiawei               === reg ===                            |       ========
60884dbb3bSLinJiawei                    |                                 |
61884dbb3bSLinJiawei                    |----- mux (exception first) -----|        Stage3
62884dbb3bSLinJiawei                            |
63884dbb3bSLinJiawei                redirect (send to frontend)
64884dbb3bSLinJiawei   */
65*faf3cfa9SLinJiawei  def selectOlderRedirect(x: Valid[Redirect], y: Valid[Redirect]): Valid[Redirect] = {
66*faf3cfa9SLinJiawei    Mux(isAfter(x.bits, y.bits) && y.valid, y, x)
67*faf3cfa9SLinJiawei  }
68*faf3cfa9SLinJiawei  def selectOlderExuOut(x: Valid[ExuOutput], y: Valid[ExuOutput]): Valid[ExuOutput] = {
69*faf3cfa9SLinJiawei    Mux(isAfter(x.bits.redirect, y.bits.redirect) && y.valid, y, x)
70*faf3cfa9SLinJiawei  }
71*faf3cfa9SLinJiawei  val jumpOut = io.exuMispredict.head
72*faf3cfa9SLinJiawei  val oldestAluOut = ParallelOperation(io.exuMispredict.tail, selectOlderExuOut)
73*faf3cfa9SLinJiawei  val oldestExuOut = selectOlderExuOut(oldestAluOut, jumpOut) // select between jump and alu
74*faf3cfa9SLinJiawei
75*faf3cfa9SLinJiawei  val oldestMispredict = selectOlderRedirect(io.loadRelay, {
76*faf3cfa9SLinJiawei    val redirect = Wire(Valid(new Redirect))
77*faf3cfa9SLinJiawei    redirect.valid := oldestExuOut.valid
78*faf3cfa9SLinJiawei    redirect.bits := oldestExuOut.bits.redirect
79*faf3cfa9SLinJiawei    redirect
80*faf3cfa9SLinJiawei  })
81*faf3cfa9SLinJiawei
82*faf3cfa9SLinJiawei  val s1_isJalr = RegEnable(JumpOpType.jumpOpisJalr(jumpOut.bits.uop.ctrl.fuOpType), jumpOut.valid)
83*faf3cfa9SLinJiawei  val s1_JalrTarget = RegEnable(jumpOut.bits.redirect.cfiUpdate.target, jumpOut.valid)
84*faf3cfa9SLinJiawei  val s1_imm12_reg = RegEnable(oldestExuOut.bits.uop.ctrl.imm(11, 0), oldestExuOut.valid)
85*faf3cfa9SLinJiawei  val s1_pd = RegEnable(oldestExuOut.bits.uop.cf.pd, oldestExuOut.valid)
86*faf3cfa9SLinJiawei  val s1_redirect_bits_reg = Reg(new Redirect)
87*faf3cfa9SLinJiawei  val s1_redirect_valid_reg = RegInit(false.B)
88*faf3cfa9SLinJiawei
89*faf3cfa9SLinJiawei  // stage1 -> stage2
90*faf3cfa9SLinJiawei  when(oldestMispredict.valid && !oldestMispredict.bits.roqIdx.needFlush(io.stage2Redirect)){
91*faf3cfa9SLinJiawei    s1_redirect_bits_reg := oldestMispredict.bits
92*faf3cfa9SLinJiawei    s1_redirect_valid_reg := true.B
93*faf3cfa9SLinJiawei  }.otherwise({
94*faf3cfa9SLinJiawei    s1_redirect_valid_reg := false.B
95*faf3cfa9SLinJiawei  })
96*faf3cfa9SLinJiawei  io.stage2Redirect.valid := s1_redirect_valid_reg
97*faf3cfa9SLinJiawei  io.stage2Redirect.bits := s1_redirect_bits_reg
98*faf3cfa9SLinJiawei  io.stage2Redirect.bits.cfiUpdate := DontCare
99*faf3cfa9SLinJiawei  // at stage2, we read ftq to get pc
100*faf3cfa9SLinJiawei  io.stage2FtqRead.ptr := s1_redirect_bits_reg.ftqIdx
101*faf3cfa9SLinJiawei
102*faf3cfa9SLinJiawei  // stage3, calculate redirect target
103*faf3cfa9SLinJiawei  val s2_isJalr = RegEnable(s1_isJalr, s1_redirect_valid_reg)
104*faf3cfa9SLinJiawei  val s2_JalrTarget = RegEnable(s1_JalrTarget, s1_redirect_valid_reg)
105*faf3cfa9SLinJiawei  val s2_imm12_reg = RegEnable(s1_imm12_reg, s1_redirect_valid_reg)
106*faf3cfa9SLinJiawei  val s2_pd = RegEnable(s1_pd, s1_redirect_valid_reg)
107*faf3cfa9SLinJiawei  val s2_redirect_bits_reg = Reg(new Redirect)
108*faf3cfa9SLinJiawei  val s2_redirect_valid_reg = RegInit(false.B)
109*faf3cfa9SLinJiawei
110*faf3cfa9SLinJiawei  val ftqRead = io.stage2FtqRead.entry
111*faf3cfa9SLinJiawei  val pc = GetPcByFtq(ftqRead.ftqPC, s2_redirect_bits_reg.ftqOffset)
112*faf3cfa9SLinJiawei  val brTarget = pc + SignExt(s2_imm12_reg, XLEN)
113*faf3cfa9SLinJiawei  val isReplay = RedirectLevel.flushItself(s2_redirect_bits_reg.level)
114*faf3cfa9SLinJiawei  val target = Mux(isReplay,
115*faf3cfa9SLinJiawei    pc, // repaly from itself
116*faf3cfa9SLinJiawei    Mux(s2_isJalr,
117*faf3cfa9SLinJiawei      s2_JalrTarget, // jalr already save target
118*faf3cfa9SLinJiawei      brTarget // branch
119*faf3cfa9SLinJiawei    )
120*faf3cfa9SLinJiawei  )
121*faf3cfa9SLinJiawei  io.stage3Redirect.valid := s2_redirect_valid_reg
122*faf3cfa9SLinJiawei  io.stage3Redirect.bits := s2_redirect_bits_reg
123*faf3cfa9SLinJiawei  val stage3CfiUpdate = io.stage3Redirect.bits.cfiUpdate
124*faf3cfa9SLinJiawei  stage3CfiUpdate.pc := pc
125*faf3cfa9SLinJiawei  stage3CfiUpdate.pd := s2_pd
126*faf3cfa9SLinJiawei  stage3CfiUpdate.rasSp := ftqRead.rasSp
127*faf3cfa9SLinJiawei  stage3CfiUpdate.rasEntry := ftqRead.rasTop
128*faf3cfa9SLinJiawei  stage3CfiUpdate.hist := ftqRead.hist
129*faf3cfa9SLinJiawei  stage3CfiUpdate.predHist := ftqRead.predHist
130*faf3cfa9SLinJiawei  stage3CfiUpdate.specCnt := ftqRead.specCnt
131*faf3cfa9SLinJiawei  stage3CfiUpdate.predTaken :=
132*faf3cfa9SLinJiawei    ftqRead.cfiIndex.valid && s2_redirect_bits_reg.ftqOffset === ftqRead.cfiIndex.bits
133*faf3cfa9SLinJiawei  stage3CfiUpdate.sawNotTakenBranch := VecInit((0 until PredictWidth).map{ i =>
134*faf3cfa9SLinJiawei    if(i == 0) false.B else Cat(ftqRead.br_mask.take(i-1)).orR()
135*faf3cfa9SLinJiawei  })(s2_redirect_bits_reg.ftqOffset)
136*faf3cfa9SLinJiawei  stage3CfiUpdate.target := target
137*faf3cfa9SLinJiawei  stage3CfiUpdate.taken := s2_redirect_bits_reg.cfiUpdate.taken
138*faf3cfa9SLinJiawei  stage3CfiUpdate.isMisPred := s2_redirect_bits_reg.cfiUpdate.isMisPred
139884dbb3bSLinJiawei}
140884dbb3bSLinJiawei
14121732575SYinan Xuclass CtrlBlock extends XSModule with HasCircularQueuePtrHelper {
1428921b337SYinan Xu  val io = IO(new Bundle {
1438921b337SYinan Xu    val frontend = Flipped(new FrontendToBackendIO)
1448921b337SYinan Xu    val fromIntBlock = Flipped(new IntBlockToCtrlIO)
1458921b337SYinan Xu    val fromFpBlock = Flipped(new FpBlockToCtrlIO)
1468921b337SYinan Xu    val fromLsBlock = Flipped(new LsBlockToCtrlIO)
1478921b337SYinan Xu    val toIntBlock = new CtrlToIntBlockIO
1488921b337SYinan Xu    val toFpBlock = new CtrlToFpBlockIO
1498921b337SYinan Xu    val toLsBlock = new CtrlToLsBlockIO
1501c2588aaSYinan Xu    val roqio = new Bundle {
1511c2588aaSYinan Xu      // to int block
1521c2588aaSYinan Xu      val toCSR = new RoqCSRIO
1531c2588aaSYinan Xu      val exception = ValidIO(new MicroOp)
1541c2588aaSYinan Xu      val isInterrupt = Output(Bool())
1551c2588aaSYinan Xu      // to mem block
15621e7a6c5SYinan Xu      val commits = new RoqCommitIO
1571c2588aaSYinan Xu      val roqDeqPtr = Output(new RoqPtr)
1581c2588aaSYinan Xu    }
1598921b337SYinan Xu  })
1608921b337SYinan Xu
161884dbb3bSLinJiawei  val ftq = Module(new Ftq)
1628921b337SYinan Xu  val decode = Module(new DecodeStage)
1638921b337SYinan Xu  val rename = Module(new Rename)
164694b0180SLinJiawei  val dispatch = Module(new Dispatch)
1653fae98acSYinan Xu  val intBusyTable = Module(new BusyTable(NRIntReadPorts, NRIntWritePorts))
1663fae98acSYinan Xu  val fpBusyTable = Module(new BusyTable(NRFpReadPorts, NRFpWritePorts))
167884dbb3bSLinJiawei  val redirectGen = Module(new RedirectGenerator)
1688921b337SYinan Xu
169884dbb3bSLinJiawei  val roqWbSize = NRIntWritePorts + NRFpWritePorts + exuParameters.StuCnt
170694b0180SLinJiawei
171694b0180SLinJiawei  val roq = Module(new Roq(roqWbSize))
1728921b337SYinan Xu
173884dbb3bSLinJiawei  val backendRedirect = redirectGen.io.stage2Redirect
174*faf3cfa9SLinJiawei  val frontendRedirect = redirectGen.io.stage3Redirect
175*faf3cfa9SLinJiawei
176*faf3cfa9SLinJiawei  redirectGen.io.exuMispredict.zip(io.fromIntBlock.exuRedirect).map({case (x, y) =>
177*faf3cfa9SLinJiawei    x.valid := y.valid && y.bits.redirect.cfiUpdate.isMisPred
178*faf3cfa9SLinJiawei    x.bits := y.bits
179*faf3cfa9SLinJiawei  })
180*faf3cfa9SLinJiawei  redirectGen.io.loadRelay := io.fromLsBlock.replay
181*faf3cfa9SLinJiawei  redirectGen.io.roqRedirect := roq.io.redirectOut
1828921b337SYinan Xu
183884dbb3bSLinJiawei  ftq.io.enq <> io.frontend.fetchInfo
184884dbb3bSLinJiawei  for(i <- 0 until CommitWidth){
185884dbb3bSLinJiawei    ftq.io.roq_commits(i).valid := roq.io.commits.valid(i)
186884dbb3bSLinJiawei    ftq.io.roq_commits(i).bits := roq.io.commits.info(i)
187884dbb3bSLinJiawei  }
188884dbb3bSLinJiawei  ftq.io.redirect <> backendRedirect
189*faf3cfa9SLinJiawei  ftq.io.frontendRedirect <> frontendRedirect
190884dbb3bSLinJiawei  ftq.io.exuWriteback <> io.fromIntBlock.exuRedirect
191884dbb3bSLinJiawei
19236d7aed5SLinJiawei  ftq.io.ftqRead(1) <> redirectGen.io.stage2FtqRead
19336d7aed5SLinJiawei  ftq.io.ftqRead(2) <> DontCare // TODO: read exception pc form here
194884dbb3bSLinJiawei
195884dbb3bSLinJiawei  io.frontend.redirect_cfiUpdate := frontendRedirect
19603380706SLinJiawei  io.frontend.commit_cfiUpdate := ftq.io.commit_ftqEntry
19766bcc42fSYinan Xu
1988921b337SYinan Xu  decode.io.in <> io.frontend.cfVec
1998921b337SYinan Xu
200884dbb3bSLinJiawei  val jumpInst = dispatch.io.enqIQCtrl(0).bits
201884dbb3bSLinJiawei  ftq.io.ftqRead(0).ptr := jumpInst.cf.ftqPtr // jump
202884dbb3bSLinJiawei  io.toIntBlock.jumpPc := GetPcByFtq(ftq.io.ftqRead(0).entry.ftqPC, jumpInst.cf.ftqOffset)
2030412e00dSLinJiawei
204b424051cSYinan Xu  // pipeline between decode and dispatch
205b424051cSYinan Xu  for (i <- 0 until RenameWidth) {
206884dbb3bSLinJiawei    PipelineConnect(decode.io.out(i), rename.io.in(i), rename.io.in(i).ready,
207884dbb3bSLinJiawei      backendRedirect.valid || frontendRedirect.valid)
208b424051cSYinan Xu  }
2098921b337SYinan Xu
210884dbb3bSLinJiawei  rename.io.redirect <> backendRedirect
2118921b337SYinan Xu  rename.io.roqCommits <> roq.io.commits
2128921b337SYinan Xu  rename.io.out <> dispatch.io.fromRename
21399b8dc2cSYinan Xu  rename.io.renameBypass <> dispatch.io.renameBypass
2148921b337SYinan Xu
215884dbb3bSLinJiawei  dispatch.io.redirect <> backendRedirect
21621b47d38SYinan Xu  dispatch.io.enqRoq <> roq.io.enq
21708fafef0SYinan Xu  dispatch.io.enqLsq <> io.toLsBlock.enqLsq
2182bb6eba1SYinan Xu  dispatch.io.readIntRf <> io.toIntBlock.readRf
2192bb6eba1SYinan Xu  dispatch.io.readFpRf <> io.toFpBlock.readRf
2203fae98acSYinan Xu  dispatch.io.allocPregs.zipWithIndex.foreach { case (preg, i) =>
2213fae98acSYinan Xu    intBusyTable.io.allocPregs(i).valid := preg.isInt
2221c931a03SYinan Xu    fpBusyTable.io.allocPregs(i).valid := preg.isFp
2233fae98acSYinan Xu    intBusyTable.io.allocPregs(i).bits := preg.preg
2243fae98acSYinan Xu    fpBusyTable.io.allocPregs(i).bits := preg.preg
2253fae98acSYinan Xu  }
2268921b337SYinan Xu  dispatch.io.numExist <> io.fromIntBlock.numExist ++ io.fromFpBlock.numExist ++ io.fromLsBlock.numExist
2272bb6eba1SYinan Xu  dispatch.io.enqIQCtrl <> io.toIntBlock.enqIqCtrl ++ io.toFpBlock.enqIqCtrl ++ io.toLsBlock.enqIqCtrl
22876e1d2a4SYikeZhou//  dispatch.io.enqIQData <> io.toIntBlock.enqIqData ++ io.toFpBlock.enqIqData ++ io.toLsBlock.enqIqData
2298921b337SYinan Xu
2300412e00dSLinJiawei
231884dbb3bSLinJiawei  val flush = backendRedirect.valid && RedirectLevel.isUnconditional(backendRedirect.bits.level)
2323fae98acSYinan Xu  fpBusyTable.io.flush := flush
2333fae98acSYinan Xu  intBusyTable.io.flush := flush
2343fae98acSYinan Xu  for((wb, setPhyRegRdy) <- io.fromIntBlock.wbRegs.zip(intBusyTable.io.wbPregs)){
2351e2ad30cSYinan Xu    setPhyRegRdy.valid := wb.valid && wb.bits.uop.ctrl.rfWen
2363fae98acSYinan Xu    setPhyRegRdy.bits := wb.bits.uop.pdest
2373fae98acSYinan Xu  }
2383fae98acSYinan Xu  for((wb, setPhyRegRdy) <- io.fromFpBlock.wbRegs.zip(fpBusyTable.io.wbPregs)){
2393fae98acSYinan Xu    setPhyRegRdy.valid := wb.valid && wb.bits.uop.ctrl.fpWen
2403fae98acSYinan Xu    setPhyRegRdy.bits := wb.bits.uop.pdest
2413fae98acSYinan Xu  }
2423fae98acSYinan Xu  intBusyTable.io.rfReadAddr <> dispatch.io.readIntRf.map(_.addr)
2433fae98acSYinan Xu  intBusyTable.io.pregRdy <> dispatch.io.intPregRdy
2443fae98acSYinan Xu  fpBusyTable.io.rfReadAddr <> dispatch.io.readFpRf.map(_.addr)
2453fae98acSYinan Xu  fpBusyTable.io.pregRdy <> dispatch.io.fpPregRdy
2463fae98acSYinan Xu
247884dbb3bSLinJiawei  roq.io.redirect <> backendRedirect
248c778d2afSLinJiawei  roq.io.exeWbResults.zip(
2490412e00dSLinJiawei    io.fromIntBlock.wbRegs ++ io.fromFpBlock.wbRegs ++ io.fromLsBlock.stOut
2500412e00dSLinJiawei  ).foreach{
2510412e00dSLinJiawei    case(x, y) =>
2520412e00dSLinJiawei      x.bits := y.bits
253884dbb3bSLinJiawei      x.valid := y.valid
2540412e00dSLinJiawei  }
2550412e00dSLinJiawei
256884dbb3bSLinJiawei  // TODO: is 'backendRedirect' necesscary?
257884dbb3bSLinJiawei  io.toIntBlock.redirect <> backendRedirect
258884dbb3bSLinJiawei  io.toFpBlock.redirect <> backendRedirect
259884dbb3bSLinJiawei  io.toLsBlock.redirect <> backendRedirect
2600412e00dSLinJiawei
2619916fbd7SYikeZhou  dispatch.io.readPortIndex.intIndex <> io.toIntBlock.readPortIndex
2629916fbd7SYikeZhou  dispatch.io.readPortIndex.fpIndex <> io.toFpBlock.readPortIndex
2639916fbd7SYikeZhou
2641c2588aaSYinan Xu  // roq to int block
2651c2588aaSYinan Xu  io.roqio.toCSR <> roq.io.csr
266edf53867SYinan Xu  io.roqio.exception.valid := roq.io.redirectOut.valid && roq.io.redirectOut.bits.isException()
2671c2588aaSYinan Xu  io.roqio.exception.bits := roq.io.exception
268edf53867SYinan Xu  io.roqio.isInterrupt := roq.io.redirectOut.bits.interrupt
2691c2588aaSYinan Xu  // roq to mem block
2701c2588aaSYinan Xu  io.roqio.roqDeqPtr := roq.io.roqDeqPtr
2711c2588aaSYinan Xu  io.roqio.commits := roq.io.commits
2728921b337SYinan Xu}
273