xref: /XiangShan/src/main/scala/xiangshan/backend/CtrlBlock.scala (revision fc8a3b3f6f68fb64c11a89cc89f74516cca06b79)
1package xiangshan.backend
2
3import chisel3._
4import chisel3.util._
5import utils._
6import xiangshan._
7import xiangshan.backend.decode.{DecodeStage, ImmUnion}
8import xiangshan.backend.rename.{BusyTable, Rename}
9import xiangshan.backend.dispatch.Dispatch
10import xiangshan.backend.exu._
11import xiangshan.backend.exu.Exu.exuConfigs
12import xiangshan.backend.ftq.{Ftq, FtqRead, GetPcByFtq}
13import xiangshan.backend.regfile.RfReadPort
14import xiangshan.backend.roq.{Roq, RoqCSRIO, RoqLsqIO, RoqPtr}
15import xiangshan.mem.LsqEnqIO
16
17class CtrlToIntBlockIO extends XSBundle {
18  val enqIqCtrl = Vec(exuParameters.IntExuCnt, DecoupledIO(new MicroOp))
19  val readRf = Vec(NRIntReadPorts, Output(UInt(PhyRegIdxWidth.W)))
20  val jumpPc = Output(UInt(VAddrBits.W))
21  val jalr_target = Output(UInt(VAddrBits.W))
22  // int block only uses port 0~7
23  val readPortIndex = Vec(exuParameters.IntExuCnt, Output(UInt(log2Ceil(8 / 2).W))) // TODO parameterize 8 here
24  val redirect = ValidIO(new Redirect)
25  val flush = Output(Bool())
26}
27
28class CtrlToFpBlockIO extends XSBundle {
29  val enqIqCtrl = Vec(exuParameters.FpExuCnt, DecoupledIO(new MicroOp))
30  val readRf = Vec(NRFpReadPorts, Output(UInt(PhyRegIdxWidth.W)))
31  // fp block uses port 0~11
32  val readPortIndex = Vec(exuParameters.FpExuCnt, Output(UInt(log2Ceil((NRFpReadPorts - exuParameters.StuCnt) / 3).W)))
33  val redirect = ValidIO(new Redirect)
34  val flush = Output(Bool())
35}
36
37class CtrlToLsBlockIO extends XSBundle {
38  val enqIqCtrl = Vec(exuParameters.LsExuCnt, DecoupledIO(new MicroOp))
39  val enqLsq = Flipped(new LsqEnqIO)
40  val redirect = ValidIO(new Redirect)
41  val flush = Output(Bool())
42}
43
44class RedirectGenerator extends XSModule with HasCircularQueuePtrHelper {
45  val io = IO(new Bundle() {
46    val loadRelay = Flipped(ValidIO(new Redirect))
47    val exuMispredict = Vec(exuParameters.JmpCnt + exuParameters.AluCnt, Flipped(ValidIO(new ExuOutput)))
48    val flush = Input(Bool())
49    val stage2FtqRead = new FtqRead
50    val stage2Redirect = ValidIO(new Redirect)
51    val stage3Redirect = ValidIO(new Redirect)
52  })
53  /*
54        LoadQueue  Jump  ALU0  ALU1  ALU2  ALU3   exception    Stage1
55          |         |      |    |     |     |         |
56          |============= reg & compare =====|         |       ========
57                            |                         |
58                            |                         |
59                            |                         |        Stage2
60                            |                         |
61                    redirect (flush backend)          |
62                    |                                 |
63               === reg ===                            |       ========
64                    |                                 |
65                    |----- mux (exception first) -----|        Stage3
66                            |
67                redirect (send to frontend)
68   */
69  def selectOlderRedirect(x: Valid[Redirect], y: Valid[Redirect]): Valid[Redirect] = {
70    Mux(x.valid,
71      Mux(y.valid,
72        Mux(isAfter(x.bits.roqIdx, y.bits.roqIdx), y, x),
73        x
74      ),
75      y
76    )
77  }
78  def selectOlderExuOutWithFlag(x: Valid[ExuOutput], y: Valid[ExuOutput]): (Valid[ExuOutput], Bool) = {
79    val yIsOlder = Mux(x.valid,
80      Mux(y.valid,
81        Mux(isAfter(x.bits.redirect.roqIdx, y.bits.redirect.roqIdx), true.B, false.B),
82        false.B
83      ),
84      true.B
85    )
86    val sel = Mux(yIsOlder, y, x)
87    (sel, yIsOlder)
88  }
89  def selectOlderExuOut(x: Valid[ExuOutput], y: Valid[ExuOutput]): Valid[ExuOutput] = {
90    selectOlderExuOutWithFlag(x, y)._1
91  }
92  val jumpOut = io.exuMispredict.head
93  val oldestAluOut = ParallelOperation(io.exuMispredict.tail, selectOlderExuOut)
94  val (oldestExuOut, jumpIsOlder) = selectOlderExuOutWithFlag(oldestAluOut, jumpOut) // select between jump and alu
95
96  val oldestMispredict = selectOlderRedirect(io.loadRelay, {
97    val redirect = Wire(Valid(new Redirect))
98    redirect.valid := oldestExuOut.valid
99    redirect.bits := oldestExuOut.bits.redirect
100    redirect
101  })
102
103  XSDebug(oldestExuOut.valid, p"exuMispredict: ${Binary(Cat(io.exuMispredict.map(_.valid)))}\n")
104
105  val s1_isJump = RegNext(jumpIsOlder, init = false.B)
106  val s1_jumpTarget = RegEnable(jumpOut.bits.redirect.cfiUpdate.target, jumpOut.valid)
107  val s1_imm12_reg = RegEnable(oldestExuOut.bits.uop.ctrl.imm(11, 0), oldestExuOut.valid)
108  val s1_pd = RegEnable(oldestExuOut.bits.uop.cf.pd, oldestExuOut.valid)
109  val s1_redirect_bits_reg = Reg(new Redirect)
110  val s1_redirect_valid_reg = RegInit(false.B)
111
112  // stage1 -> stage2
113  when(oldestMispredict.valid && !oldestMispredict.bits.roqIdx.needFlush(io.stage2Redirect, io.flush)){
114    s1_redirect_bits_reg := oldestMispredict.bits
115    s1_redirect_valid_reg := true.B
116  }.otherwise({
117    s1_redirect_valid_reg := false.B
118  })
119  io.stage2Redirect.valid := s1_redirect_valid_reg && !io.flush
120  io.stage2Redirect.bits := s1_redirect_bits_reg
121  io.stage2Redirect.bits.cfiUpdate := DontCare
122  // at stage2, we read ftq to get pc
123  io.stage2FtqRead.ptr := s1_redirect_bits_reg.ftqIdx
124
125  // stage3, calculate redirect target
126  val s2_isJump = RegNext(s1_isJump)
127  val s2_jumpTarget = RegEnable(s1_jumpTarget, s1_redirect_valid_reg)
128  val s2_imm12_reg = RegEnable(s1_imm12_reg, s1_redirect_valid_reg)
129  val s2_pd = RegEnable(s1_pd, s1_redirect_valid_reg)
130  val s2_redirect_bits_reg = RegEnable(s1_redirect_bits_reg, enable = s1_redirect_valid_reg)
131  val s2_redirect_valid_reg = RegNext(s1_redirect_valid_reg && !io.flush, init = false.B)
132
133  val ftqRead = io.stage2FtqRead.entry
134  val cfiUpdate_pc =
135    Cat(ftqRead.ftqPC.head(VAddrBits - s2_redirect_bits_reg.ftqOffset.getWidth - instOffsetBits),
136        s2_redirect_bits_reg.ftqOffset,
137        0.U(instOffsetBits.W))
138  val real_pc =
139    GetPcByFtq(ftqRead.ftqPC, s2_redirect_bits_reg.ftqOffset,
140               ftqRead.lastPacketPC.valid,
141               ftqRead.lastPacketPC.bits)
142  val brTarget = real_pc + SignExt(ImmUnion.B.toImm32(s2_imm12_reg), XLEN)
143  val snpc = real_pc + Mux(s2_pd.isRVC, 2.U, 4.U)
144  val isReplay = RedirectLevel.flushItself(s2_redirect_bits_reg.level)
145  val target = Mux(isReplay,
146    real_pc, // repaly from itself
147    Mux(s2_redirect_bits_reg.cfiUpdate.taken,
148      Mux(s2_isJump, s2_jumpTarget, brTarget),
149      snpc
150    )
151  )
152  io.stage3Redirect.valid := s2_redirect_valid_reg
153  io.stage3Redirect.bits := s2_redirect_bits_reg
154  val stage3CfiUpdate = io.stage3Redirect.bits.cfiUpdate
155  stage3CfiUpdate.pc := cfiUpdate_pc
156  stage3CfiUpdate.pd := s2_pd
157  stage3CfiUpdate.rasSp := ftqRead.rasSp
158  stage3CfiUpdate.rasEntry := ftqRead.rasTop
159  stage3CfiUpdate.hist := ftqRead.hist
160  stage3CfiUpdate.predHist := ftqRead.predHist
161  stage3CfiUpdate.specCnt := ftqRead.specCnt
162  stage3CfiUpdate.predTaken := s2_redirect_bits_reg.cfiUpdate.predTaken
163  stage3CfiUpdate.sawNotTakenBranch := VecInit((0 until PredictWidth).map{ i =>
164    if(i == 0) false.B else Cat(ftqRead.br_mask.take(i)).orR()
165  })(s2_redirect_bits_reg.ftqOffset)
166  stage3CfiUpdate.target := target
167  stage3CfiUpdate.taken := s2_redirect_bits_reg.cfiUpdate.taken
168  stage3CfiUpdate.isMisPred := s2_redirect_bits_reg.cfiUpdate.isMisPred
169}
170
171class CtrlBlock extends XSModule with HasCircularQueuePtrHelper {
172  val io = IO(new Bundle {
173    val frontend = Flipped(new FrontendToBackendIO)
174    val fromIntBlock = Flipped(new IntBlockToCtrlIO)
175    val fromFpBlock = Flipped(new FpBlockToCtrlIO)
176    val fromLsBlock = Flipped(new LsBlockToCtrlIO)
177    val toIntBlock = new CtrlToIntBlockIO
178    val toFpBlock = new CtrlToFpBlockIO
179    val toLsBlock = new CtrlToLsBlockIO
180    val roqio = new Bundle {
181      // to int block
182      val toCSR = new RoqCSRIO
183      val exception = ValidIO(new ExceptionInfo)
184      // to mem block
185      val lsq = new RoqLsqIO
186    }
187  })
188
189  val difftestIO = IO(new Bundle() {
190    val fromRoq = new Bundle() {
191      val commit = Output(UInt(32.W))
192      val thisPC = Output(UInt(XLEN.W))
193      val thisINST = Output(UInt(32.W))
194      val skip = Output(UInt(32.W))
195      val wen = Output(UInt(32.W))
196      val wdata = Output(Vec(CommitWidth, UInt(XLEN.W))) // set difftest width to 6
197      val wdst = Output(Vec(CommitWidth, UInt(32.W))) // set difftest width to 6
198      val wpc = Output(Vec(CommitWidth, UInt(XLEN.W))) // set difftest width to 6
199      val isRVC = Output(UInt(32.W))
200      val scFailed = Output(Bool())
201      val lpaddr = Output(Vec(CommitWidth, UInt(64.W)))
202      val ltype = Output(Vec(CommitWidth, UInt(32.W)))
203      val lfu = Output(Vec(CommitWidth, UInt(4.W)))
204    }
205  })
206  difftestIO <> DontCare
207
208  val ftq = Module(new Ftq)
209  val trapIO = IO(new TrapIO())
210  trapIO <> DontCare
211
212  val decode = Module(new DecodeStage)
213  val rename = Module(new Rename)
214  val dispatch = Module(new Dispatch)
215  val intBusyTable = Module(new BusyTable(NRIntReadPorts, NRIntWritePorts))
216  val fpBusyTable = Module(new BusyTable(NRFpReadPorts, NRFpWritePorts))
217  val redirectGen = Module(new RedirectGenerator)
218
219  val roqWbSize = NRIntWritePorts + NRFpWritePorts + exuParameters.StuCnt
220  val roq = Module(new Roq(roqWbSize))
221
222  val backendRedirect = redirectGen.io.stage2Redirect
223  val frontendRedirect = redirectGen.io.stage3Redirect
224  val flush = roq.io.flushOut.valid
225  val flushReg = RegNext(flush)
226
227  redirectGen.io.exuMispredict.zip(io.fromIntBlock.exuRedirect).map({case (x, y) =>
228    val misPred = y.valid && y.bits.redirect.cfiUpdate.isMisPred
229    val killedByOlder = y.bits.uop.roqIdx.needFlush(backendRedirect, flushReg)
230    x.valid := RegNext(misPred && !killedByOlder, init = false.B)
231    x.bits := RegEnable(y.bits, y.valid)
232  })
233  redirectGen.io.loadRelay := io.fromLsBlock.replay
234  redirectGen.io.flush := flushReg
235
236  ftq.io.enq <> io.frontend.fetchInfo
237  for(i <- 0 until CommitWidth){
238    ftq.io.roq_commits(i).valid := roq.io.commits.valid(i) && !roq.io.commits.isWalk
239    ftq.io.roq_commits(i).bits := roq.io.commits.info(i)
240  }
241  ftq.io.redirect <> backendRedirect
242  ftq.io.flush := flushReg
243  ftq.io.flushIdx := RegNext(roq.io.flushOut.bits.ftqIdx)
244  ftq.io.flushOffset := RegNext(roq.io.flushOut.bits.ftqOffset)
245  ftq.io.frontendRedirect <> frontendRedirect
246  ftq.io.exuWriteback <> io.fromIntBlock.exuRedirect
247
248  ftq.io.ftqRead(1) <> redirectGen.io.stage2FtqRead
249  ftq.io.ftqRead(2).ptr := roq.io.flushOut.bits.ftqIdx
250  val flushPC = GetPcByFtq(
251    ftq.io.ftqRead(2).entry.ftqPC,
252    RegEnable(roq.io.flushOut.bits.ftqOffset, roq.io.flushOut.valid),
253    ftq.io.ftqRead(2).entry.lastPacketPC.valid,
254    ftq.io.ftqRead(2).entry.lastPacketPC.bits
255  )
256
257  val flushRedirect = Wire(Valid(new Redirect))
258  flushRedirect.valid := flushReg
259  flushRedirect.bits := DontCare
260  flushRedirect.bits.ftqIdx := RegEnable(roq.io.flushOut.bits.ftqIdx, flush)
261  flushRedirect.bits.interrupt := true.B
262  flushRedirect.bits.cfiUpdate.target := Mux(io.roqio.toCSR.isXRet || roq.io.exception.valid,
263    io.roqio.toCSR.trapTarget,
264    flushPC + 4.U // flush pipe
265  )
266
267  io.frontend.redirect_cfiUpdate := Mux(flushRedirect.valid, flushRedirect, frontendRedirect)
268  io.frontend.commit_cfiUpdate := ftq.io.commit_ftqEntry
269  io.frontend.ftqEnqPtr := ftq.io.enqPtr
270  io.frontend.ftqLeftOne := ftq.io.leftOne
271
272  decode.io.in <> io.frontend.cfVec
273
274  val jumpInst = dispatch.io.enqIQCtrl(0).bits
275  val ftqOffsetReg = Reg(UInt(log2Up(PredictWidth).W))
276  ftqOffsetReg := jumpInst.cf.ftqOffset
277  ftq.io.ftqRead(0).ptr := jumpInst.cf.ftqPtr // jump
278  io.toIntBlock.jumpPc := GetPcByFtq(
279    ftq.io.ftqRead(0).entry.ftqPC, ftqOffsetReg,
280    ftq.io.ftqRead(0).entry.lastPacketPC.valid,
281    ftq.io.ftqRead(0).entry.lastPacketPC.bits
282  )
283  io.toIntBlock.jalr_target := ftq.io.ftqRead(0).entry.target
284
285  // pipeline between decode and dispatch
286  for (i <- 0 until RenameWidth) {
287    PipelineConnect(decode.io.out(i), rename.io.in(i), rename.io.in(i).ready,
288      io.frontend.redirect_cfiUpdate.valid)
289  }
290
291  rename.io.redirect <> backendRedirect
292  rename.io.flush := flushReg
293  rename.io.roqCommits <> roq.io.commits
294  rename.io.out <> dispatch.io.fromRename
295  rename.io.renameBypass <> dispatch.io.renameBypass
296  rename.io.dispatchInfo <> dispatch.io.preDpInfo
297
298  dispatch.io.redirect <> backendRedirect
299  dispatch.io.flush := flushReg
300  dispatch.io.enqRoq <> roq.io.enq
301  dispatch.io.enqLsq <> io.toLsBlock.enqLsq
302  dispatch.io.readIntRf <> io.toIntBlock.readRf
303  dispatch.io.readFpRf <> io.toFpBlock.readRf
304  dispatch.io.allocPregs.zipWithIndex.foreach { case (preg, i) =>
305    intBusyTable.io.allocPregs(i).valid := preg.isInt
306    fpBusyTable.io.allocPregs(i).valid := preg.isFp
307    intBusyTable.io.allocPregs(i).bits := preg.preg
308    fpBusyTable.io.allocPregs(i).bits := preg.preg
309  }
310  dispatch.io.numExist <> io.fromIntBlock.numExist ++ io.fromFpBlock.numExist ++ io.fromLsBlock.numExist
311  dispatch.io.enqIQCtrl <> io.toIntBlock.enqIqCtrl ++ io.toFpBlock.enqIqCtrl ++ io.toLsBlock.enqIqCtrl
312//  dispatch.io.enqIQData <> io.toIntBlock.enqIqData ++ io.toFpBlock.enqIqData ++ io.toLsBlock.enqIqData
313
314
315  fpBusyTable.io.flush := flushReg
316  intBusyTable.io.flush := flushReg
317  for((wb, setPhyRegRdy) <- io.fromIntBlock.wbRegs.zip(intBusyTable.io.wbPregs)){
318    setPhyRegRdy.valid := wb.valid && wb.bits.uop.ctrl.rfWen
319    setPhyRegRdy.bits := wb.bits.uop.pdest
320  }
321  for((wb, setPhyRegRdy) <- io.fromFpBlock.wbRegs.zip(fpBusyTable.io.wbPregs)){
322    setPhyRegRdy.valid := wb.valid && wb.bits.uop.ctrl.fpWen
323    setPhyRegRdy.bits := wb.bits.uop.pdest
324  }
325  intBusyTable.io.read <> dispatch.io.readIntState
326  fpBusyTable.io.read <> dispatch.io.readFpState
327
328  roq.io.redirect <> backendRedirect
329  roq.io.exeWbResults <> (io.fromIntBlock.wbRegs ++ io.fromFpBlock.wbRegs ++ io.fromLsBlock.stOut)
330
331  // TODO: is 'backendRedirect' necesscary?
332  io.toIntBlock.redirect <> backendRedirect
333  io.toIntBlock.flush <> flushReg
334  io.toFpBlock.redirect <> backendRedirect
335  io.toFpBlock.flush <> flushReg
336  io.toLsBlock.redirect <> backendRedirect
337  io.toLsBlock.flush <> flushReg
338
339  if (!env.FPGAPlatform) {
340    difftestIO.fromRoq <> roq.difftestIO
341    trapIO <> roq.trapIO
342  }
343
344  dispatch.io.readPortIndex.intIndex <> io.toIntBlock.readPortIndex
345  dispatch.io.readPortIndex.fpIndex <> io.toFpBlock.readPortIndex
346
347  // roq to int block
348  io.roqio.toCSR <> roq.io.csr
349  io.roqio.exception := roq.io.exception
350  io.roqio.exception.bits.uop.cf.pc := flushPC
351  // roq to mem block
352  io.roqio.lsq <> roq.io.lsq
353}
354