xref: /XiangShan/src/main/scala/xiangshan/frontend/IFU.scala (revision 17e43f8e9ad12c6c42ef8e31c92e68630b78cd53)
1package xiangshan.frontend
2
3import chisel3._
4import chisel3.util._
5import device.RAMHelper
6import xiangshan._
7import utils._
8import xiangshan.cache._
9import chisel3.experimental.chiselName
10import freechips.rocketchip.tile.HasLazyRoCC
11import chisel3.ExcitingUtils._
12import xiangshan.backend.ftq.FtqPtr
13
14trait HasInstrMMIOConst extends HasXSParameter with HasIFUConst{
15  def mmioBusWidth = 64
16  def mmioBusBytes = mmioBusWidth /8
17  def mmioBeats = FetchWidth * 4 * 8 / mmioBusWidth
18  def mmioMask  = VecInit(List.fill(PredictWidth)(true.B)).asUInt
19  def mmioBusAligned(pc :UInt): UInt = align(pc, mmioBusBytes)
20}
21
22trait HasIFUConst extends HasXSParameter {
23  val resetVector = 0x10000000L//TODO: set reset vec
24  def align(pc: UInt, bytes: Int): UInt = Cat(pc(VAddrBits-1, log2Ceil(bytes)), 0.U(log2Ceil(bytes).W))
25  val groupBytes = 64 // correspond to cache line size
26  val groupOffsetBits = log2Ceil(groupBytes)
27  val groupWidth = groupBytes / instBytes
28  val packetBytes = PredictWidth * instBytes
29  val packetOffsetBits = log2Ceil(packetBytes)
30  def offsetInPacket(pc: UInt) = pc(packetOffsetBits-1, instOffsetBits)
31  def packetIdx(pc: UInt) = pc(VAddrBits-1, log2Ceil(packetBytes))
32  def groupAligned(pc: UInt)  = align(pc, groupBytes)
33  def packetAligned(pc: UInt) = align(pc, packetBytes)
34  def mask(pc: UInt): UInt = ((~(0.U(PredictWidth.W))) << offsetInPacket(pc))(PredictWidth-1,0)
35  def snpc(pc: UInt): UInt = packetAligned(pc) + packetBytes.U
36
37  val enableGhistRepair = true
38  val IFUDebug = true
39}
40
41class GlobalHistory extends XSBundle {
42  val predHist = UInt(HistoryLength.W)
43  def update(sawNTBr: Bool, takenOnBr: Bool, hist: UInt = predHist): GlobalHistory = {
44    val g = Wire(new GlobalHistory)
45    val shifted = takenOnBr || sawNTBr
46    g.predHist := Mux(shifted, (hist << 1) | takenOnBr.asUInt, hist)
47    g
48  }
49
50  final def === (that: GlobalHistory): Bool = {
51    predHist === that.predHist
52  }
53
54  final def =/= (that: GlobalHistory): Bool = !(this === that)
55
56  implicit val name = "IFU"
57  def debug(where: String) = XSDebug(p"[${where}_GlobalHistory] hist=${Binary(predHist)}\n")
58  // override def toString(): String = "histPtr=%d, sawNTBr=%d, takenOnBr=%d, saveHalfRVI=%d".format(histPtr, sawNTBr, takenOnBr, saveHalfRVI)
59}
60
61
62class IFUIO extends XSBundle
63{
64  // to ibuffer
65  val fetchPacket = DecoupledIO(new FetchPacket)
66  // from backend
67  val redirect = Flipped(ValidIO(new Redirect))
68  val bp_ctrl = Input(new BPUCtrl)
69  val commitUpdate = Flipped(ValidIO(new FtqEntry))
70  val ftqEnqPtr = Input(new FtqPtr)
71  val ftqLeftOne = Input(Bool())
72  // to backend
73  val toFtq = DecoupledIO(new FtqEntry)
74  // to icache
75  val icacheMemGrant = Flipped(DecoupledIO(new L1plusCacheResp))
76  val fencei = Input(Bool())
77  // from icache
78  val icacheMemAcq = DecoupledIO(new L1plusCacheReq)
79  val l1plusFlush = Output(Bool())
80  val prefetchTrainReq = ValidIO(new IcacheMissReq)
81  // to tlb
82  val sfence = Input(new SfenceBundle)
83  val tlbCsr = Input(new TlbCsrBundle)
84  // from tlb
85  val ptw = new TlbPtwIO
86  // icache uncache
87  val mmio_acquire = DecoupledIO(new InsUncacheReq)
88  val mmio_grant  = Flipped(DecoupledIO(new InsUncacheResp))
89  val mmio_flush = Output(Bool())
90}
91
92class PrevHalfInstr extends XSBundle {
93  val pc = UInt(VAddrBits.W)
94  val npc = UInt(VAddrBits.W)
95  val instr = UInt(16.W)
96  val ipf = Bool()
97}
98
99@chiselName
100class IFU extends XSModule with HasIFUConst with HasCircularQueuePtrHelper
101{
102  val io = IO(new IFUIO)
103  val bpu = BPU(EnableBPU)
104  val icache = Module(new ICache)
105
106  io.ptw <> TLB(
107    in = Seq(icache.io.tlb),
108    sfence = io.sfence,
109    csr = io.tlbCsr,
110    width = 1,
111    isDtlb = false,
112    shouldBlock = true
113  )
114
115  val if2_redirect, if3_redirect, if4_redirect = WireInit(false.B)
116  val if1_flush, if2_flush, if3_flush, if4_flush = WireInit(false.B)
117
118  val icacheResp = icache.io.resp.bits
119
120  if4_flush := io.redirect.valid
121  if3_flush := if4_flush || if4_redirect
122  if2_flush := if3_flush || if3_redirect
123  if1_flush := if2_flush || if2_redirect
124
125  //********************** IF1 ****************************//
126  val if1_valid = !reset.asBool && GTimer() > 500.U
127  val if1_npc = WireInit(0.U(VAddrBits.W))
128  val if2_ready = WireInit(false.B)
129  val if2_valid = RegInit(init = false.B)
130  val if2_allReady = WireInit(if2_ready && icache.io.req.ready)
131  val if1_fire = (if1_valid &&  if2_allReady) && (icache.io.tlb.resp.valid || !if2_valid)
132  val if1_can_go = if1_fire
133
134  val if1_gh, if2_gh, if3_gh, if4_gh = Wire(new GlobalHistory)
135  val if2_predicted_gh, if3_predicted_gh, if4_predicted_gh = Wire(new GlobalHistory)
136  val final_gh = RegInit(0.U.asTypeOf(new GlobalHistory))
137  val final_gh_bypass = WireInit(0.U.asTypeOf(new GlobalHistory))
138  val flush_final_gh = WireInit(false.B)
139
140  //********************** IF2 ****************************//
141  val if2_allValid = if2_valid && icache.io.tlb.resp.valid
142  val if3_ready = WireInit(false.B)
143  val if2_fire = (if2_valid && if3_ready) && icache.io.tlb.resp.valid
144  val if2_pc = RegEnable(next = if1_npc, init = resetVector.U, enable = if1_can_go)
145  val if2_snpc = snpc(if2_pc)
146  val if2_predHist = RegEnable(if1_gh.predHist, enable=if1_can_go)
147  if2_ready := if3_ready || !if2_valid
148  when (if1_can_go)       { if2_valid := true.B }
149  .elsewhen (if2_flush) { if2_valid := false.B }
150  .elsewhen (if2_fire)  { if2_valid := false.B }
151
152  val npcGen = new PriorityMuxGenerator[UInt]
153  npcGen.register(true.B, RegNext(if1_npc), Some("stallPC"))
154  val if2_bp = bpu.io.out(0)
155
156  // if taken, bp_redirect should be true
157  // when taken on half RVI, we suppress this redirect signal
158
159  npcGen.register(if2_valid, Mux(if2_bp.taken, if2_bp.target, if2_snpc), Some("if2_target"))
160
161  if2_predicted_gh := if2_gh.update(if2_bp.hasNotTakenBrs, if2_bp.takenOnBr)
162
163  //********************** IF3 ****************************//
164  // if3 should wait for instructions resp to arrive
165  val if3_valid = RegInit(init = false.B)
166  val if4_ready = WireInit(false.B)
167  val if3_allValid = if3_valid && icache.io.resp.valid
168  val if3_fire = if3_allValid && if4_ready
169  val if3_pc = RegEnable(if2_pc, if2_fire)
170  val if3_snpc = RegEnable(if2_snpc, if2_fire)
171  val if3_predHist = RegEnable(if2_predHist, enable=if2_fire)
172  if3_ready := if4_ready && icache.io.resp.valid || !if3_valid
173  when (if3_flush) {
174    if3_valid := false.B
175  }.elsewhen (if2_fire && !if2_flush) {
176    if3_valid := true.B
177  }.elsewhen (if3_fire) {
178    if3_valid := false.B
179  }
180
181  val if3_bp = bpu.io.out(1)
182  if3_predicted_gh := if3_gh.update(if3_bp.hasNotTakenBrs, if3_bp.takenOnBr)
183
184
185  val prevHalfInstrReq = WireInit(0.U.asTypeOf(ValidUndirectioned(new PrevHalfInstr)))
186  // only valid when if4_fire
187  val hasPrevHalfInstrReq = prevHalfInstrReq.valid && HasCExtension.B
188
189  val if3_prevHalfInstr = RegInit(0.U.asTypeOf(ValidUndirectioned(new PrevHalfInstr)))
190
191  // 32-bit instr crosses 2 pages, and the higher 16-bit triggers page fault
192  val crossPageIPF = WireInit(false.B)
193
194  val if3_pendingPrevHalfInstr = if3_prevHalfInstr.valid && HasCExtension.B
195
196  // the previous half of RVI instruction waits until it meets its last half
197  val if3_prevHalfInstrMet = if3_pendingPrevHalfInstr && if3_prevHalfInstr.bits.npc === if3_pc && if3_valid
198  // set to invalid once consumed or redirect from backend
199  val if3_prevHalfConsumed = if3_prevHalfInstrMet && if3_fire
200  val if3_prevHalfFlush = if4_flush
201  when (if3_prevHalfFlush) {
202    if3_prevHalfInstr.valid := false.B
203  }.elsewhen (hasPrevHalfInstrReq) {
204    if3_prevHalfInstr.valid := true.B
205  }.elsewhen (if3_prevHalfConsumed) {
206    if3_prevHalfInstr.valid := false.B
207  }
208  when (hasPrevHalfInstrReq) {
209    if3_prevHalfInstr.bits := prevHalfInstrReq.bits
210  }
211  // when bp signal a redirect, we distinguish between taken and not taken
212  // if taken and saveHalfRVI is true, we do not redirect to the target
213
214  class IF3_PC_COMP extends XSModule {
215    val io = IO(new Bundle {
216      val if2_pc = Input(UInt(VAddrBits.W))
217      val pc     = Input(UInt(VAddrBits.W))
218      val if2_valid = Input(Bool())
219      val res = Output(Bool())
220    })
221    io.res := !io.if2_valid || io.if2_valid && io.if2_pc =/= io.pc
222  }
223  def if3_nextValidPCNotEquals(pc: UInt) = {
224    val comp = Module(new IF3_PC_COMP)
225    comp.io.if2_pc := if2_pc
226    comp.io.pc     := pc
227    comp.io.if2_valid := if2_valid
228    comp.io.res
229  }
230
231  val if3_predTakenRedirectVec = VecInit((0 until PredictWidth).map(i => !if3_pendingPrevHalfInstr && if3_bp.takens(i) && if3_nextValidPCNotEquals(if3_bp.targets(i))))
232  val if3_prevHalfNotMetRedirect = if3_pendingPrevHalfInstr && !if3_prevHalfInstrMet && if3_nextValidPCNotEquals(if3_prevHalfInstr.bits.npc)
233  val if3_predTakenRedirect    = ParallelOR(if3_predTakenRedirectVec)
234  val if3_predNotTakenRedirect = !if3_pendingPrevHalfInstr && !if3_bp.taken && if3_nextValidPCNotEquals(if3_snpc)
235  // when pendingPrevHalfInstr, if3_GHInfo is set to the info of last prev half instr
236  // val if3_ghInfoNotIdenticalRedirect = !if3_pendingPrevHalfInstr && if3_GHInfo =/= if3_lastGHInfo && enableGhistRepair.B
237
238  if3_redirect := if3_valid && (
239                    // prevHalf does not match if3_pc and the next fetch packet is not snpc
240                    if3_prevHalfNotMetRedirect && HasCExtension.B ||
241                    // pred taken and next fetch packet is not the predicted target
242                    if3_predTakenRedirect ||
243                    // pred not taken and next fetch packet is not snpc
244                    if3_predNotTakenRedirect
245                    // GHInfo from last pred does not corresponds with this packet
246                    // if3_ghInfoNotIdenticalRedirect
247                  )
248
249  val if3_target = WireInit(if3_snpc)
250
251  if3_target := Mux1H(Seq((if3_prevHalfNotMetRedirect -> if3_prevHalfInstr.bits.npc),
252                          (if3_predTakenRedirect      -> if3_bp.target),
253                          (if3_predNotTakenRedirect   -> if3_snpc)))
254
255  npcGen.register(if3_redirect, if3_target, Some("if3_target"))
256
257
258  //********************** IF4 ****************************//
259  val ftqEnqBuf_ready = Wire(Bool())
260  val if4_ftqEnqPtr = Wire(new FtqPtr)
261  val if4_pd = RegEnable(icache.io.pd_out, if3_fire)
262  val if4_ipf = RegEnable(icacheResp.ipf || if3_prevHalfInstrMet && if3_prevHalfInstr.bits.ipf, if3_fire)
263  val if4_acf = RegEnable(icacheResp.acf, if3_fire)
264  val if4_crossPageIPF = RegEnable(crossPageIPF, if3_fire)
265  val if4_valid = RegInit(false.B)
266  val if4_fire = if4_valid && io.fetchPacket.ready && ftqEnqBuf_ready
267  val if4_pc = RegEnable(if3_pc, if3_fire)
268  val if4_snpc = RegEnable(if3_snpc, if3_fire)
269  // This is the real mask given from icache
270  val if4_mask = RegEnable(icacheResp.mask, if3_fire)
271
272
273  val if4_predHist = RegEnable(if3_predHist, enable=if3_fire)
274  // wait until prevHalfInstr written into reg
275  if4_ready := (io.fetchPacket.ready && !hasPrevHalfInstrReq && ftqEnqBuf_ready || !if4_valid) && GTimer() > 500.U
276  when (if4_flush) {
277    if4_valid := false.B
278  }.elsewhen (if3_fire && !if3_flush) {
279    if4_valid := Mux(if3_pendingPrevHalfInstr, if3_prevHalfInstrMet, true.B)
280  }.elsewhen (if4_fire) {
281    if4_valid := false.B
282  }
283
284  val if4_bp = Wire(new BranchPrediction)
285  if4_bp := bpu.io.out(2)
286
287  if4_predicted_gh := if4_gh.update(if4_bp.hasNotTakenBrs, if4_bp.takenOnBr)
288
289  def jal_offset(inst: UInt, rvc: Bool): SInt = {
290    Mux(rvc,
291      Cat(inst(12), inst(8), inst(10, 9), inst(6), inst(7), inst(2), inst(11), inst(5, 3), 0.U(1.W)).asSInt(),
292      Cat(inst(31), inst(19, 12), inst(20), inst(30, 21), 0.U(1.W)).asSInt()
293    )
294  }
295  def br_offset(inst: UInt, rvc: Bool): SInt = {
296    Mux(rvc,
297      Cat(inst(12), inst(6, 5), inst(2), inst(11, 10), inst(4, 3), 0.U(1.W)).asSInt,
298      Cat(inst(31), inst(7), inst(30, 25), inst(11, 8), 0.U(1.W)).asSInt()
299    )
300  }
301  val if4_instrs = if4_pd.instrs
302  val if4_jals = if4_bp.jalMask
303  val if4_jal_tgts = VecInit((0 until PredictWidth).map(i => (if4_pd.pc(i).asSInt + jal_offset(if4_instrs(i), if4_pd.pd(i).isRVC)).asUInt))
304  val if4_brs = if4_bp.brMask
305  val if4_br_tgts = VecInit((0 until PredictWidth).map(i => (if4_pd.pc(i).asSInt + br_offset(if4_instrs(i), if4_pd.pd(i).isRVC)).asUInt))
306  (0 until PredictWidth).foreach {i =>
307    when (if4_jals(i)) {
308      if4_bp.targets(i) := if4_jal_tgts(i)
309    }.elsewhen (if4_brs(i)) {
310      if4_bp.targets(i) := if4_br_tgts(i)
311    }
312  }
313
314  // we need this to tell BPU the prediction of prev half
315  // because the prediction is with the start of each inst
316  val if4_prevHalfInstr = RegInit(0.U.asTypeOf(ValidUndirectioned(new PrevHalfInstr)))
317  val if4_pendingPrevHalfInstr = if4_prevHalfInstr.valid && HasCExtension.B
318  val if4_prevHalfInstrMet = if4_pendingPrevHalfInstr && if4_valid
319  val if4_prevHalfConsumed = if4_prevHalfInstrMet && if4_fire
320  val if4_prevHalfFlush = if4_flush
321
322  when (if4_prevHalfFlush) {
323    if4_prevHalfInstr.valid := false.B
324  }.elsewhen (if3_prevHalfConsumed) {
325    if4_prevHalfInstr.valid := if3_prevHalfInstr.valid
326  }.elsewhen (if4_prevHalfConsumed) {
327    if4_prevHalfInstr.valid := false.B
328  }
329
330  when (if3_prevHalfConsumed) {
331    if4_prevHalfInstr.bits := if3_prevHalfInstr.bits
332  }
333
334  prevHalfInstrReq.valid := if4_fire && if4_bp.saveHalfRVI && HasCExtension.B
335
336  // // this is result of the last half RVI
337  prevHalfInstrReq.bits.pc := if4_pd.pc(PredictWidth-1)
338  prevHalfInstrReq.bits.npc := snpc(if4_pc)
339  prevHalfInstrReq.bits.instr := if4_pd.instrs(PredictWidth-1)(15, 0)
340  prevHalfInstrReq.bits.ipf := if4_ipf
341
342  class IF4_PC_COMP extends XSModule {
343    val io = IO(new Bundle {
344      val if2_pc = Input(UInt(VAddrBits.W))
345      val if3_pc = Input(UInt(VAddrBits.W))
346      val pc     = Input(UInt(VAddrBits.W))
347      val if2_valid = Input(Bool())
348      val if3_valid = Input(Bool())
349      val res = Output(Bool())
350    })
351    io.res := io.if3_valid  && io.if3_pc =/= io.pc ||
352              !io.if3_valid && (io.if2_valid && io.if2_pc =/= io.pc) ||
353              !io.if3_valid && !io.if2_valid
354  }
355  def if4_nextValidPCNotEquals(pc: UInt) = {
356    val comp = Module(new IF4_PC_COMP)
357    comp.io.if2_pc := if2_pc
358    comp.io.if3_pc := if3_pc
359    comp.io.pc     := pc
360    comp.io.if2_valid := if2_valid
361    comp.io.if3_valid := if3_valid
362    comp.io.res
363  }
364
365  val if4_predTakenRedirectVec = VecInit((0 until PredictWidth).map(i => if4_bp.takens(i) && if4_nextValidPCNotEquals(if4_bp.targets(i))))
366
367  val if4_prevHalfNextNotMet = hasPrevHalfInstrReq && if4_nextValidPCNotEquals(prevHalfInstrReq.bits.pc+2.U)
368  val if4_predTakenRedirect = ParallelORR(if4_predTakenRedirectVec)
369  val if4_predNotTakenRedirect = !if4_bp.taken && if4_nextValidPCNotEquals(if4_snpc)
370  // val if4_ghInfoNotIdenticalRedirect = if4_GHInfo =/= if4_lastGHInfo && enableGhistRepair.B
371
372  if4_redirect := if4_valid && (
373                    // when if4 has a lastHalfRVI, but the next fetch packet is not snpc
374                    // if4_prevHalfNextNotMet ||
375                    // when if4 preds taken, but the pc of next fetch packet is not the target
376                    if4_predTakenRedirect ||
377                    // when if4 preds not taken, but the pc of next fetch packet is not snpc
378                    if4_predNotTakenRedirect
379                    // GHInfo from last pred does not corresponds with this packet
380                    // if4_ghInfoNotIdenticalRedirect
381                  )
382
383  val if4_target = WireInit(if4_snpc)
384
385  if4_target := Mux(if4_bp.taken, if4_bp.target, if4_snpc)
386
387  npcGen.register(if4_redirect, if4_target, Some("if4_target"))
388
389  when (if4_fire) {
390    final_gh := if4_predicted_gh
391  }
392  if4_gh := Mux(flush_final_gh, final_gh_bypass, final_gh)
393  if3_gh := Mux(if4_valid && !if4_flush, if4_predicted_gh, if4_gh)
394  if2_gh := Mux(if3_valid && !if3_flush, if3_predicted_gh, if3_gh)
395  if1_gh := Mux(if2_valid && !if2_flush, if2_predicted_gh, if2_gh)
396
397  // ***************** Ftq enq buffer ********************
398  val toFtqBuf = Wire(new FtqEntry)
399  val ftqEnqBuf = RegEnable(toFtqBuf, enable=if4_fire)
400  val ftqEnqBuf_valid = RegInit(false.B)
401  val ftqLeftOne = WireInit(false.B) // TODO: to be replaced
402  ftqEnqBuf_ready := io.toFtq.ready && !(io.ftqLeftOne && ftqEnqBuf_valid)
403  if4_ftqEnqPtr := Mux(ftqEnqBuf_valid, io.ftqEnqPtr+1.U, io.ftqEnqPtr)
404  when (io.redirect.valid)  { ftqEnqBuf_valid := false.B }
405  .elsewhen (if4_fire)      { ftqEnqBuf_valid := true.B }
406  .elsewhen (io.toFtq.fire) { ftqEnqBuf_valid := false.B }
407
408  io.toFtq.valid := ftqEnqBuf_valid
409  io.toFtq.bits  := ftqEnqBuf
410
411  toFtqBuf := DontCare
412  toFtqBuf.ftqPC    := if4_pc
413  toFtqBuf.lastPacketPC.valid := if4_pendingPrevHalfInstr
414  toFtqBuf.lastPacketPC.bits  := if4_prevHalfInstr.bits.pc
415
416  toFtqBuf.hist     := final_gh
417  toFtqBuf.predHist := if4_predHist.asTypeOf(new GlobalHistory)
418  toFtqBuf.rasSp    := bpu.io.brInfo.rasSp
419  toFtqBuf.rasTop   := bpu.io.brInfo.rasTop
420  toFtqBuf.specCnt  := bpu.io.brInfo.specCnt
421  toFtqBuf.metas    := bpu.io.brInfo.metas
422
423  // For perf counters
424  toFtqBuf.pd    := if4_pd.pd
425
426
427  val if4_jmpIdx = WireInit(if4_bp.jmpIdx)
428  val if4_taken = WireInit(if4_bp.taken)
429  val if4_real_valids = if4_pd.mask &
430    (Fill(PredictWidth, !if4_taken) |
431      (Fill(PredictWidth, 1.U(1.W)) >> (~if4_jmpIdx)))
432
433  val cfiIsCall = if4_pd.pd(if4_jmpIdx).isCall
434  val cfiIsRet  = if4_pd.pd(if4_jmpIdx).isRet
435  val cfiIsRVC  = if4_pd.pd(if4_jmpIdx).isRVC
436  toFtqBuf.cfiIsCall := cfiIsCall
437  toFtqBuf.cfiIsRet  := cfiIsRet
438  toFtqBuf.cfiIsRVC  := cfiIsRVC
439  toFtqBuf.cfiIndex.valid := if4_taken
440  toFtqBuf.cfiIndex.bits  := if4_jmpIdx
441
442  toFtqBuf.br_mask   := if4_bp.brMask.asTypeOf(Vec(PredictWidth, Bool()))
443  toFtqBuf.rvc_mask  := VecInit(if4_pd.pd.map(_.isRVC))
444  toFtqBuf.valids    := if4_real_valids.asTypeOf(Vec(PredictWidth, Bool()))
445  toFtqBuf.target := Mux(if4_taken, if4_target, if4_snpc)
446
447
448
449  val r = io.redirect
450  val cfiUpdate = io.redirect.bits.cfiUpdate
451  when (r.valid) {
452    val isMisPred = r.bits.level === 0.U
453    val b = cfiUpdate
454    val oldGh = b.hist
455    val sawNTBr = b.sawNotTakenBranch
456    val isBr = b.pd.isBr
457    val taken = Mux(isMisPred, b.taken, b.predTaken)
458    val updatedGh = oldGh.update(sawNTBr, isBr && taken)
459    final_gh := updatedGh
460    final_gh_bypass := updatedGh
461    flush_final_gh := true.B
462  }
463
464  npcGen.register(io.redirect.valid, io.redirect.bits.cfiUpdate.target, Some("backend_redirect"))
465  npcGen.register(RegNext(reset.asBool) && !reset.asBool, resetVector.U(VAddrBits.W), Some("reset_vector"))
466
467  if1_npc := npcGen()
468
469
470  icache.io.req.valid := if1_can_go
471  icache.io.resp.ready := if4_ready
472  icache.io.req.bits.addr := if1_npc
473  icache.io.req.bits.mask := mask(if1_npc)
474  icache.io.flush := Cat(if3_flush, if2_flush)
475  icache.io.mem_grant <> io.icacheMemGrant
476  icache.io.fencei := io.fencei
477  icache.io.prev.valid := if3_prevHalfInstrMet
478  icache.io.prev.bits := if3_prevHalfInstr.bits.instr
479  icache.io.prev_ipf := if3_prevHalfInstr.bits.ipf
480  icache.io.prev_pc := if3_prevHalfInstr.bits.pc
481  icache.io.mmio_acquire <> io.mmio_acquire
482  icache.io.mmio_grant <> io.mmio_grant
483  icache.io.mmio_flush <> io.mmio_flush
484  io.icacheMemAcq <> icache.io.mem_acquire
485  io.l1plusFlush := icache.io.l1plusflush
486  io.prefetchTrainReq := icache.io.prefetchTrainReq
487
488  bpu.io.ctrl := RegNext(io.bp_ctrl)
489  bpu.io.commit <> io.commitUpdate
490  bpu.io.redirect <> io.redirect
491
492  bpu.io.inFire(0) := if1_can_go
493  bpu.io.inFire(1) := if2_fire
494  bpu.io.inFire(2) := if3_fire
495  bpu.io.inFire(3) := if4_fire
496  bpu.io.in.pc := if1_npc
497  bpu.io.in.hist := if1_gh.asUInt
498  bpu.io.in.inMask := mask(if1_npc)
499  bpu.io.predecode.mask := if4_pd.mask
500  bpu.io.predecode.lastHalf := if4_pd.lastHalf
501  bpu.io.predecode.pd := if4_pd.pd
502  bpu.io.predecode.hasLastHalfRVI := if4_prevHalfInstrMet
503
504
505  when (if3_prevHalfInstrMet && icacheResp.ipf && !if3_prevHalfInstr.bits.ipf) {
506    crossPageIPF := true.B // higher 16 bits page fault
507  }
508
509  val fetchPacketValid = if4_valid && !io.redirect.valid && ftqEnqBuf_ready
510  val fetchPacketWire = Wire(new FetchPacket)
511
512  fetchPacketWire.mask := if4_real_valids
513  //RVC expand
514  val expandedInstrs = Wire(Vec(PredictWidth, UInt(32.W)))
515  for(i <- 0 until PredictWidth){
516      val expander = Module(new RVCExpander)
517      expander.io.in := if4_pd.instrs(i)
518      expandedInstrs(i) := expander.io.out.bits
519  }
520  fetchPacketWire.instrs := expandedInstrs
521
522  fetchPacketWire.pc := if4_pd.pc
523
524  fetchPacketWire.pdmask := if4_pd.mask
525  fetchPacketWire.pd := if4_pd.pd
526  fetchPacketWire.ipf := if4_ipf
527  fetchPacketWire.acf := if4_acf
528  fetchPacketWire.crossPageIPFFix := if4_crossPageIPF
529  fetchPacketWire.ftqPtr := if4_ftqEnqPtr
530
531  // predTaken Vec
532  fetchPacketWire.pred_taken := if4_bp.takens
533
534  io.fetchPacket.bits := fetchPacketWire
535  io.fetchPacket.valid := fetchPacketValid
536
537//  if(IFUDebug) {
538  // if (!env.FPGAPlatform) {
539  //   val predictor_s3 = RegEnable(Mux(if3_redirect, 1.U(log2Up(4).W), 0.U(log2Up(4).W)), if3_fire)
540  //   val predictor_s4 = Mux(if4_redirect, 2.U, predictor_s3)
541  //   val predictor = predictor_s4
542  //   toFtqBuf.metas.map(_.predictor := predictor)
543  // }
544 // }
545
546  // val predRight = cfiUpdate.valid && !cfiUpdate.bits.isMisPred && !cfiUpdate.bits.isReplay
547  // val predWrong = cfiUpdate.valid && cfiUpdate.bits.isMisPred && !cfiUpdate.bits.isReplay
548
549  // val ubtbRight = predRight && cfiUpdate.bits.bpuMeta.predictor === 0.U
550  // val ubtbWrong = predWrong && cfiUpdate.bits.bpuMeta.predictor === 0.U
551  // val btbRight  = predRight && cfiUpdate.bits.bpuMeta.predictor === 1.U
552  // val btbWrong  = predWrong && cfiUpdate.bits.bpuMeta.predictor === 1.U
553  // val tageRight = predRight && cfiUpdate.bits.bpuMeta.predictor === 2.U
554  // val tageWrong = predWrong && cfiUpdate.bits.bpuMeta.predictor === 2.U
555  // val loopRight = predRight && cfiUpdate.bits.bpuMeta.predictor === 3.U
556  // val loopWrong = predWrong && cfiUpdate.bits.bpuMeta.predictor === 3.U
557
558  // ExcitingUtils.addSource(ubtbRight, "perfCntubtbRight", Perf)
559  // ExcitingUtils.addSource(ubtbWrong, "perfCntubtbWrong", Perf)
560  // ExcitingUtils.addSource(btbRight, "perfCntbtbRight", Perf)
561  // ExcitingUtils.addSource(btbWrong, "perfCntbtbWrong", Perf)
562  // ExcitingUtils.addSource(tageRight, "perfCnttageRight", Perf)
563  // ExcitingUtils.addSource(tageWrong, "perfCnttageWrong", Perf)
564  // ExcitingUtils.addSource(loopRight, "perfCntloopRight", Perf)
565  // ExcitingUtils.addSource(loopWrong, "perfCntloopWrong", Perf)
566
567  if (!env.FPGAPlatform && env.EnablePerfDebug) {
568    val predictor_s3 = RegEnable(Mux(if3_redirect, 1.U(log2Up(4).W), 0.U(log2Up(4).W)), if3_fire)
569    val predictor_s4 = Mux(if4_redirect, 2.U, predictor_s3)
570    val predictor = predictor_s4
571    toFtqBuf.metas.map(_.predictor := predictor)
572
573    // val ubtbAns = WireInit(VecInit(Seq.fill(PredictWidth) {0.U.asTypeOf(new PredictorAnswer)} ))
574    // val btbAns = WireInit(VecInit(Seq.fill(PredictWidth) {0.U.asTypeOf(new PredictorAnswer)} ))
575    // val bimResp = WireInit(VecInit(Seq.fill(PredictWidth) {false.B} ))
576    // val tageAns = WireInit(VecInit(Seq.fill(PredictWidth) {0.U.asTypeOf(new PredictorAnswer)} ))
577    // val rasAns = WireInit(0.U.asTypeOf(new PredictorAnswer))
578    // val loopAns = WireInit(VecInit(Seq.fill(PredictWidth) {0.U.asTypeOf(new PredictorAnswer)} ))
579
580    // ExcitingUtils.addSink(ubtbAns, "ubtbAns")
581    // ExcitingUtils.addSink(btbAns, "btbAns")
582    // ExcitingUtils.addSink(bimResp, "bimResp")
583    // ExcitingUtils.addSink(tageAns, "tageAns")
584    // ExcitingUtils.addSink(rasAns, "rasAns")
585    // // ExcitingUtils.addSink(loopAns, "loopAns")
586
587    // val ubtbAns_s3 = RegEnable(ubtbAns, if2_fire)
588    // val ubtbAns_s4 = RegEnable(ubtbAns_s3, if3_fire)
589
590    // val btbAns_s3 = RegEnable(btbAns, if2_fire)
591    // val btbAns_s4 = RegEnable(btbAns_s3, if3_fire)
592    // val bimResp_s3 = RegEnable(bimResp, if2_fire)
593    // val bimResp_s4 = RegEnable(bimResp_s3, if3_fire)
594
595    toFtqBuf.metas.zipWithIndex.foreach{ case(x,i) =>
596      x.predictor := predictor
597
598      // x.ubtbAns := ubtbAns_s4(i)
599      // x.btbAns := btbAns_s4(i)
600      // x.btbAns.taken := bimResp_s4(i)
601      // x.tageAns := tageAns(i)
602      // x.rasAns := rasAns // Is this right?
603      // x.loopAns := loopAns(i)
604
605      x.ubtbAns := bpu.io.brInfo.metas(i).ubtbAns
606      x.btbAns := bpu.io.brInfo.metas(i).btbAns
607      x.tageAns := bpu.io.brInfo.metas(i).tageAns
608      x.rasAns := bpu.io.brInfo.metas(i).rasAns // Is this right?
609      x.loopAns := bpu.io.brInfo.metas(i).loopAns
610    }
611  }
612
613  // debug info
614  if (IFUDebug) {
615    XSDebug(RegNext(reset.asBool) && !reset.asBool, "Reseting...\n")
616    XSDebug(icache.io.flush(0).asBool, "Flush icache stage2...\n")
617    XSDebug(icache.io.flush(1).asBool, "Flush icache stage3...\n")
618    XSDebug(io.redirect.valid, p"Redirect from backend! target=${Hexadecimal(io.redirect.bits.cfiUpdate.target)}\n")
619
620    XSDebug("[IF1] v=%d     fire=%d  cango=%d          flush=%d pc=%x mask=%b\n", if1_valid, if1_fire,if1_can_go, if1_flush, if1_npc, mask(if1_npc))
621    XSDebug("[IF2] v=%d r=%d fire=%d redirect=%d flush=%d pc=%x snpc=%x\n", if2_valid, if2_ready, if2_fire, if2_redirect, if2_flush, if2_pc, if2_snpc)
622    XSDebug("[IF3] v=%d r=%d fire=%d redirect=%d flush=%d pc=%x crossPageIPF=%d sawNTBrs=%d\n", if3_valid, if3_ready, if3_fire, if3_redirect, if3_flush, if3_pc, crossPageIPF, if3_bp.hasNotTakenBrs)
623    XSDebug("[IF4] v=%d r=%d fire=%d redirect=%d flush=%d pc=%x crossPageIPF=%d sawNTBrs=%d\n", if4_valid, if4_ready, if4_fire, if4_redirect, if4_flush, if4_pc, if4_crossPageIPF, if4_bp.hasNotTakenBrs)
624    XSDebug("[IF1][icacheReq] v=%d r=%d addr=%x\n", icache.io.req.valid, icache.io.req.ready, icache.io.req.bits.addr)
625    XSDebug("[IF1][ghr] hist=%b\n", if1_gh.asUInt)
626    XSDebug("[IF1][ghr] extHist=%b\n\n", if1_gh.asUInt)
627
628    XSDebug("[IF2][bp] taken=%d jmpIdx=%d hasNTBrs=%d target=%x saveHalfRVI=%d\n\n", if2_bp.taken, if2_bp.jmpIdx, if2_bp.hasNotTakenBrs, if2_bp.target, if2_bp.saveHalfRVI)
629    if2_gh.debug("if2")
630
631    XSDebug("[IF3][icacheResp] v=%d r=%d pc=%x mask=%b\n", icache.io.resp.valid, icache.io.resp.ready, icache.io.resp.bits.pc, icache.io.resp.bits.mask)
632    XSDebug("[IF3][bp] taken=%d jmpIdx=%d hasNTBrs=%d target=%x saveHalfRVI=%d\n", if3_bp.taken, if3_bp.jmpIdx, if3_bp.hasNotTakenBrs, if3_bp.target, if3_bp.saveHalfRVI)
633    XSDebug("[IF3][redirect]: v=%d, prevNMet=%d, predT=%d, predNT=%d\n", if3_redirect, if3_prevHalfNotMetRedirect, if3_predTakenRedirect, if3_predNotTakenRedirect)
634    // XSDebug("[IF3][prevHalfInstr] v=%d redirect=%d fetchpc=%x idx=%d tgt=%x taken=%d instr=%x\n\n",
635    //   prev_half_valid, prev_half_redirect, prev_half_fetchpc, prev_half_idx, prev_half_tgt, prev_half_taken, prev_half_instr)
636    XSDebug("[IF3][if3_prevHalfInstr] v=%d pc=%x npc=%x  instr=%x ipf=%d\n\n",
637    if3_prevHalfInstr.valid, if3_prevHalfInstr.bits.pc, if3_prevHalfInstr.bits.npc, if3_prevHalfInstr.bits.instr, if3_prevHalfInstr.bits.ipf)
638    if3_gh.debug("if3")
639
640    XSDebug("[IF4][predecode] mask=%b\n", if4_pd.mask)
641    XSDebug("[IF4][snpc]: %x, realMask=%b\n", if4_snpc, if4_mask)
642    XSDebug("[IF4][bp] taken=%d jmpIdx=%d hasNTBrs=%d target=%x saveHalfRVI=%d\n", if4_bp.taken, if4_bp.jmpIdx, if4_bp.hasNotTakenBrs, if4_bp.target, if4_bp.saveHalfRVI)
643    XSDebug("[IF4][redirect]: v=%d, prevNotMet=%d, predT=%d, predNT=%d\n", if4_redirect, if4_prevHalfNextNotMet, if4_predTakenRedirect, if4_predNotTakenRedirect)
644    XSDebug(if4_pd.pd(if4_bp.jmpIdx).isJal && if4_bp.taken, "[IF4] cfi is jal!  instr=%x target=%x\n", if4_instrs(if4_bp.jmpIdx), if4_jal_tgts(if4_bp.jmpIdx))
645    XSDebug("[IF4][ prevHalfInstrReq] v=%d pc=%x npc=%x instr=%x ipf=%d\n",
646      prevHalfInstrReq.valid, prevHalfInstrReq.bits.pc, prevHalfInstrReq.bits.npc, prevHalfInstrReq.bits.instr, prevHalfInstrReq.bits.ipf)
647    XSDebug("[IF4][if4_prevHalfInstr] v=%d pc=%x npc=%x instr=%x ipf=%d\n",
648      if4_prevHalfInstr.valid, if4_prevHalfInstr.bits.pc, if4_prevHalfInstr.bits.npc, if4_prevHalfInstr.bits.instr, if4_prevHalfInstr.bits.ipf)
649    if4_gh.debug("if4")
650    XSDebug(io.fetchPacket.fire(), "[IF4][fetchPacket] v=%d r=%d mask=%b ipf=%d acf=%d crossPageIPF=%d\n",
651      io.fetchPacket.valid, io.fetchPacket.ready, io.fetchPacket.bits.mask, io.fetchPacket.bits.ipf, io.fetchPacket.bits.acf, io.fetchPacket.bits.crossPageIPFFix)
652    for (i <- 0 until PredictWidth) {
653      XSDebug(io.fetchPacket.fire(), "[IF4][fetchPacket] %b %x pc=%x pd: rvc=%d brType=%b call=%d ret=%d\n",
654        io.fetchPacket.bits.mask(i),
655        io.fetchPacket.bits.instrs(i),
656        io.fetchPacket.bits.pc(i),
657        io.fetchPacket.bits.pd(i).isRVC,
658        io.fetchPacket.bits.pd(i).brType,
659        io.fetchPacket.bits.pd(i).isCall,
660        io.fetchPacket.bits.pd(i).isRet
661      )
662    }
663    val b = ftqEnqBuf
664    XSDebug("[FtqEnqBuf] v=%d r=%d pc=%x cfiIndex(%d)=%d cfiIsCall=%d cfiIsRet=%d cfiIsRVC=%d\n",
665      ftqEnqBuf_valid, ftqEnqBuf_ready, b.ftqPC, b.cfiIndex.valid, b.cfiIndex.bits, b.cfiIsCall, b.cfiIsRet, b.cfiIsRVC)
666    XSDebug("[FtqEnqBuf] valids=%b br_mask=%b rvc_mask=%b hist=%x predHist=%x rasSp=%d rasTopAddr=%x rasTopCtr=%d\n",
667      b.valids.asUInt, b.br_mask.asUInt, b.rvc_mask.asUInt, b.hist.asUInt, b.predHist.asUInt, b.rasSp, b.rasTop.retAddr, b.rasTop.ctr)
668    XSDebug("[ToFTQ] v=%d r=%d leftOne=%d ptr=%d\n", io.toFtq.valid, io.toFtq.ready, io.ftqLeftOne, io.ftqEnqPtr.value)
669  }
670
671}
672