xref: /XiangShan/src/main/scala/xiangshan/frontend/IFU.scala (revision 6b98c508e8e19ed2866e951962b29ae2ad3337cd)
package xiangshan.frontend

import chisel3._
import chisel3.util._
import device.RAMHelper
import xiangshan._
import utils._
import xiangshan.cache._
import chisel3.experimental.chiselName

trait HasIFUConst extends HasXSParameter {
  val resetVector = 0x80000000L // TODO: set reset vec
  def align(pc: UInt, bytes: Int): UInt = Cat(pc(VAddrBits-1, log2Ceil(bytes)), 0.U(log2Ceil(bytes).W))
  val groupBytes = FetchWidth * 4 * 2 // corresponds to the cache line size
  val groupOffsetBits = log2Ceil(groupBytes)
  val nBanksInPacket = 2
  val bankBytes = PredictWidth * 2 / nBanksInPacket
  val nBanksInGroup = groupBytes / bankBytes
  val bankWidth = PredictWidth / nBanksInPacket
  val bankOffsetBits = log2Ceil(bankBytes)
  // ranges over [0, nBanksInGroup-1]
  def bankInGroup(pc: UInt) = pc(groupOffsetBits-1, bankOffsetBits)
  def isInLastBank(pc: UInt) = bankInGroup(pc) === (nBanksInGroup-1).U
  // ranges over [0, bankBytes/2-1]
  def offsetInBank(pc: UInt) = pc(bankOffsetBits-1, 1)
  def bankAligned(pc: UInt)  = align(pc, bankBytes)
  def groupAligned(pc: UInt) = align(pc, groupBytes)
  // each 1 bit in the mask stands for 2 bytes
  // bankWidth bits, of which at most the upper bankWidth-1 bits can be 0
  def maskFirstHalf(pc: UInt): UInt = ((~(0.U(bankWidth.W))) >> offsetInBank(pc))(bankWidth-1, 0)
  def maskLastHalf(pc: UInt): UInt = Mux(isInLastBank(pc), 0.U(bankWidth.W), ~0.U(bankWidth.W))
  def mask(pc: UInt): UInt = Reverse(Cat(maskFirstHalf(pc), maskLastHalf(pc)))
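  // A worked sketch of mask(), under assumed parameters (e.g. PredictWidth = 16,
  // nBanksInPacket = 2, so bankWidth = 8, bankBytes = 16): for a pc that is
  // 3 halfwords into a non-last bank, offsetInBank(pc) = 3, so
  //   maskFirstHalf = b00011111, maskLastHalf = b11111111,
  // and after Reverse(Cat(...)) the packet mask is b1111_1111_1111_1000:
  // bit i corresponds to halfword i of the two-bank fetch window, and the
  // three halfword slots before the pc are masked off.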
  def snpc(pc: UInt): UInt = bankAligned(pc) + Mux(isInLastBank(pc), bankBytes.U, (bankBytes*2).U)

  val enableGhistRepair = true
  val IFUDebug = true
}

class GlobalHistory extends XSBundle {
  val predHist = UInt(HistoryLength.W)
  // val sawNTBr = Bool()
  // val takenOnBr = Bool()
  // val saveHalfRVI = Bool()
  // def shifted = takenOnBr || sawNTBr
  // def newPtr(ptr: UInt = nowPtr): UInt = Mux(shifted, ptr - 1.U, ptr)
  def update(sawNTBr: Bool, takenOnBr: Bool, hist: UInt = predHist): GlobalHistory = {
    val g = Wire(new GlobalHistory)
    val shifted = takenOnBr || sawNTBr
    g.predHist := Mux(shifted, (hist << 1) | takenOnBr.asUInt, hist)
    g
  }
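  // Example of the update rule: the history only shifts when the packet has a
  // branch outcome worth recording (a taken branch, or at least one not-taken
  // branch). E.g. with predHist = b...0101:
  //   update(sawNTBr = true,  takenOnBr = false) -> b...1010 (shift in 0)
  //   update(sawNTBr = false, takenOnBr = true)  -> b...1011 (shift in 1)
  //   update(sawNTBr = false, takenOnBr = false) -> b...0101 (unchanged)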

  final def === (that: GlobalHistory): Bool = {
    predHist === that.predHist
  }

  final def =/= (that: GlobalHistory): Bool = !(this === that)

  implicit val name = "IFU"
  def debug(where: String) = XSDebug(p"[${where}_GlobalHistory] hist=${Binary(predHist)}\n")
  // override def toString(): String = "histPtr=%d, sawNTBr=%d, takenOnBr=%d, saveHalfRVI=%d".format(histPtr, sawNTBr, takenOnBr, saveHalfRVI)
}


class IFUIO extends XSBundle
{
  // to ibuffer
  val fetchPacket = DecoupledIO(new FetchPacket)
  // from backend
  val redirect = Flipped(ValidIO(UInt(VAddrBits.W)))
  val cfiUpdateInfo = Flipped(ValidIO(new CfiUpdateInfo))
  // to icache
  val icacheMemGrant = Flipped(DecoupledIO(new L1plusCacheResp))
  val fencei = Input(Bool())
  // from icache
  val icacheMemAcq = DecoupledIO(new L1plusCacheReq)
  val l1plusFlush = Output(Bool())
  // to tlb
  val sfence = Input(new SfenceBundle)
  val tlbCsr = Input(new TlbCsrBundle)
  // from tlb
  val ptw = new TlbPtwIO
}

class PrevHalfInstr extends XSBundle {
  val taken = Bool()
  val ghInfo = new GlobalHistory()
  val fetchpc = UInt(VAddrBits.W) // only for debug
  val idx = UInt(VAddrBits.W) // only for debug
  val pc = UInt(VAddrBits.W)
  val npc = UInt(VAddrBits.W)
  val target = UInt(VAddrBits.W)
  val instr = UInt(16.W)
  val ipf = Bool()
  val meta = new BpuMeta
  // val newPtr = UInt(log2Up(ExtHistoryLength).W)
}

@chiselName
class IFU extends XSModule with HasIFUConst
{
  val io = IO(new IFUIO)
  val bpu = BPU(EnableBPU)
  val icache = Module(new ICache)

  io.ptw <> TLB(
    in = Seq(icache.io.tlb),
    sfence = io.sfence,
    csr = io.tlbCsr,
    width = 1,
    isDtlb = false,
    shouldBlock = true
  )

  val if2_redirect, if3_redirect, if4_redirect = WireInit(false.B)
  val if1_flush, if2_flush, if3_flush, if4_flush = WireInit(false.B)

  val icacheResp = icache.io.resp.bits

  if4_flush := io.redirect.valid
  if3_flush := if4_flush || if4_redirect
  if2_flush := if3_flush || if3_redirect
  if1_flush := if2_flush || if2_redirect
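  // Flushes propagate backwards: a backend redirect flushes IF4, and a flush
  // or redirect in a given stage flushes every earlier stage, so younger
  // (wrong-path) fetches are squashed while the redirecting stage itself
  // keeps its own result.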

  //********************** IF1 ****************************//
  val if1_valid = !reset.asBool && GTimer() > 500.U
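  // The GTimer() > 500.U guard holds fetch off for the first ~500 cycles after
  // reset (presumably to let the caches and BPU tables initialize); the same
  // guard reappears in if4_ready below.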
  val if1_npc = WireInit(0.U(VAddrBits.W))
  val if2_ready = WireInit(false.B)
  val if2_allReady = WireInit(if2_ready && icache.io.req.ready)
  val if1_fire = if1_valid && (if2_allReady || if2_flush)


  // val if2_newPtr, if3_newPtr, if4_newPtr = Wire(UInt(log2Up(ExtHistoryLength).W))

  val if1_gh, if2_gh, if3_gh, if4_gh = Wire(new GlobalHistory)
  val if2_predicted_gh, if3_predicted_gh, if4_predicted_gh = Wire(new GlobalHistory)
  val final_gh = RegInit(0.U.asTypeOf(new GlobalHistory))
  val final_gh_bypass = WireInit(0.U.asTypeOf(new GlobalHistory))
  val flush_final_gh = WireInit(false.B)

  //********************** IF2 ****************************//
  val if2_valid = RegInit(init = false.B)
  val if2_allValid = if2_valid && icache.io.tlb.resp.valid
  val if3_ready = WireInit(false.B)
  val if2_fire = if2_allValid && if3_ready
  val if2_pc = RegEnable(next = if1_npc, init = resetVector.U, enable = if1_fire)
  val if2_snpc = snpc(if2_pc)
  val if2_predHist = RegEnable(if1_gh.predHist, enable = if1_fire)
  if2_ready := if3_ready && icache.io.tlb.resp.valid || !if2_valid
  when (if1_fire)       { if2_valid := true.B }
  .elsewhen (if2_flush) { if2_valid := false.B }
  .elsewhen (if2_fire)  { if2_valid := false.B }
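  // Standard pipeline valid bookkeeping: set on an IF1 fire, cleared on a
  // flush, and cleared when the packet moves on to IF3 without being refilled
  // in the same cycle (if1_fire has priority in the when-chain above).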

  val npcGen = new PriorityMuxGenerator[UInt]
  npcGen.register(true.B, RegNext(if1_npc), Some("stallPC"))
  // npcGen.register(if2_fire, if2_snpc, Some("if2_snpc"))
  val if2_bp = bpu.io.out(0)

  // if taken, bp_redirect should be true
  // when taken on a half RVI, we suppress this redirect signal
  // if2_redirect := if2_valid
  npcGen.register(if2_valid, Mux(if2_bp.taken, if2_bp.target, if2_snpc), Some("if2_target"))

  if2_predicted_gh := if2_gh.update(if2_bp.hasNotTakenBrs, if2_bp.takenOnBr)

  //********************** IF3 ****************************//
  // IF3 should wait for the instruction resp to arrive
  val if3_valid = RegInit(init = false.B)
  val if4_ready = WireInit(false.B)
  val if3_allValid = if3_valid && icache.io.resp.valid
  val if3_fire = if3_allValid && if4_ready
  val if3_pc = RegEnable(if2_pc, if2_fire)
  val if3_snpc = RegEnable(if2_snpc, if2_fire)
  val if3_predHist = RegEnable(if2_predHist, enable = if2_fire)
  if3_ready := if4_ready && icache.io.resp.valid || !if3_valid
  when (if3_flush) {
    if3_valid := false.B
  }.elsewhen (if2_fire && !if2_flush) {
    if3_valid := true.B
  }.elsewhen (if3_fire) {
    if3_valid := false.B
  }

  val if3_bp = bpu.io.out(1)
  if3_predicted_gh := if3_gh.update(if3_bp.hasNotTakenBrs, if3_bp.takenOnBr)


  val prevHalfInstrReq = WireInit(0.U.asTypeOf(ValidUndirectioned(new PrevHalfInstr)))
  // only valid when if4_fire
  val hasPrevHalfInstrReq = prevHalfInstrReq.valid

  val if3_prevHalfInstr = RegInit(0.U.asTypeOf(ValidUndirectioned(new PrevHalfInstr)))

  // a 32-bit instr crosses 2 pages, and the higher 16 bits trigger a page fault
  val crossPageIPF = WireInit(false.B)

  val if3_pendingPrevHalfInstr = if3_prevHalfInstr.valid

  // the first half of an RVI instruction waits until it meets its other half
  val if3_prevHalfInstrMet = if3_pendingPrevHalfInstr && if3_prevHalfInstr.bits.npc === if3_pc && if3_valid
  // set to invalid once consumed or on a redirect from the backend
  val if3_prevHalfConsumed = if3_prevHalfInstrMet && if3_fire
  val if3_prevHalfFlush = if4_flush
  when (if3_prevHalfFlush) {
    if3_prevHalfInstr.valid := false.B
  }.elsewhen (hasPrevHalfInstrReq) {
    if3_prevHalfInstr.valid := true.B
  }.elsewhen (if3_prevHalfConsumed) {
    if3_prevHalfInstr.valid := false.B
  }
  when (hasPrevHalfInstrReq) {
    if3_prevHalfInstr.bits := prevHalfInstrReq.bits
  }
  // when bp signals a redirect, we distinguish between taken and not taken
  // if taken and saveHalfRVI is true, we do not redirect to the target

  class IF3_PC_COMP extends XSModule {
    val io = IO(new Bundle {
      val if2_pc = Input(UInt(VAddrBits.W))
      val pc     = Input(UInt(VAddrBits.W))
      val if2_valid = Input(Bool())
      val res = Output(Bool())
    })
    io.res := !io.if2_valid || io.if2_valid && io.if2_pc =/= io.pc
  }
  def if3_nextValidPCNotEquals(pc: UInt) = {
    val comp = Module(new IF3_PC_COMP)
    comp.io.if2_pc := if2_pc
    comp.io.pc     := pc
    comp.io.if2_valid := if2_valid
    comp.io.res
  }
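  // The comparison is wrapped in a small module rather than inlined,
  // presumably so each use instantiates a distinct comparator in the design
  // hierarchy. Semantically, res is true when the next packet (whatever IF2
  // currently holds, if anything) does not match the pc IF3 expects.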

  val if3_predTakenRedirectVec = VecInit((0 until PredictWidth).map(i => !if3_pendingPrevHalfInstr && if3_bp.realTakens(i) && if3_nextValidPCNotEquals(if3_bp.targets(i))))
  val if3_prevHalfMetRedirect    = if3_pendingPrevHalfInstr && if3_prevHalfInstrMet && if3_prevHalfInstr.bits.taken && if3_nextValidPCNotEquals(if3_prevHalfInstr.bits.target)
  val if3_prevHalfNotMetRedirect = if3_pendingPrevHalfInstr && !if3_prevHalfInstrMet && if3_nextValidPCNotEquals(if3_prevHalfInstr.bits.npc)
  val if3_predTakenRedirect    = ParallelPriorityMux(if3_bp.realTakens, if3_predTakenRedirectVec)
  val if3_predNotTakenRedirect = !if3_pendingPrevHalfInstr && !if3_bp.taken && if3_nextValidPCNotEquals(if3_snpc)
  // when pendingPrevHalfInstr, if3_GHInfo is set to the info of the last prev half instr
  // val if3_ghInfoNotIdenticalRedirect = !if3_pendingPrevHalfInstr && if3_GHInfo =/= if3_lastGHInfo && enableGhistRepair.B

  if3_redirect := if3_valid && (
                    // prevHalf is consumed but the next packet is not where it was meant to be
                    // we do not handle this condition because of the burden of building a correct GHInfo
                    // prevHalfMetRedirect ||
                    // prevHalf does not match if3_pc and the next fetch packet is not snpc
                    if3_prevHalfNotMetRedirect ||
                    // pred taken and the next fetch packet is not the predicted target
                    if3_predTakenRedirect ||
                    // pred not taken and the next fetch packet is not snpc
                    if3_predNotTakenRedirect
                    // GHInfo from the last pred does not correspond to this packet
                    // if3_ghInfoNotIdenticalRedirect
                  )

  val if3_target = WireInit(if3_snpc)

  /* when (prevHalfMetRedirect) {
    if1_npc := if3_prevHalfInstr.target
  }.else */
  if3_target := Mux1H(Seq((if3_prevHalfNotMetRedirect -> if3_prevHalfInstr.bits.npc),
                          (if3_predTakenRedirect      -> if3_bp.target),
                          (if3_predNotTakenRedirect   -> if3_snpc)))
  // }.elsewhen (if3_ghInfoNotIdenticalRedirect) {
  //   if3_target := Mux(if3_bp.taken, if3_bp.target, snpc(if3_pc))
  // }
268
269  // when (if3_redirect) {
270  //   if1_npc := if3_target
271  // }
272
273  //********************** IF4 ****************************//
274  val if4_pd = RegEnable(icache.io.pd_out, if3_fire)
275  val if4_ipf = RegEnable(icacheResp.ipf || if3_prevHalfInstrMet && if3_prevHalfInstr.bits.ipf, if3_fire)
276  val if4_acf = RegEnable(icacheResp.acf, if3_fire)
277  val if4_crossPageIPF = RegEnable(crossPageIPF, if3_fire)
278  val if4_valid = RegInit(false.B)
279  val if4_fire = if4_valid && io.fetchPacket.ready
280  val if4_pc = RegEnable(if3_pc, if3_fire)
281  val if4_snpc = RegEnable(if3_snpc, if3_fire)
282  // This is the real mask given from icache
283  val if4_mask = RegEnable(icacheResp.mask, if3_fire)
284
285
286  val if4_predHist = RegEnable(if3_predHist, enable=if3_fire)
287  // wait until prevHalfInstr written into reg
288  if4_ready := (io.fetchPacket.ready && !hasPrevHalfInstrReq || !if4_valid) && GTimer() > 500.U
289  when (if4_flush) {
290    if4_valid := false.B
291  }.elsewhen (if3_fire && !if3_flush) {
292    if4_valid := Mux(if3_pendingPrevHalfInstr, if3_prevHalfInstrMet, true.B)
293  }.elsewhen (if4_fire) {
294    if4_valid := false.B
295  }
296
297  val if4_bp = Wire(new BranchPrediction)
298  if4_bp := bpu.io.out(2)
299
300  if4_predicted_gh := if4_gh.update(if4_bp.hasNotTakenBrs, if4_bp.takenOnBr)
301
302  def cal_jal_tgt(inst: UInt, rvc: Bool): UInt = {
303    Mux(rvc,
304      SignExt(Cat(inst(12), inst(8), inst(10, 9), inst(6), inst(7), inst(2), inst(11), inst(5, 3), 0.U(1.W)), XLEN),
305      SignExt(Cat(inst(31), inst(19, 12), inst(20), inst(30, 21), 0.U(1.W)), XLEN)
306    )
307  }
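  // Both arms reassemble the standard RISC-V jump immediates: the RVC arm is
  // the C.J/C.JAL offset (imm[11|4|9:8|10|6|7|3:1|5] scattered over
  // inst[12:2]), and the other arm is the J-type imm[20|10:1|11|19:12] from
  // inst[31:12], each sign-extended with a trailing 0 bit, since targets are
  // halfword-aligned.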
  val if4_instrs = if4_pd.instrs
  val if4_jals = if4_bp.jalMask
  val if4_jal_tgts = VecInit((0 until PredictWidth).map(i => if4_pd.pc(i) + cal_jal_tgt(if4_instrs(i), if4_pd.pd(i).isRVC)))

  (0 until PredictWidth).foreach { i =>
    when (if4_jals(i)) {
      if4_bp.targets(i) := if4_jal_tgts(i)
    }
  }
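  // For direct jumps the target is fully determined by the instruction bits,
  // so the decoded target overrides whatever the BPU predicted, catching
  // mispredicted or missing BTB entries for JALs without waiting for a
  // BTB update.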

  // we need this to tell the BPU the prediction of the prev half,
  // because predictions are associated with the start of each instruction
  val if4_prevHalfInstr = RegInit(0.U.asTypeOf(ValidUndirectioned(new PrevHalfInstr)))
  val if4_pendingPrevHalfInstr = if4_prevHalfInstr.valid
  val if4_prevHalfInstrMet = if4_pendingPrevHalfInstr && if4_prevHalfInstr.bits.npc === if4_pc && if4_valid
  val if4_prevHalfConsumed = if4_prevHalfInstrMet && if4_fire
  val if4_prevHalfFlush = if4_flush

  val if4_takenPrevHalf = WireInit(if4_prevHalfInstrMet && if4_prevHalfInstr.bits.taken)
  when (if4_prevHalfFlush) {
    if4_prevHalfInstr.valid := false.B
  }.elsewhen (if3_prevHalfConsumed) {
    if4_prevHalfInstr.valid := if3_prevHalfInstr.valid
  }.elsewhen (if4_prevHalfConsumed) {
    if4_prevHalfInstr.valid := false.B
  }

  when (if3_prevHalfConsumed) {
    if4_prevHalfInstr.bits := if3_prevHalfInstr.bits
  }

  prevHalfInstrReq.valid := if4_fire && if4_bp.saveHalfRVI
  val idx = if4_bp.lastHalfRVIIdx

  // this is the result of the last half RVI
  prevHalfInstrReq.bits.taken := if4_bp.lastHalfRVITaken
  prevHalfInstrReq.bits.ghInfo := if4_gh
  prevHalfInstrReq.bits.fetchpc := if4_pc
  prevHalfInstrReq.bits.idx := idx
  prevHalfInstrReq.bits.pc := if4_pd.pc(idx)
  prevHalfInstrReq.bits.npc := if4_pd.pc(idx) + 2.U
  prevHalfInstrReq.bits.target := if4_bp.lastHalfRVITarget
  prevHalfInstrReq.bits.instr := if4_pd.instrs(idx)(15, 0)
  prevHalfInstrReq.bits.ipf := if4_ipf
  prevHalfInstrReq.bits.meta := bpu.io.bpuMeta(idx)

  class IF4_PC_COMP extends XSModule {
    val io = IO(new Bundle {
      val if2_pc = Input(UInt(VAddrBits.W))
      val if3_pc = Input(UInt(VAddrBits.W))
      val pc     = Input(UInt(VAddrBits.W))
      val if2_valid = Input(Bool())
      val if3_valid = Input(Bool())
      val res = Output(Bool())
    })
    io.res := io.if3_valid  && io.if3_pc =/= io.pc ||
              !io.if3_valid && (io.if2_valid && io.if2_pc =/= io.pc) ||
              !io.if3_valid && !io.if2_valid
  }
  def if4_nextValidPCNotEquals(pc: UInt) = {
    val comp = Module(new IF4_PC_COMP)
    comp.io.if2_pc := if2_pc
    comp.io.if3_pc := if3_pc
    comp.io.pc     := pc
    comp.io.if2_valid := if2_valid
    comp.io.if3_valid := if3_valid
    comp.io.res
  }

  val if4_predTakenRedirectVec = VecInit((0 until PredictWidth).map(i => if4_bp.realTakens(i) && if4_nextValidPCNotEquals(if4_bp.targets(i))))

  val if4_prevHalfNextNotMet = hasPrevHalfInstrReq && if4_nextValidPCNotEquals(prevHalfInstrReq.bits.pc + 2.U)
  val if4_predTakenRedirect = ParallelPriorityMux(if4_bp.realTakens, if4_predTakenRedirectVec)
  val if4_predNotTakenRedirect = !if4_bp.taken && if4_nextValidPCNotEquals(if4_snpc)
  // val if4_ghInfoNotIdenticalRedirect = if4_GHInfo =/= if4_lastGHInfo && enableGhistRepair.B

  if4_redirect := if4_valid && (
                    // when if4 has a lastHalfRVI, but the next fetch packet is not snpc
                    // if4_prevHalfNextNotMet ||
                    // when if4 preds taken, but the pc of the next fetch packet is not the target
                    if4_predTakenRedirect ||
                    // when if4 preds not taken, but the pc of the next fetch packet is not snpc
                    if4_predNotTakenRedirect
                    // GHInfo from the last pred does not correspond to this packet
                    // if4_ghInfoNotIdenticalRedirect
                  )

  val if4_target = WireInit(if4_snpc)

  // when (if4_prevHalfNextNotMet) {
  //   if4_target := prevHalfInstrReq.pc + 2.U
  // }.else
  if4_target := Mux(if4_bp.taken, if4_bp.target, if4_snpc)
  // when (if4_predTakenRedirect) {
  //   if4_target := if4_bp.target
  // }.elsewhen (if4_predNotTakenRedirect) {
  //   if4_target := if4_snpc
  // }
  // }.elsewhen (if4_ghInfoNotIdenticalRedirect) {
  //   if4_target := Mux(if4_bp.taken, if4_bp.target, if4_snpc)
  // }
  npcGen.register(if4_redirect, if4_target, Some("if4_target"))

  when (if4_fire) {
    final_gh := if4_predicted_gh
  }
  if4_gh := Mux(flush_final_gh, final_gh_bypass, final_gh)
  if3_gh := Mux(if4_valid && !if4_flush, if4_predicted_gh, if4_gh)
  if2_gh := Mux(if3_valid && !if3_flush, if3_predicted_gh, if3_gh)
  if1_gh := Mux(if2_valid && !if2_flush, if2_predicted_gh, if2_gh)
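  // Speculative history forwarding: each stage's view of the global history
  // includes the predictions of all older packets still in flight. If IF4
  // holds a valid unflushed packet, IF3 uses IF4's post-prediction history,
  // and so on down to IF1; otherwise a stage inherits the next older view,
  // bottoming out at final_gh (or its bypass when the backend repairs it).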

  val cfiUpdate = io.cfiUpdateInfo
  when (cfiUpdate.valid && (cfiUpdate.bits.isMisPred || cfiUpdate.bits.isReplay)) {
    val b = cfiUpdate.bits
    val oldGh = b.bpuMeta.hist
    val sawNTBr = b.bpuMeta.sawNotTakenBranch
    val isBr = b.pd.isBr
    val taken = Mux(cfiUpdate.bits.isReplay, b.bpuMeta.predTaken, b.taken)
    val updatedGh = oldGh.update(sawNTBr, isBr && taken)
    final_gh := updatedGh
    final_gh_bypass := updatedGh
    flush_final_gh := true.B
  }

  npcGen.register(io.redirect.valid, io.redirect.bits, Some("backend_redirect"))
  npcGen.register(RegNext(reset.asBool) && !reset.asBool, resetVector.U(VAddrBits.W), Some("reset_vector"))

  if1_npc := npcGen()
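  // npcGen is a priority mux over all next-pc sources. Registration order
  // matters: the always-true stallPC is registered first, and later sources
  // (if2/if3/if4 targets, backend redirect, reset vector) are registered
  // afterwards, so PriorityMuxGenerator presumably gives later registrations
  // higher priority; otherwise stallPC would always win.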

  icache.io.req.valid := if1_valid && (if2_ready || if2_flush)
  icache.io.resp.ready := if4_ready
  icache.io.req.bits.addr := if1_npc
  icache.io.req.bits.mask := mask(if1_npc)
  icache.io.flush := Cat(if3_flush, if2_flush)
  icache.io.mem_grant <> io.icacheMemGrant
  icache.io.fencei := io.fencei
  icache.io.prev.valid := if3_prevHalfInstrMet
  icache.io.prev.bits := if3_prevHalfInstr.bits.instr
  icache.io.prev_ipf := if3_prevHalfInstr.bits.ipf
  io.icacheMemAcq <> icache.io.mem_acquire
  io.l1plusFlush := icache.io.l1plusflush

  bpu.io.cfiUpdateInfo <> io.cfiUpdateInfo

  // bpu.io.flush := Cat(if4_flush, if3_flush, if2_flush)
  bpu.io.flush := VecInit(if2_flush, if3_flush, if4_flush)
  bpu.io.inFire(0) := if1_fire
  bpu.io.inFire(1) := if2_fire
  bpu.io.inFire(2) := if3_fire
  bpu.io.inFire(3) := if4_fire
  bpu.io.in.pc := if1_npc
  bpu.io.in.hist := if1_gh.asUInt
  // bpu.io.in.histPtr := ptr
  bpu.io.in.inMask := mask(if1_npc)
  bpu.io.predecode.mask := if4_pd.mask
  bpu.io.predecode.lastHalf := if4_pd.lastHalf
  bpu.io.predecode.pd := if4_pd.pd
  bpu.io.predecode.hasLastHalfRVI := if4_prevHalfInstrMet
  bpu.io.realMask := if4_mask
  bpu.io.prevHalf := if4_prevHalfInstr


  when (if3_prevHalfInstrMet && icacheResp.ipf && !if3_prevHalfInstr.bits.ipf) {
    crossPageIPF := true.B // the higher 16 bits trigger a page fault
  }

  val fetchPacketValid = if4_valid && !io.redirect.valid
  val fetchPacketWire = Wire(new FetchPacket)

  // io.fetchPacket.valid := if4_valid && !io.redirect.valid
  fetchPacketWire.instrs := if4_pd.instrs
  fetchPacketWire.mask := if4_pd.mask & (Fill(PredictWidth, !if4_bp.taken) | (Fill(PredictWidth, 1.U(1.W)) >> (~if4_bp.jmpIdx)))
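  // Mask trimming on a taken prediction, assuming jmpIdx is
  // log2(PredictWidth) bits wide: ~jmpIdx equals (PredictWidth-1 - jmpIdx),
  // so Fill(PredictWidth, 1.U) >> ~jmpIdx keeps exactly the low jmpIdx+1
  // bits, i.e. instructions up to and including the taken jump; when not
  // taken, the Fill(PredictWidth, !taken) term keeps the whole packet.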
  fetchPacketWire.pdmask := if4_pd.mask

  fetchPacketWire.pc := if4_pd.pc
  (0 until PredictWidth).foreach(i => fetchPacketWire.pnpc(i) := if4_pd.pc(i) + Mux(if4_pd.pd(i).isRVC, 2.U, 4.U))
  when (if4_bp.taken) {
    fetchPacketWire.pnpc(if4_bp.jmpIdx) := if4_bp.target
  }
  fetchPacketWire.bpuMeta := bpu.io.bpuMeta
  // save it for the update
  when (if4_pendingPrevHalfInstr) {
    fetchPacketWire.bpuMeta(0) := if4_prevHalfInstr.bits.meta
  }
  (0 until PredictWidth).foreach(i => {
    val meta = fetchPacketWire.bpuMeta(i)
    meta.hist := final_gh
    meta.predHist := if4_predHist.asTypeOf(new GlobalHistory)
    meta.predTaken := if4_bp.takens(i)
  })
  fetchPacketWire.pd := if4_pd.pd
  fetchPacketWire.ipf := if4_ipf
  fetchPacketWire.acf := if4_acf
  fetchPacketWire.crossPageIPFFix := if4_crossPageIPF

  // predTaken Vec
  fetchPacketWire.predTaken := if4_bp.taken

  io.fetchPacket.bits := fetchPacketWire
  io.fetchPacket.valid := fetchPacketValid

  // debug info
  if (IFUDebug) {
    XSDebug(RegNext(reset.asBool) && !reset.asBool, "Resetting...\n")
    XSDebug(icache.io.flush(0).asBool, "Flush icache stage2...\n")
    XSDebug(icache.io.flush(1).asBool, "Flush icache stage3...\n")
    XSDebug(io.redirect.valid, p"Redirect from backend! target=${Hexadecimal(io.redirect.bits)}\n")

    XSDebug("[IF1] v=%d     fire=%d            flush=%d pc=%x mask=%b\n", if1_valid, if1_fire, if1_flush, if1_npc, mask(if1_npc))
    XSDebug("[IF2] v=%d r=%d fire=%d redirect=%d flush=%d pc=%x snpc=%x\n", if2_valid, if2_ready, if2_fire, if2_redirect, if2_flush, if2_pc, if2_snpc)
    XSDebug("[IF3] v=%d r=%d fire=%d redirect=%d flush=%d pc=%x crossPageIPF=%d sawNTBrs=%d\n", if3_valid, if3_ready, if3_fire, if3_redirect, if3_flush, if3_pc, crossPageIPF, if3_bp.hasNotTakenBrs)
    XSDebug("[IF4] v=%d r=%d fire=%d redirect=%d flush=%d pc=%x crossPageIPF=%d sawNTBrs=%d\n", if4_valid, if4_ready, if4_fire, if4_redirect, if4_flush, if4_pc, if4_crossPageIPF, if4_bp.hasNotTakenBrs)
    XSDebug("[IF1][icacheReq] v=%d r=%d addr=%x\n", icache.io.req.valid, icache.io.req.ready, icache.io.req.bits.addr)
    XSDebug("[IF1][ghr] hist=%b\n", if1_gh.asUInt)
    XSDebug("[IF1][ghr] extHist=%b\n\n", if1_gh.asUInt)

    XSDebug("[IF2][bp] taken=%d jmpIdx=%d hasNTBrs=%d target=%x saveHalfRVI=%d\n\n", if2_bp.taken, if2_bp.jmpIdx, if2_bp.hasNotTakenBrs, if2_bp.target, if2_bp.saveHalfRVI)
    if2_gh.debug("if2")

    XSDebug("[IF3][icacheResp] v=%d r=%d pc=%x mask=%b\n", icache.io.resp.valid, icache.io.resp.ready, icache.io.resp.bits.pc, icache.io.resp.bits.mask)
    XSDebug("[IF3][bp] taken=%d jmpIdx=%d hasNTBrs=%d target=%x saveHalfRVI=%d\n", if3_bp.taken, if3_bp.jmpIdx, if3_bp.hasNotTakenBrs, if3_bp.target, if3_bp.saveHalfRVI)
    XSDebug("[IF3][redirect]: v=%d, prevMet=%d, prevNMet=%d, predT=%d, predNT=%d\n", if3_redirect, if3_prevHalfMetRedirect, if3_prevHalfNotMetRedirect, if3_predTakenRedirect, if3_predNotTakenRedirect)
    // XSDebug("[IF3][prevHalfInstr] v=%d redirect=%d fetchpc=%x idx=%d tgt=%x taken=%d instr=%x\n\n",
    //   prev_half_valid, prev_half_redirect, prev_half_fetchpc, prev_half_idx, prev_half_tgt, prev_half_taken, prev_half_instr)
    XSDebug("[IF3][if3_prevHalfInstr] v=%d taken=%d fetchpc=%x idx=%d pc=%x npc=%x tgt=%x instr=%x ipf=%d\n\n",
      if3_prevHalfInstr.valid, if3_prevHalfInstr.bits.taken, if3_prevHalfInstr.bits.fetchpc, if3_prevHalfInstr.bits.idx, if3_prevHalfInstr.bits.pc, if3_prevHalfInstr.bits.npc, if3_prevHalfInstr.bits.target, if3_prevHalfInstr.bits.instr, if3_prevHalfInstr.bits.ipf)
    if3_gh.debug("if3")

    XSDebug("[IF4][predecode] mask=%b\n", if4_pd.mask)
    XSDebug("[IF4][snpc]: %x, realMask=%b\n", if4_snpc, if4_mask)
    XSDebug("[IF4][bp] taken=%d jmpIdx=%d hasNTBrs=%d target=%x saveHalfRVI=%d\n", if4_bp.taken, if4_bp.jmpIdx, if4_bp.hasNotTakenBrs, if4_bp.target, if4_bp.saveHalfRVI)
    XSDebug("[IF4][redirect]: v=%d, prevNotMet=%d, predT=%d, predNT=%d\n", if4_redirect, if4_prevHalfNextNotMet, if4_predTakenRedirect, if4_predNotTakenRedirect)
    XSDebug(if4_pd.pd(if4_bp.jmpIdx).isJal && if4_bp.taken, "[IF4] cfi is jal!  instr=%x target=%x\n", if4_instrs(if4_bp.jmpIdx), if4_jal_tgts(if4_bp.jmpIdx))
    XSDebug("[IF4][ prevHalfInstrReq] v=%d taken=%d fetchpc=%x idx=%d pc=%x npc=%x tgt=%x instr=%x ipf=%d\n",
      prevHalfInstrReq.valid, prevHalfInstrReq.bits.taken, prevHalfInstrReq.bits.fetchpc, prevHalfInstrReq.bits.idx, prevHalfInstrReq.bits.pc, prevHalfInstrReq.bits.npc, prevHalfInstrReq.bits.target, prevHalfInstrReq.bits.instr, prevHalfInstrReq.bits.ipf)
    XSDebug("[IF4][if4_prevHalfInstr] v=%d taken=%d fetchpc=%x idx=%d pc=%x npc=%x tgt=%x instr=%x ipf=%d\n",
      if4_prevHalfInstr.valid, if4_prevHalfInstr.bits.taken, if4_prevHalfInstr.bits.fetchpc, if4_prevHalfInstr.bits.idx, if4_prevHalfInstr.bits.pc, if4_prevHalfInstr.bits.npc, if4_prevHalfInstr.bits.target, if4_prevHalfInstr.bits.instr, if4_prevHalfInstr.bits.ipf)
    if4_gh.debug("if4")
    XSDebug(io.fetchPacket.fire(), "[IF4][fetchPacket] v=%d r=%d mask=%b ipf=%d acf=%d crossPageIPF=%d\n",
      io.fetchPacket.valid, io.fetchPacket.ready, io.fetchPacket.bits.mask, io.fetchPacket.bits.ipf, io.fetchPacket.bits.acf, io.fetchPacket.bits.crossPageIPFFix)
    for (i <- 0 until PredictWidth) {
      XSDebug(io.fetchPacket.fire(), "[IF4][fetchPacket] %b %x pc=%x pnpc=%x pd: rvc=%d brType=%b call=%d ret=%d\n",
        io.fetchPacket.bits.mask(i),
        io.fetchPacket.bits.instrs(i),
        io.fetchPacket.bits.pc(i),
        io.fetchPacket.bits.pnpc(i),
        io.fetchPacket.bits.pd(i).isRVC,
        io.fetchPacket.bits.pd(i).brType,
        io.fetchPacket.bits.pd(i).isCall,
        io.fetchPacket.bits.pd(i).isRet
      )
    }
  }
}