xref: /XiangShan/src/main/scala/xiangshan/frontend/IFU.scala (revision 7335093e406fa80164d76bd1703929109711bdcb)
1package xiangshan.frontend
2
3import chisel3._
4import chisel3.util._
5import device.RAMHelper
6import xiangshan._
7import utils._
8import xiangshan.cache._
9import chisel3.experimental.chiselName
10
11trait HasIFUConst extends HasXSParameter {
12  val resetVector = 0x80000000L//TODO: set reset vec
13  def align(pc: UInt, bytes: Int): UInt = Cat(pc(VAddrBits-1, log2Ceil(bytes)), 0.U(log2Ceil(bytes).W))
14  val groupBytes = FetchWidth * 4 * 2 // correspond to cache line size
15  val groupOffsetBits = log2Ceil(groupBytes)
16  val nBanksInPacket = 2
17  val bankBytes = PredictWidth * 2 / nBanksInPacket
18  val nBanksInGroup = groupBytes / bankBytes
19  val bankWidth = PredictWidth / nBanksInPacket
20  val bankOffsetBits = log2Ceil(bankBytes)
21  // (0, nBanksInGroup-1)
22  def bankInGroup(pc: UInt) = pc(groupOffsetBits-1,bankOffsetBits)
23  def isInLastBank(pc: UInt) = bankInGroup(pc) === (nBanksInGroup-1).U
24  // (0, bankBytes/2-1)
25  def offsetInBank(pc: UInt) = pc(bankOffsetBits-1,1)
26  def bankAligned(pc: UInt)  = align(pc, bankBytes)
27  def groupAligned(pc: UInt) = align(pc, groupBytes)
28  // each 1 bit in mask stands for 2 Bytes
29  // 8 bits, in which only the first 7 bits could be 0
30  def maskFirstHalf(pc: UInt): UInt = ((~(0.U(bankWidth.W))) >> offsetInBank(pc))(bankWidth-1,0)
31  // when in loop(buffer), we need to make use of the full packet
32  // and get the real mask in iCacheResp from loop buffer
33  // we may make predictions on more instructions than we could get from loop buffer
34  // and this will be handled in if4
35  def maskLastHalf(pc: UInt, inLoop: Bool = false.B): UInt = Mux(isInLastBank(pc) && !inLoop, 0.U(bankWidth.W), ~0.U(bankWidth.W))
36  def mask(pc: UInt, inLoop: Bool = false.B): UInt = Reverse(Cat(maskFirstHalf(pc), maskLastHalf(pc, inLoop)))
37  def snpc(pc: UInt, inLoop: Bool = false.B): UInt = pc + (PopCount(mask(pc, inLoop)) << 1)
38
39  val enableGhistRepair = true
40  val IFUDebug = true
41}
42
43class GlobalHistory extends XSBundle {
44  val predHist = UInt(HistoryLength.W)
45  // val sawNTBr = Bool()
46  // val takenOnBr = Bool()
47  // val saveHalfRVI = Bool()
48  // def shifted = takenOnBr || sawNTBr
49  // def newPtr(ptr: UInt = nowPtr): UInt = Mux(shifted, ptr - 1.U, ptr)
50  def update(sawNTBr: Bool, takenOnBr: Bool, hist: UInt = predHist): GlobalHistory = {
51    val g = Wire(new GlobalHistory)
52    val shifted = takenOnBr || sawNTBr
53    g.predHist := Mux(shifted, (hist << 1) | takenOnBr.asUInt, hist)
54    g
55  }
56
57  final def === (that: GlobalHistory): Bool = {
58    predHist === that.predHist
59  }
60
61  final def =/= (that: GlobalHistory): Bool = !(this === that)
62
63  implicit val name = "IFU"
64  def debug(where: String) = XSDebug(p"[${where}_GlobalHistory] hist=${Binary(predHist)}\n")
65  // override def toString(): String = "histPtr=%d, sawNTBr=%d, takenOnBr=%d, saveHalfRVI=%d".format(histPtr, sawNTBr, takenOnBr, saveHalfRVI)
66}
67
68
69class IFUIO extends XSBundle
70{
71  // to ibuffer
72  val fetchPacket = DecoupledIO(new FetchPacket)
73  // from backend
74  val redirect = Flipped(ValidIO(UInt(VAddrBits.W)))
75  val cfiUpdateInfo = Flipped(ValidIO(new CfiUpdateInfo))
76  // to icache
77  val icacheMemGrant = Flipped(DecoupledIO(new L1plusCacheResp))
78  val fencei = Input(Bool())
79  // from icache
80  val icacheMemAcq = DecoupledIO(new L1plusCacheReq)
81  val l1plusFlush = Output(Bool())
82  // to tlb
83  val sfence = Input(new SfenceBundle)
84  val tlbCsr = Input(new TlbCsrBundle)
85  // from tlb
86  val ptw = new TlbPtwIO
87}
88
89class PrevHalfInstr extends XSBundle {
90  val taken = Bool()
91  val ghInfo = new GlobalHistory()
92  val fetchpc = UInt(VAddrBits.W) // only for debug
93  val idx = UInt(VAddrBits.W) // only for debug
94  val pc = UInt(VAddrBits.W)
95  val npc = UInt(VAddrBits.W)
96  val target = UInt(VAddrBits.W)
97  val instr = UInt(16.W)
98  val ipf = Bool()
99  val newPtr = UInt(log2Up(ExtHistoryLength).W)
100}
101
102@chiselName
103class IFU extends XSModule with HasIFUConst
104{
105  val io = IO(new IFUIO)
106  val bpu = BPU(EnableBPU)
107  val icache = Module(new ICache)
108  icache.io.mem_grant <> io.icacheMemGrant
109  icache.io.fencei := io.fencei
110  val pd = Module(new PreDecode)
111  val loopBuffer = if(EnableLB) { Module(new LoopBuffer) } else { Module(new FakeLoopBuffer) }
112  io.ptw <> TLB(
113    in = Seq(icache.io.tlb),
114    sfence = io.sfence,
115    csr = io.tlbCsr,
116    width = 1,
117    isDtlb = false,
118    shouldBlock = true
119  )
120
121  val if2_redirect, if3_redirect, if4_redirect = WireInit(false.B)
122  val if1_flush, if2_flush, if3_flush, if4_flush = WireInit(false.B)
123
124  val loopBufPar = loopBuffer.io.loopBufPar
125  val inLoop = WireInit(loopBuffer.io.out.valid)
126  val icacheResp = WireInit(Mux(inLoop, loopBuffer.io.out.bits, icache.io.resp.bits))
127
128  if4_flush := io.redirect.valid || loopBufPar.LBredirect.valid
129  if3_flush := if4_flush || if4_redirect
130  if2_flush := if3_flush || if3_redirect
131  if1_flush := if2_flush || if2_redirect
132
133  loopBuffer.io.flush := io.redirect.valid
134
135  //********************** IF1 ****************************//
136  val if1_valid = !reset.asBool && GTimer() > 500.U
137  val if1_npc = WireInit(0.U(VAddrBits.W))
138  val if2_ready = WireInit(false.B)
139  val if2_allReady = WireInit(if2_ready && (inLoop || icache.io.req.ready))
140  val if1_fire = if1_valid && (if2_allReady || if1_flush)
141
142
143  // val if2_newPtr, if3_newPtr, if4_newPtr = Wire(UInt(log2Up(ExtHistoryLength).W))
144
145  val if1_gh, if2_gh, if3_gh, if4_gh = Wire(new GlobalHistory)
146  val if2_predicted_gh, if3_predicted_gh, if4_predicted_gh = Wire(new GlobalHistory)
147  val final_gh = RegInit(0.U.asTypeOf(new GlobalHistory))
148  val final_gh_bypass = WireInit(0.U.asTypeOf(new GlobalHistory))
149  val flush_final_gh = WireInit(false.B)
150
151  //********************** IF2 ****************************//
152  val if2_valid = RegInit(init = false.B)
153  val if3_ready = WireInit(false.B)
154  val if2_fire = if2_valid && if3_ready
155  val if2_pc = RegEnable(next = if1_npc, init = resetVector.U, enable = if1_fire)
156  val if2_snpc = snpc(if2_pc, inLoop)
157  val if2_predHist = RegEnable(if1_gh.predHist, enable=if1_fire)
158  if2_ready := if3_ready || !if2_valid
159  when (if1_fire)       { if2_valid := true.B }
160  .elsewhen (if2_flush) { if2_valid := false.B }
161  .elsewhen (if2_fire)  { if2_valid := false.B }
162
163  val npcGen = new PriorityMuxGenerator[UInt]
164  npcGen.register(true.B, RegNext(if1_npc))
165  npcGen.register(if2_fire, if2_snpc)
166  val if2_bp = bpu.io.out(0)
167
168  // if taken, bp_redirect should be true
169  // when taken on half RVI, we suppress this redirect signal
170  if2_redirect := if2_valid && if2_bp.taken
171  npcGen.register(if2_redirect, if2_bp.target)
172
173  if2_predicted_gh := if2_gh.update(if2_bp.hasNotTakenBrs, if2_bp.takenOnBr)
174
175  //********************** IF3 ****************************//
176  // if3 should wait for instructions resp to arrive
177  val if3_valid = RegInit(init = false.B)
178  val if4_ready = WireInit(false.B)
179  val if3_allValid = if3_valid && (inLoop || icache.io.resp.valid)
180  val if3_fire = if3_allValid && if4_ready
181  val if3_pc = RegEnable(if2_pc, if2_fire)
182  val if3_predHist = RegEnable(if2_predHist, enable=if2_fire)
183  if3_ready := if4_ready && (inLoop || icache.io.resp.valid) || !if3_valid
184  when (if3_flush) {
185    if3_valid := false.B
186  }.elsewhen (if2_fire && !if2_flush) {
187    if3_valid := true.B
188  }.elsewhen (if3_fire) {
189    if3_valid := false.B
190  }
191
192  val if3_bp = bpu.io.out(1)
193  if3_predicted_gh := if3_gh.update(if3_bp.hasNotTakenBrs, if3_bp.takenOnBr)
194
195
196  val prevHalfInstrReq = WireInit(0.U.asTypeOf(ValidUndirectioned(new PrevHalfInstr)))
197  // only valid when if4_fire
198  val hasPrevHalfInstrReq = prevHalfInstrReq.valid
199
200  val if3_prevHalfInstr = RegInit(0.U.asTypeOf(ValidUndirectioned(new PrevHalfInstr)))
201
202  // 32-bit instr crosses 2 pages, and the higher 16-bit triggers page fault
203  val crossPageIPF = WireInit(false.B)
204
205  val if3_pendingPrevHalfInstr = if3_prevHalfInstr.valid
206
207  // the previous half of RVI instruction waits until it meets its last half
208  val if3_prevHalfInstrMet = if3_pendingPrevHalfInstr && if3_prevHalfInstr.bits.npc === if3_pc && if3_valid
209  // set to invalid once consumed or redirect from backend
210  val if3_prevHalfConsumed = if3_prevHalfInstrMet && if3_fire
211  val if3_prevHalfFlush = if4_flush
212  when (hasPrevHalfInstrReq && !if3_prevHalfFlush) {
213    if3_prevHalfInstr.valid := true.B
214  }.elsewhen (if3_prevHalfConsumed || if3_prevHalfFlush) {
215    if3_prevHalfInstr.valid := false.B
216  }
217  when (hasPrevHalfInstrReq) {
218    if3_prevHalfInstr.bits := prevHalfInstrReq.bits
219  }
220  // when bp signal a redirect, we distinguish between taken and not taken
221  // if taken and saveHalfRVI is true, we do not redirect to the target
222
223  def if3_nextValidPCNotEquals(pc: UInt) = !if2_valid || if2_valid && if2_pc =/= pc
224  val if3_prevHalfMetRedirect    = if3_pendingPrevHalfInstr && if3_prevHalfInstrMet && if3_prevHalfInstr.bits.taken && if3_nextValidPCNotEquals(if3_prevHalfInstr.bits.target)
225  val if3_prevHalfNotMetRedirect = if3_pendingPrevHalfInstr && !if3_prevHalfInstrMet && if3_nextValidPCNotEquals(if3_prevHalfInstr.bits.npc)
226  val if3_predTakenRedirect    = !if3_pendingPrevHalfInstr && if3_bp.taken && if3_nextValidPCNotEquals(if3_bp.target)
227  val if3_predNotTakenRedirect = !if3_pendingPrevHalfInstr && !if3_bp.taken && if3_nextValidPCNotEquals(snpc(if3_pc, inLoop))
228  // when pendingPrevHalfInstr, if3_GHInfo is set to the info of last prev half instr
229  // val if3_ghInfoNotIdenticalRedirect = !if3_pendingPrevHalfInstr && if3_GHInfo =/= if3_lastGHInfo && enableGhistRepair.B
230
231  if3_redirect := if3_valid && (
232                    // prevHalf is consumed but the next packet is not where it meant to be
233                    // we do not handle this condition because of the burden of building a correct GHInfo
234                    // prevHalfMetRedirect ||
235                    // prevHalf does not match if3_pc and the next fetch packet is not snpc
236                    if3_prevHalfNotMetRedirect ||
237                    // pred taken and next fetch packet is not the predicted target
238                    if3_predTakenRedirect ||
239                    // pred not taken and next fetch packet is not snpc
240                    if3_predNotTakenRedirect
241                    // GHInfo from last pred does not corresponds with this packet
242                    // if3_ghInfoNotIdenticalRedirect
243                  )
244
245  val if3_target = WireInit(snpc(if3_pc))
246
247  /* when (prevHalfMetRedirect) {
248    if1_npc := if3_prevHalfInstr.target
249  }.else */
250  when (if3_prevHalfNotMetRedirect) {
251    if3_target := if3_prevHalfInstr.bits.npc
252  }.elsewhen (if3_predTakenRedirect) {
253    if3_target := if3_bp.target
254  }.elsewhen (if3_predNotTakenRedirect) {
255    if3_target := snpc(if3_pc)
256  }
257  // }.elsewhen (if3_ghInfoNotIdenticalRedirect) {
258  //   if3_target := Mux(if3_bp.taken, if3_bp.target, snpc(if3_pc))
259  // }
260  npcGen.register(if3_redirect, if3_target)
261
262  // when (if3_redirect) {
263  //   if1_npc := if3_target
264  // }
265
266  //********************** IF4 ****************************//
267  val if4_pd = RegEnable(pd.io.out, if3_fire)
268  val if4_ipf = RegEnable(icacheResp.ipf || if3_prevHalfInstrMet && if3_prevHalfInstr.bits.ipf, if3_fire)
269  val if4_acf = RegEnable(icacheResp.acf, if3_fire)
270  val if4_crossPageIPF = RegEnable(crossPageIPF, if3_fire)
271  val if4_valid = RegInit(false.B)
272  val if4_fire = if4_valid && io.fetchPacket.ready
273  val if4_pc = RegEnable(if3_pc, if3_fire)
274  // This is the real mask given from icache or loop buffer
275  val if4_mask = RegEnable(icacheResp.mask, if3_fire)
276  val if4_snpc = Mux(inLoop, if4_pc + (PopCount(if4_mask) << 1), snpc(if4_pc))
277
278
279  val if4_predHist = RegEnable(if3_predHist, enable=if3_fire)
280  // wait until prevHalfInstr written into reg
281  if4_ready := (io.fetchPacket.ready && !hasPrevHalfInstrReq || !if4_valid) && GTimer() > 500.U
282  when (if4_flush) {
283    if4_valid := false.B
284  }.elsewhen (if3_fire && !if3_flush) {
285    if4_valid := Mux(if3_pendingPrevHalfInstr, if3_prevHalfInstrMet, true.B)
286  }.elsewhen (if4_fire) {
287    if4_valid := false.B
288  }
289
290  val if4_bp = Wire(new BranchPrediction)
291  if4_bp := bpu.io.out(2)
292  if4_bp.takens  := bpu.io.out(2).takens & if4_mask
293  if4_bp.brMask  := bpu.io.out(2).brMask & if4_mask
294  if4_bp.jalMask := bpu.io.out(2).jalMask & if4_mask
295
296  if4_predicted_gh := if4_gh.update(if4_bp.hasNotTakenBrs, if4_bp.takenOnBr)
297
298  def cal_jal_tgt(inst: UInt, rvc: Bool): UInt = {
299    Mux(rvc,
300      SignExt(Cat(inst(12), inst(8), inst(10, 9), inst(6), inst(7), inst(2), inst(11), inst(5, 3), 0.U(1.W)), XLEN),
301      SignExt(Cat(inst(31), inst(19, 12), inst(20), inst(30, 21), 0.U(1.W)), XLEN)
302    )
303  }
304  val if4_instrs = if4_pd.instrs
305  val if4_jals = if4_bp.jalMask
306  val if4_jal_tgts = VecInit((0 until PredictWidth).map(i => if4_pd.pc(i) + cal_jal_tgt(if4_instrs(i), if4_pd.pd(i).isRVC)))
307
308  (0 until PredictWidth).foreach {i =>
309    when (if4_jals(i)) {
310      if4_bp.targets(i) := if4_jal_tgts(i)
311    }
312  }
313
314  // we need this to tell BPU the prediction of prev half
315  // because the prediction is with the start of each inst
316  val if4_prevHalfInstr = RegInit(0.U.asTypeOf(ValidUndirectioned(new PrevHalfInstr)))
317  val if4_pendingPrevHalfInstr = if4_prevHalfInstr.valid
318  val if4_prevHalfInstrMet = if4_pendingPrevHalfInstr && if4_prevHalfInstr.bits.npc === if4_pc && if4_valid
319  val if4_prevHalfConsumed = if4_prevHalfInstrMet && if4_fire
320  val if4_prevHalfFlush = if4_flush
321
322  val if4_takenPrevHalf = WireInit(if4_prevHalfInstrMet && if4_prevHalfInstr.bits.taken)
323  when (if3_prevHalfConsumed) {
324    if4_prevHalfInstr.valid := if3_prevHalfInstr.valid
325  }.elsewhen (if4_prevHalfConsumed || if4_prevHalfFlush) {
326    if4_prevHalfInstr.valid := false.B
327  }
328
329  when (if3_prevHalfConsumed) {
330    if4_prevHalfInstr.bits := if3_prevHalfInstr.bits
331  }
332
333  prevHalfInstrReq.valid := if4_fire && if4_bp.saveHalfRVI
334  val idx = if4_bp.lastHalfRVIIdx
335
336  // this is result of the last half RVI
337  prevHalfInstrReq.bits.taken := if4_bp.lastHalfRVITaken
338  prevHalfInstrReq.bits.ghInfo := if4_gh
339  prevHalfInstrReq.bits.newPtr := DontCare
340  prevHalfInstrReq.bits.fetchpc := if4_pc
341  prevHalfInstrReq.bits.idx := idx
342  prevHalfInstrReq.bits.pc := if4_pd.pc(idx)
343  prevHalfInstrReq.bits.npc := if4_pd.pc(idx) + 2.U
344  prevHalfInstrReq.bits.target := if4_bp.lastHalfRVITarget
345  prevHalfInstrReq.bits.instr := if4_pd.instrs(idx)(15, 0)
346  prevHalfInstrReq.bits.ipf := if4_ipf
347
348  def if4_nextValidPCNotEquals(pc: UInt) = if3_valid  && if3_pc =/= pc ||
349                                           !if3_valid && (if2_valid && if2_pc =/= pc) ||
350                                           !if3_valid && !if2_valid
351
352  val if4_prevHalfNextNotMet = hasPrevHalfInstrReq && if4_nextValidPCNotEquals(prevHalfInstrReq.bits.pc+2.U)
353  val if4_predTakenRedirect = !hasPrevHalfInstrReq && if4_bp.taken && if4_nextValidPCNotEquals(if4_bp.target)
354  val if4_predNotTakenRedirect = !hasPrevHalfInstrReq && !if4_bp.taken && if4_nextValidPCNotEquals(if4_snpc)
355  // val if4_ghInfoNotIdenticalRedirect = if4_GHInfo =/= if4_lastGHInfo && enableGhistRepair.B
356
357  if4_redirect := if4_valid && (
358                    // when if4 has a lastHalfRVI, but the next fetch packet is not snpc
359                    // if4_prevHalfNextNotMet ||
360                    // when if4 preds taken, but the pc of next fetch packet is not the target
361                    if4_predTakenRedirect ||
362                    // when if4 preds not taken, but the pc of next fetch packet is not snpc
363                    if4_predNotTakenRedirect
364                    // GHInfo from last pred does not corresponds with this packet
365                    // if4_ghInfoNotIdenticalRedirect
366                  )
367
368  val if4_target = WireInit(if4_snpc)
369
370  // when (if4_prevHalfNextNotMet) {
371  //   if4_target := prevHalfInstrReq.pc+2.U
372  // }.else
373  when (if4_predTakenRedirect) {
374    if4_target := if4_bp.target
375  }.elsewhen (if4_predNotTakenRedirect) {
376    if4_target := if4_snpc
377  }
378  // }.elsewhen (if4_ghInfoNotIdenticalRedirect) {
379  //   if4_target := Mux(if4_bp.taken, if4_bp.target, if4_snpc)
380  // }
381  npcGen.register(if4_redirect, if4_target)
382
383  when (if4_fire) {
384    final_gh := if4_predicted_gh
385  }
386  if4_gh := Mux(flush_final_gh, final_gh_bypass, final_gh)
387  if3_gh := Mux(if4_valid && !if4_flush, if4_predicted_gh, if4_gh)
388  if2_gh := Mux(if3_valid && !if3_flush, if3_predicted_gh, if3_gh)
389  if1_gh := Mux(if2_valid && !if2_flush, if2_predicted_gh, if2_gh)
390
391
392
393
394  val cfiUpdate = io.cfiUpdateInfo
395  when (cfiUpdate.valid && (cfiUpdate.bits.isMisPred || cfiUpdate.bits.isReplay)) {
396    val b = cfiUpdate.bits
397    val oldGh = b.bpuMeta.hist
398    val sawNTBr = b.bpuMeta.sawNotTakenBranch
399    val isBr = b.pd.isBr
400    val taken = Mux(cfiUpdate.bits.isReplay, b.bpuMeta.predTaken, b.taken)
401    val updatedGh = oldGh.update(sawNTBr, isBr && taken)
402    final_gh := updatedGh
403    final_gh_bypass := updatedGh
404    flush_final_gh := true.B
405  }
406
407  npcGen.register(loopBufPar.LBredirect.valid, loopBufPar.LBredirect.bits)
408  npcGen.register(io.redirect.valid, io.redirect.bits)
409  npcGen.register(RegNext(reset.asBool) && !reset.asBool, resetVector.U(VAddrBits.W))
410
411  if1_npc := npcGen()
412
413  when(inLoop) {
414    icache.io.req.valid := if4_flush
415  }.otherwise {
416    icache.io.req.valid := if1_valid && (if2_ready || if1_flush)
417  }
418  icache.io.resp.ready := if4_ready
419  icache.io.req.bits.addr := if1_npc
420
421  // when(if4_bp.taken) {
422  //   when(if4_bp.saveHalfRVI) {
423  //     io.loopBufPar.LBReq := snpc(if4_pc)
424  //   }.otherwise {
425  //     io.loopBufPar.LBReq := if4_bp.target
426  //   }
427  // }.otherwise {
428  //   io.loopBufPar.LBReq := snpc(if4_pc)
429  //   XSDebug(p"snpc(if4_pc)=${Hexadecimal(snpc(if4_pc))}\n")
430  // }
431  loopBufPar.fetchReq := if3_pc
432
433  icache.io.req.bits.mask := mask(if1_npc)
434  icache.io.flush := Cat(if3_flush, if2_flush)
435
436  bpu.io.cfiUpdateInfo <> io.cfiUpdateInfo
437
438  // bpu.io.flush := Cat(if4_flush, if3_flush, if2_flush)
439  bpu.io.flush := VecInit(if2_flush, if3_flush, if4_flush)
440  bpu.io.inFire(0) := if1_fire
441  bpu.io.inFire(1) := if2_fire
442  bpu.io.inFire(2) := if3_fire
443  bpu.io.inFire(3) := if4_fire
444  bpu.io.in.pc := if1_npc
445  bpu.io.in.hist := if1_gh.asUInt
446  // bpu.io.in.histPtr := ptr
447  bpu.io.in.inMask := mask(if1_npc)
448  bpu.io.predecode.mask := if4_pd.mask
449  bpu.io.predecode.lastHalf := if4_pd.lastHalf
450  bpu.io.predecode.pd := if4_pd.pd
451  bpu.io.predecode.hasLastHalfRVI := if4_prevHalfInstrMet
452  bpu.io.realMask := if4_mask
453  bpu.io.prevHalf := if4_prevHalfInstr
454
455  pd.io.in := icacheResp
456  when(inLoop) {
457    pd.io.in.mask := loopBuffer.io.out.bits.mask // TODO: Maybe this is unnecessary
458    // XSDebug("Fetch from LB\n")
459    // XSDebug(p"pc=${Hexadecimal(io.loopBufPar.LBResp.pc)}\n")
460    // XSDebug(p"data=${Hexadecimal(io.loopBufPar.LBResp.data)}\n")
461    // XSDebug(p"mask=${Hexadecimal(io.loopBufPar.LBResp.mask)}\n")
462  }
463
464  pd.io.prev.valid := if3_prevHalfInstrMet
465  pd.io.prev.bits := if3_prevHalfInstr.bits.instr
466  // if a fetch packet triggers page fault, set the pf instruction to nop
467  when (!if3_prevHalfInstrMet && icacheResp.ipf) {
468    val instrs = Wire(Vec(FetchWidth, UInt(32.W)))
469    (0 until FetchWidth).foreach(i => instrs(i) := ZeroExt("b0010011".U, 32)) // nop
470    pd.io.in.data := instrs.asUInt
471  }.elsewhen (if3_prevHalfInstrMet && (if3_prevHalfInstr.bits.ipf || icacheResp.ipf)) {
472    pd.io.prev.bits := ZeroExt("b0010011".U, 16)
473    val instrs = Wire(Vec(FetchWidth, UInt(32.W)))
474    (0 until FetchWidth).foreach(i => instrs(i) := Cat(ZeroExt("b0010011".U, 16), Fill(16, 0.U(1.W))))
475    pd.io.in.data := instrs.asUInt
476
477    when (icacheResp.ipf && !if3_prevHalfInstr.bits.ipf) { crossPageIPF := true.B } // higher 16 bits page fault
478  }
479
480  //Performance Counter
481  // if (!env.FPGAPlatform ) {
482  //   ExcitingUtils.addSource(io.fetchPacket.fire && !inLoop, "CntFetchFromICache", Perf)
483  //   ExcitingUtils.addSource(io.fetchPacket.fire && inLoop, "CntFetchFromLoopBuffer", Perf)
484  // }
485
486  val fetchPacketValid = if4_valid && !io.redirect.valid
487  val fetchPacketWire = Wire(new FetchPacket)
488
489  // io.fetchPacket.valid := if4_valid && !io.redirect.valid
490  fetchPacketWire.instrs := if4_pd.instrs
491  fetchPacketWire.mask := if4_pd.mask & (Fill(PredictWidth, !if4_bp.taken) | (Fill(PredictWidth, 1.U(1.W)) >> (~if4_bp.jmpIdx)))
492  fetchPacketWire.pdmask := if4_pd.mask
493
494  loopBufPar.noTakenMask := if4_pd.mask
495  fetchPacketWire.pc := if4_pd.pc
496  (0 until PredictWidth).foreach(i => fetchPacketWire.pnpc(i) := if4_pd.pc(i) + Mux(if4_pd.pd(i).isRVC, 2.U, 4.U))
497  when (if4_bp.taken) {
498    fetchPacketWire.pnpc(if4_bp.jmpIdx) := if4_bp.target
499  }
500  fetchPacketWire.bpuMeta := bpu.io.bpuMeta
501  (0 until PredictWidth).foreach(i => {
502    val meta = fetchPacketWire.bpuMeta(i)
503    meta.hist := final_gh
504    meta.predHist := if4_predHist.asTypeOf(new GlobalHistory)
505    meta.predTaken := if4_bp.takens(i)
506  })
507  fetchPacketWire.pd := if4_pd.pd
508  fetchPacketWire.ipf := if4_ipf
509  fetchPacketWire.acf := if4_acf
510  fetchPacketWire.crossPageIPFFix := if4_crossPageIPF
511
512  // predTaken Vec
513  fetchPacketWire.predTaken := if4_bp.taken
514
515  loopBuffer.io.in.bits := fetchPacketWire
516  io.fetchPacket.bits := fetchPacketWire
517  io.fetchPacket.valid := fetchPacketValid
518  loopBuffer.io.in.valid := io.fetchPacket.fire
519
520  // debug info
521  if (IFUDebug) {
522    XSDebug(RegNext(reset.asBool) && !reset.asBool, "Reseting...\n")
523    XSDebug(icache.io.flush(0).asBool, "Flush icache stage2...\n")
524    XSDebug(icache.io.flush(1).asBool, "Flush icache stage3...\n")
525    XSDebug(io.redirect.valid, p"Redirect from backend! target=${Hexadecimal(io.redirect.bits)}\n")
526
527    XSDebug("[IF1] v=%d     fire=%d            flush=%d pc=%x mask=%b\n", if1_valid, if1_fire, if1_flush, if1_npc, mask(if1_npc))
528    XSDebug("[IF2] v=%d r=%d fire=%d redirect=%d flush=%d pc=%x snpc=%x\n", if2_valid, if2_ready, if2_fire, if2_redirect, if2_flush, if2_pc, if2_snpc)
529    XSDebug("[IF3] v=%d r=%d fire=%d redirect=%d flush=%d pc=%x crossPageIPF=%d sawNTBrs=%d\n", if3_valid, if3_ready, if3_fire, if3_redirect, if3_flush, if3_pc, crossPageIPF, if3_bp.hasNotTakenBrs)
530    XSDebug("[IF4] v=%d r=%d fire=%d redirect=%d flush=%d pc=%x crossPageIPF=%d sawNTBrs=%d\n", if4_valid, if4_ready, if4_fire, if4_redirect, if4_flush, if4_pc, if4_crossPageIPF, if4_bp.hasNotTakenBrs)
531    XSDebug("[IF1][icacheReq] v=%d r=%d addr=%x\n", icache.io.req.valid, icache.io.req.ready, icache.io.req.bits.addr)
532    XSDebug("[IF1][ghr] hist=%b\n", if1_gh.asUInt)
533    XSDebug("[IF1][ghr] extHist=%b\n\n", if1_gh.asUInt)
534
535    XSDebug("[IF2][bp] taken=%d jmpIdx=%d hasNTBrs=%d target=%x saveHalfRVI=%d\n\n", if2_bp.taken, if2_bp.jmpIdx, if2_bp.hasNotTakenBrs, if2_bp.target, if2_bp.saveHalfRVI)
536    if2_gh.debug("if2")
537
538    XSDebug("[IF3][icacheResp] v=%d r=%d pc=%x mask=%b\n", icache.io.resp.valid, icache.io.resp.ready, icache.io.resp.bits.pc, icache.io.resp.bits.mask)
539    XSDebug("[IF3][bp] taken=%d jmpIdx=%d hasNTBrs=%d target=%x saveHalfRVI=%d\n", if3_bp.taken, if3_bp.jmpIdx, if3_bp.hasNotTakenBrs, if3_bp.target, if3_bp.saveHalfRVI)
540    XSDebug("[IF3][redirect]: v=%d, prevMet=%d, prevNMet=%d, predT=%d, predNT=%d\n", if3_redirect, if3_prevHalfMetRedirect, if3_prevHalfNotMetRedirect, if3_predTakenRedirect, if3_predNotTakenRedirect)
541    // XSDebug("[IF3][prevHalfInstr] v=%d redirect=%d fetchpc=%x idx=%d tgt=%x taken=%d instr=%x\n\n",
542    //   prev_half_valid, prev_half_redirect, prev_half_fetchpc, prev_half_idx, prev_half_tgt, prev_half_taken, prev_half_instr)
543    XSDebug("[IF3][if3_prevHalfInstr] v=%d taken=%d fetchpc=%x idx=%d pc=%x npc=%x tgt=%x instr=%x ipf=%d\n\n",
544    if3_prevHalfInstr.valid, if3_prevHalfInstr.bits.taken, if3_prevHalfInstr.bits.fetchpc, if3_prevHalfInstr.bits.idx, if3_prevHalfInstr.bits.pc, if3_prevHalfInstr.bits.npc, if3_prevHalfInstr.bits.target, if3_prevHalfInstr.bits.instr, if3_prevHalfInstr.bits.ipf)
545    if3_gh.debug("if3")
546
547    XSDebug("[IF4][predecode] mask=%b\n", if4_pd.mask)
548    XSDebug("[IF4][snpc]: %x, realMask=%b\n", if4_snpc, if4_mask)
549    XSDebug("[IF4][bp] taken=%d jmpIdx=%d hasNTBrs=%d target=%x saveHalfRVI=%d\n", if4_bp.taken, if4_bp.jmpIdx, if4_bp.hasNotTakenBrs, if4_bp.target, if4_bp.saveHalfRVI)
550    XSDebug("[IF4][redirect]: v=%d, prevNotMet=%d, predT=%d, predNT=%d\n", if4_redirect, if4_prevHalfNextNotMet, if4_predTakenRedirect, if4_predNotTakenRedirect)
551    XSDebug(if4_pd.pd(if4_bp.jmpIdx).isJal && if4_bp.taken, "[IF4] cfi is jal!  instr=%x target=%x\n", if4_instrs(if4_bp.jmpIdx), if4_jal_tgts(if4_bp.jmpIdx))
552    XSDebug("[IF4][ prevHalfInstrReq] v=%d taken=%d fetchpc=%x idx=%d pc=%x npc=%x tgt=%x instr=%x ipf=%d\n",
553      prevHalfInstrReq.valid, prevHalfInstrReq.bits.taken, prevHalfInstrReq.bits.fetchpc, prevHalfInstrReq.bits.idx, prevHalfInstrReq.bits.pc, prevHalfInstrReq.bits.npc, prevHalfInstrReq.bits.target, prevHalfInstrReq.bits.instr, prevHalfInstrReq.bits.ipf)
554    XSDebug("[IF4][if4_prevHalfInstr] v=%d taken=%d fetchpc=%x idx=%d pc=%x npc=%x tgt=%x instr=%x ipf=%d\n",
555      if4_prevHalfInstr.valid, if4_prevHalfInstr.bits.taken, if4_prevHalfInstr.bits.fetchpc, if4_prevHalfInstr.bits.idx, if4_prevHalfInstr.bits.pc, if4_prevHalfInstr.bits.npc, if4_prevHalfInstr.bits.target, if4_prevHalfInstr.bits.instr, if4_prevHalfInstr.bits.ipf)
556    if4_gh.debug("if4")
557    XSDebug(io.fetchPacket.fire(), "[IF4][fetchPacket] v=%d r=%d mask=%b ipf=%d acf=%d crossPageIPF=%d\n",
558      io.fetchPacket.valid, io.fetchPacket.ready, io.fetchPacket.bits.mask, io.fetchPacket.bits.ipf, io.fetchPacket.bits.acf, io.fetchPacket.bits.crossPageIPFFix)
559    for (i <- 0 until PredictWidth) {
560      XSDebug(io.fetchPacket.fire(), "[IF4][fetchPacket] %b %x pc=%x pnpc=%x pd: rvc=%d brType=%b call=%d ret=%d\n",
561        io.fetchPacket.bits.mask(i),
562        io.fetchPacket.bits.instrs(i),
563        io.fetchPacket.bits.pc(i),
564        io.fetchPacket.bits.pnpc(i),
565        io.fetchPacket.bits.pd(i).isRVC,
566        io.fetchPacket.bits.pd(i).brType,
567        io.fetchPacket.bits.pd(i).isCall,
568        io.fetchPacket.bits.pd(i).isRet
569      )
570    }
571  }
572}