xref: /XiangShan/src/main/scala/xiangshan/frontend/IFU.scala (revision 209167cbda531c33f811ea0221ad0d2fbd5d9022)
1package xiangshan.frontend
2
3import chisel3._
4import chisel3.util._
5import device.RAMHelper
6import xiangshan._
7import utils._
8import xiangshan.cache._
9import chisel3.experimental.chiselName
10import freechips.rocketchip.tile.HasLazyRoCC
11import chisel3.ExcitingUtils._
12
13trait HasIFUConst extends HasXSParameter {
14  val resetVector = 0x80000000L//TODO: set reset vec
15  def align(pc: UInt, bytes: Int): UInt = Cat(pc(VAddrBits-1, log2Ceil(bytes)), 0.U(log2Ceil(bytes).W))
16  val instBytes = if (HasCExtension) 2 else 4
17  val instOffsetBits = log2Ceil(instBytes)
18  val groupBytes = 64 // correspond to cache line size
19  val groupOffsetBits = log2Ceil(groupBytes)
20  val groupWidth = groupBytes / instBytes
21  val packetBytes = PredictWidth * instBytes
22  val packetOffsetBits = log2Ceil(packetBytes)
23  def offsetInPacket(pc: UInt) = pc(packetOffsetBits-1, instOffsetBits)
24  def packetIdx(pc: UInt) = pc(VAddrBits-1, log2Ceil(packetBytes))
25  def groupAligned(pc: UInt)  = align(pc, groupBytes)
26  def packetAligned(pc: UInt) = align(pc, packetBytes)
27  def mask(pc: UInt): UInt = ((~(0.U(PredictWidth.W))) << offsetInPacket(pc))(PredictWidth-1,0)
28  def snpc(pc: UInt): UInt = packetAligned(pc) + packetBytes.U
29
30  val enableGhistRepair = true
31  val IFUDebug = true
32}
33
34class GlobalHistory extends XSBundle {
35  val predHist = UInt(HistoryLength.W)
36  def update(sawNTBr: Bool, takenOnBr: Bool, hist: UInt = predHist): GlobalHistory = {
37    val g = Wire(new GlobalHistory)
38    val shifted = takenOnBr || sawNTBr
39    g.predHist := Mux(shifted, (hist << 1) | takenOnBr.asUInt, hist)
40    g
41  }
42
43  final def === (that: GlobalHistory): Bool = {
44    predHist === that.predHist
45  }
46
47  final def =/= (that: GlobalHistory): Bool = !(this === that)
48
49  implicit val name = "IFU"
50  def debug(where: String) = XSDebug(p"[${where}_GlobalHistory] hist=${Binary(predHist)}\n")
51  // override def toString(): String = "histPtr=%d, sawNTBr=%d, takenOnBr=%d, saveHalfRVI=%d".format(histPtr, sawNTBr, takenOnBr, saveHalfRVI)
52}
53
54
55class IFUIO extends XSBundle
56{
57  // to ibuffer
58  val fetchPacket = DecoupledIO(new FetchPacket)
59  // from backend
60  val redirect = Flipped(ValidIO(UInt(VAddrBits.W)))
61  val cfiUpdateInfo = Flipped(ValidIO(new CfiUpdateInfo))
62  // to icache
63  val icacheMemGrant = Flipped(DecoupledIO(new L1plusCacheResp))
64  val fencei = Input(Bool())
65  // from icache
66  val icacheMemAcq = DecoupledIO(new L1plusCacheReq)
67  val l1plusFlush = Output(Bool())
68  val prefetchTrainReq = ValidIO(new IcacheMissReq)
69  // to tlb
70  val sfence = Input(new SfenceBundle)
71  val tlbCsr = Input(new TlbCsrBundle)
72  // from tlb
73  val ptw = new TlbPtwIO
74}
75
76class PrevHalfInstr extends XSBundle {
77  val taken = Bool()
78  val ghInfo = new GlobalHistory()
79  val fetchpc = UInt(VAddrBits.W) // only for debug
80  val idx = UInt(VAddrBits.W) // only for debug
81  val pc = UInt(VAddrBits.W)
82  val npc = UInt(VAddrBits.W)
83  val target = UInt(VAddrBits.W)
84  val instr = UInt(16.W)
85  val ipf = Bool()
86  val meta = new BpuMeta
87}
88
89@chiselName
90class IFU extends XSModule with HasIFUConst
91{
92  val io = IO(new IFUIO)
93  val bpu = BPU(EnableBPU)
94  val icache = Module(new ICache)
95
96  io.ptw <> TLB(
97    in = Seq(icache.io.tlb),
98    sfence = io.sfence,
99    csr = io.tlbCsr,
100    width = 1,
101    isDtlb = false,
102    shouldBlock = true
103  )
104
105  val if2_redirect, if3_redirect, if4_redirect = WireInit(false.B)
106  val if1_flush, if2_flush, if3_flush, if4_flush = WireInit(false.B)
107
108  val icacheResp = icache.io.resp.bits
109
110  if4_flush := io.redirect.valid
111  if3_flush := if4_flush || if4_redirect
112  if2_flush := if3_flush || if3_redirect
113  if1_flush := if2_flush || if2_redirect
114
115  //********************** IF1 ****************************//
116  val if1_valid = !reset.asBool && GTimer() > 500.U
117  val if1_npc = WireInit(0.U(VAddrBits.W))
118  val if2_ready = WireInit(false.B)
119  val if2_valid = RegInit(init = false.B)
120  val if2_allReady = WireInit(if2_ready && icache.io.req.ready)
121  val if1_fire = (if1_valid &&  if2_allReady) && (icache.io.tlb.resp.valid || !if2_valid)
122  val if1_can_go = if1_fire || if2_flush
123
124  val if1_gh, if2_gh, if3_gh, if4_gh = Wire(new GlobalHistory)
125  val if2_predicted_gh, if3_predicted_gh, if4_predicted_gh = Wire(new GlobalHistory)
126  val final_gh = RegInit(0.U.asTypeOf(new GlobalHistory))
127  val final_gh_bypass = WireInit(0.U.asTypeOf(new GlobalHistory))
128  val flush_final_gh = WireInit(false.B)
129
130  //********************** IF2 ****************************//
131  val if2_allValid = if2_valid && icache.io.tlb.resp.valid
132  val if3_ready = WireInit(false.B)
133  val if2_fire = (if2_valid && if3_ready) && icache.io.tlb.resp.valid
134  val if2_pc = RegEnable(next = if1_npc, init = resetVector.U, enable = if1_can_go)
135  val if2_snpc = snpc(if2_pc)
136  val if2_predHist = RegEnable(if1_gh.predHist, enable=if1_can_go)
137  if2_ready := if3_ready || !if2_valid
138  when (if1_can_go)       { if2_valid := true.B }
139  .elsewhen (if2_flush) { if2_valid := false.B }
140  .elsewhen (if2_fire)  { if2_valid := false.B }
141
142  val npcGen = new PriorityMuxGenerator[UInt]
143  npcGen.register(true.B, RegNext(if1_npc), Some("stallPC"))
144  val if2_bp = bpu.io.out(0)
145
146  // if taken, bp_redirect should be true
147  // when taken on half RVI, we suppress this redirect signal
148
149  npcGen.register(if2_valid, Mux(if2_bp.taken, if2_bp.target, if2_snpc), Some("if2_target"))
150
151  if2_predicted_gh := if2_gh.update(if2_bp.hasNotTakenBrs, if2_bp.takenOnBr)
152
153  //********************** IF3 ****************************//
154  // if3 should wait for instructions resp to arrive
155  val if3_valid = RegInit(init = false.B)
156  val if4_ready = WireInit(false.B)
157  val if3_allValid = if3_valid && icache.io.resp.valid
158  val if3_fire = if3_allValid && if4_ready
159  val if3_pc = RegEnable(if2_pc, if2_fire)
160  val if3_snpc = RegEnable(if2_snpc, if2_fire)
161  val if3_predHist = RegEnable(if2_predHist, enable=if2_fire)
162  if3_ready := if4_ready && icache.io.resp.valid || !if3_valid
163  when (if3_flush) {
164    if3_valid := false.B
165  }.elsewhen (if2_fire && !if2_flush) {
166    if3_valid := true.B
167  }.elsewhen (if3_fire) {
168    if3_valid := false.B
169  }
170
171  val if3_bp = bpu.io.out(1)
172  if3_predicted_gh := if3_gh.update(if3_bp.hasNotTakenBrs, if3_bp.takenOnBr)
173
174
175  val prevHalfInstrReq = WireInit(0.U.asTypeOf(ValidUndirectioned(new PrevHalfInstr)))
176  // only valid when if4_fire
177  val hasPrevHalfInstrReq = prevHalfInstrReq.valid && HasCExtension.B
178
179  val if3_prevHalfInstr = RegInit(0.U.asTypeOf(ValidUndirectioned(new PrevHalfInstr)))
180
181  // 32-bit instr crosses 2 pages, and the higher 16-bit triggers page fault
182  val crossPageIPF = WireInit(false.B)
183
184  val if3_pendingPrevHalfInstr = if3_prevHalfInstr.valid && HasCExtension.B
185
186  // the previous half of RVI instruction waits until it meets its last half
187  val if3_prevHalfInstrMet = if3_pendingPrevHalfInstr && if3_prevHalfInstr.bits.npc === if3_pc && if3_valid
188  // set to invalid once consumed or redirect from backend
189  val if3_prevHalfConsumed = if3_prevHalfInstrMet && if3_fire
190  val if3_prevHalfFlush = if4_flush
191  when (if3_prevHalfFlush) {
192    if3_prevHalfInstr.valid := false.B
193  }.elsewhen (hasPrevHalfInstrReq) {
194    if3_prevHalfInstr.valid := true.B
195  }.elsewhen (if3_prevHalfConsumed) {
196    if3_prevHalfInstr.valid := false.B
197  }
198  when (hasPrevHalfInstrReq) {
199    if3_prevHalfInstr.bits := prevHalfInstrReq.bits
200  }
201  // when bp signal a redirect, we distinguish between taken and not taken
202  // if taken and saveHalfRVI is true, we do not redirect to the target
203
204  class IF3_PC_COMP extends XSModule {
205    val io = IO(new Bundle {
206      val if2_pc = Input(UInt(VAddrBits.W))
207      val pc     = Input(UInt(VAddrBits.W))
208      val if2_valid = Input(Bool())
209      val res = Output(Bool())
210    })
211    io.res := !io.if2_valid || io.if2_valid && io.if2_pc =/= io.pc
212  }
213  def if3_nextValidPCNotEquals(pc: UInt) = {
214    val comp = Module(new IF3_PC_COMP)
215    comp.io.if2_pc := if2_pc
216    comp.io.pc     := pc
217    comp.io.if2_valid := if2_valid
218    comp.io.res
219  }
220
221  val if3_predTakenRedirectVec = VecInit((0 until PredictWidth).map(i => !if3_pendingPrevHalfInstr && if3_bp.realTakens(i) && if3_nextValidPCNotEquals(if3_bp.targets(i))))
222  val if3_prevHalfMetRedirect    = if3_pendingPrevHalfInstr && if3_prevHalfInstrMet && if3_prevHalfInstr.bits.taken && if3_nextValidPCNotEquals(if3_prevHalfInstr.bits.target)
223  val if3_prevHalfNotMetRedirect = if3_pendingPrevHalfInstr && !if3_prevHalfInstrMet && if3_nextValidPCNotEquals(if3_prevHalfInstr.bits.npc)
224  val if3_predTakenRedirect    = ParallelOR(if3_predTakenRedirectVec)
225  val if3_predNotTakenRedirect = !if3_pendingPrevHalfInstr && !if3_bp.taken && if3_nextValidPCNotEquals(if3_snpc)
226  // when pendingPrevHalfInstr, if3_GHInfo is set to the info of last prev half instr
227  // val if3_ghInfoNotIdenticalRedirect = !if3_pendingPrevHalfInstr && if3_GHInfo =/= if3_lastGHInfo && enableGhistRepair.B
228
229  if3_redirect := if3_valid && (
230                    // prevHalf is consumed but the next packet is not where it meant to be
231                    // we do not handle this condition because of the burden of building a correct GHInfo
232                    // prevHalfMetRedirect ||
233                    // prevHalf does not match if3_pc and the next fetch packet is not snpc
234                    if3_prevHalfNotMetRedirect && HasCExtension.B ||
235                    // pred taken and next fetch packet is not the predicted target
236                    if3_predTakenRedirect ||
237                    // pred not taken and next fetch packet is not snpc
238                    if3_predNotTakenRedirect
239                    // GHInfo from last pred does not corresponds with this packet
240                    // if3_ghInfoNotIdenticalRedirect
241                  )
242
243  val if3_target = WireInit(if3_snpc)
244
245  if3_target := Mux1H(Seq((if3_prevHalfNotMetRedirect -> if3_prevHalfInstr.bits.npc),
246                          (if3_predTakenRedirect      -> if3_bp.target),
247                          (if3_predNotTakenRedirect   -> if3_snpc)))
248
249  npcGen.register(if3_redirect, if3_target, Some("if3_target"))
250
251
252  //********************** IF4 ****************************//
253  val if4_pd = RegEnable(icache.io.pd_out, if3_fire)
254  val if4_ipf = RegEnable(icacheResp.ipf || if3_prevHalfInstrMet && if3_prevHalfInstr.bits.ipf, if3_fire)
255  val if4_acf = RegEnable(icacheResp.acf, if3_fire)
256  val if4_crossPageIPF = RegEnable(crossPageIPF, if3_fire)
257  val if4_valid = RegInit(false.B)
258  val if4_fire = if4_valid && io.fetchPacket.ready
259  val if4_pc = RegEnable(if3_pc, if3_fire)
260  val if4_snpc = RegEnable(if3_snpc, if3_fire)
261  // This is the real mask given from icache
262  val if4_mask = RegEnable(icacheResp.mask, if3_fire)
263
264
265  val if4_predHist = RegEnable(if3_predHist, enable=if3_fire)
266  // wait until prevHalfInstr written into reg
267  if4_ready := (io.fetchPacket.ready && !hasPrevHalfInstrReq || !if4_valid) && GTimer() > 500.U
268  when (if4_flush) {
269    if4_valid := false.B
270  }.elsewhen (if3_fire && !if3_flush) {
271    if4_valid := Mux(if3_pendingPrevHalfInstr, if3_prevHalfInstrMet, true.B)
272  }.elsewhen (if4_fire) {
273    if4_valid := false.B
274  }
275
276  val if4_bp = Wire(new BranchPrediction)
277  if4_bp := bpu.io.out(2)
278
279  if4_predicted_gh := if4_gh.update(if4_bp.hasNotTakenBrs, if4_bp.takenOnBr)
280
281  def jal_offset(inst: UInt, rvc: Bool): SInt = {
282    Mux(rvc,
283      Cat(inst(12), inst(8), inst(10, 9), inst(6), inst(7), inst(2), inst(11), inst(5, 3), 0.U(1.W)).asSInt(),
284      Cat(inst(31), inst(19, 12), inst(20), inst(30, 21), 0.U(1.W)).asSInt()
285    )
286  }
287  val if4_instrs = if4_pd.instrs
288  val if4_jals = if4_bp.jalMask
289  val if4_jal_tgts = VecInit((0 until PredictWidth).map(i => (if4_pd.pc(i).asSInt + jal_offset(if4_instrs(i), if4_pd.pd(i).isRVC)).asUInt))
290
291  (0 until PredictWidth).foreach {i =>
292    when (if4_jals(i)) {
293      if4_bp.targets(i) := if4_jal_tgts(i)
294    }
295  }
296
297  // we need this to tell BPU the prediction of prev half
298  // because the prediction is with the start of each inst
299  val if4_prevHalfInstr = RegInit(0.U.asTypeOf(ValidUndirectioned(new PrevHalfInstr)))
300  val if4_pendingPrevHalfInstr = if4_prevHalfInstr.valid && HasCExtension.B
301  val if4_prevHalfInstrMet = if4_pendingPrevHalfInstr && if4_valid
302  val if4_prevHalfConsumed = if4_prevHalfInstrMet && if4_fire
303  val if4_prevHalfFlush = if4_flush
304
305  val if4_takenPrevHalf = WireInit(if4_prevHalfInstrMet && if4_prevHalfInstr.bits.taken)
306  when (if4_prevHalfFlush) {
307    if4_prevHalfInstr.valid := false.B
308  }.elsewhen (if3_prevHalfConsumed) {
309    if4_prevHalfInstr.valid := if3_prevHalfInstr.valid
310  }.elsewhen (if4_prevHalfConsumed) {
311    if4_prevHalfInstr.valid := false.B
312  }
313
314  when (if3_prevHalfConsumed) {
315    if4_prevHalfInstr.bits := if3_prevHalfInstr.bits
316  }
317
318  prevHalfInstrReq.valid := if4_fire && if4_bp.saveHalfRVI && HasCExtension.B
319  val idx = if4_bp.lastHalfRVIIdx
320
321  // // this is result of the last half RVI
322  prevHalfInstrReq.bits.taken := if4_bp.lastHalfRVITaken
323  prevHalfInstrReq.bits.ghInfo := if4_gh
324  prevHalfInstrReq.bits.fetchpc := if4_pc
325  prevHalfInstrReq.bits.idx := idx
326  prevHalfInstrReq.bits.pc := if4_pd.pc(idx)
327  prevHalfInstrReq.bits.npc := if4_pd.pc(idx) + 2.U
328  prevHalfInstrReq.bits.target := if4_bp.lastHalfRVITarget
329  prevHalfInstrReq.bits.instr := if4_pd.instrs(idx)(15, 0)
330  prevHalfInstrReq.bits.ipf := if4_ipf
331  prevHalfInstrReq.bits.meta := bpu.io.bpuMeta(idx)
332
333  class IF4_PC_COMP extends XSModule {
334    val io = IO(new Bundle {
335      val if2_pc = Input(UInt(VAddrBits.W))
336      val if3_pc = Input(UInt(VAddrBits.W))
337      val pc     = Input(UInt(VAddrBits.W))
338      val if2_valid = Input(Bool())
339      val if3_valid = Input(Bool())
340      val res = Output(Bool())
341    })
342    io.res := io.if3_valid  && io.if3_pc =/= io.pc ||
343              !io.if3_valid && (io.if2_valid && io.if2_pc =/= io.pc) ||
344              !io.if3_valid && !io.if2_valid
345  }
346  def if4_nextValidPCNotEquals(pc: UInt) = {
347    val comp = Module(new IF4_PC_COMP)
348    comp.io.if2_pc := if2_pc
349    comp.io.if3_pc := if3_pc
350    comp.io.pc     := pc
351    comp.io.if2_valid := if2_valid
352    comp.io.if3_valid := if3_valid
353    comp.io.res
354  }
355
356  val if4_predTakenRedirectVec = VecInit((0 until PredictWidth).map(i => if4_bp.realTakens(i) && if4_nextValidPCNotEquals(if4_bp.targets(i))))
357
358  val if4_prevHalfNextNotMet = hasPrevHalfInstrReq && if4_nextValidPCNotEquals(prevHalfInstrReq.bits.pc+2.U)
359  val if4_predTakenRedirect = ParallelORR(if4_predTakenRedirectVec)
360  val if4_predNotTakenRedirect = !if4_bp.taken && if4_nextValidPCNotEquals(if4_snpc)
361  // val if4_ghInfoNotIdenticalRedirect = if4_GHInfo =/= if4_lastGHInfo && enableGhistRepair.B
362
363  if4_redirect := if4_valid && (
364                    // when if4 has a lastHalfRVI, but the next fetch packet is not snpc
365                    // if4_prevHalfNextNotMet ||
366                    // when if4 preds taken, but the pc of next fetch packet is not the target
367                    if4_predTakenRedirect ||
368                    // when if4 preds not taken, but the pc of next fetch packet is not snpc
369                    if4_predNotTakenRedirect
370                    // GHInfo from last pred does not corresponds with this packet
371                    // if4_ghInfoNotIdenticalRedirect
372                  )
373
374  val if4_target = WireInit(if4_snpc)
375
376  if4_target := Mux(if4_bp.taken, if4_bp.target, if4_snpc)
377
378  npcGen.register(if4_redirect, if4_target, Some("if4_target"))
379
380  when (if4_fire) {
381    final_gh := if4_predicted_gh
382  }
383  if4_gh := Mux(flush_final_gh, final_gh_bypass, final_gh)
384  if3_gh := Mux(if4_valid && !if4_flush, if4_predicted_gh, if4_gh)
385  if2_gh := Mux(if3_valid && !if3_flush, if3_predicted_gh, if3_gh)
386  if1_gh := Mux(if2_valid && !if2_flush, if2_predicted_gh, if2_gh)
387
388
389
390
391  val cfiUpdate = io.cfiUpdateInfo
392  when (cfiUpdate.valid && (cfiUpdate.bits.isMisPred || cfiUpdate.bits.isReplay)) {
393    val b = cfiUpdate.bits
394    val oldGh = b.bpuMeta.hist
395    val sawNTBr = b.bpuMeta.sawNotTakenBranch
396    val isBr = b.pd.isBr
397    val taken = Mux(cfiUpdate.bits.isReplay, b.bpuMeta.predTaken, b.taken)
398    val updatedGh = oldGh.update(sawNTBr, isBr && taken)
399    final_gh := updatedGh
400    final_gh_bypass := updatedGh
401    flush_final_gh := true.B
402  }
403
404  npcGen.register(io.redirect.valid, io.redirect.bits, Some("backend_redirect"))
405  npcGen.register(RegNext(reset.asBool) && !reset.asBool, resetVector.U(VAddrBits.W), Some("reset_vector"))
406
407  if1_npc := npcGen()
408
409
410  icache.io.req.valid := if1_can_go
411  icache.io.resp.ready := if4_ready
412  icache.io.req.bits.addr := if1_npc
413  icache.io.req.bits.mask := mask(if1_npc)
414  icache.io.flush := Cat(if3_flush, if2_flush)
415  icache.io.mem_grant <> io.icacheMemGrant
416  icache.io.fencei := io.fencei
417  icache.io.prev.valid := if3_prevHalfInstrMet
418  icache.io.prev.bits := if3_prevHalfInstr.bits.instr
419  icache.io.prev_ipf := if3_prevHalfInstr.bits.ipf
420  icache.io.prev_pc := if3_prevHalfInstr.bits.pc
421  io.icacheMemAcq <> icache.io.mem_acquire
422  io.l1plusFlush := icache.io.l1plusflush
423  io.prefetchTrainReq := icache.io.prefetchTrainReq
424
425  bpu.io.cfiUpdateInfo <> io.cfiUpdateInfo
426
427  bpu.io.inFire(0) := if1_can_go
428  bpu.io.inFire(1) := if2_fire
429  bpu.io.inFire(2) := if3_fire
430  bpu.io.inFire(3) := if4_fire
431  bpu.io.in.pc := if1_npc
432  bpu.io.in.hist := if1_gh.asUInt
433  bpu.io.in.inMask := mask(if1_npc)
434  bpu.io.predecode.mask := if4_pd.mask
435  bpu.io.predecode.lastHalf := if4_pd.lastHalf
436  bpu.io.predecode.pd := if4_pd.pd
437  bpu.io.predecode.hasLastHalfRVI := if4_prevHalfInstrMet
438  bpu.io.realMask := if4_mask
439  bpu.io.prevHalf := if4_prevHalfInstr
440
441
442  when (if3_prevHalfInstrMet && icacheResp.ipf && !if3_prevHalfInstr.bits.ipf) {
443    crossPageIPF := true.B // higher 16 bits page fault
444  }
445
446  val fetchPacketValid = if4_valid && !io.redirect.valid
447  val fetchPacketWire = Wire(new FetchPacket)
448
449  fetchPacketWire.instrs := if4_pd.instrs
450  fetchPacketWire.mask := if4_pd.mask & (Fill(PredictWidth, !if4_bp.taken) | (Fill(PredictWidth, 1.U(1.W)) >> (~if4_bp.jmpIdx)))
451  fetchPacketWire.pdmask := if4_pd.mask
452
453  fetchPacketWire.pc := if4_pd.pc
454  (0 until PredictWidth).foreach(i => fetchPacketWire.pnpc(i) := if4_pd.pc(i) + Mux(if4_pd.pd(i).isRVC, 2.U, 4.U))
455  when (if4_bp.taken) {
456    fetchPacketWire.pnpc(if4_bp.jmpIdx) := if4_bp.target
457  }
458  fetchPacketWire.bpuMeta := bpu.io.bpuMeta
459  // save it for update
460  when (if4_pendingPrevHalfInstr) {
461    fetchPacketWire.bpuMeta(0) := if4_prevHalfInstr.bits.meta
462  }
463  (0 until PredictWidth).foreach(i => {
464    val meta = fetchPacketWire.bpuMeta(i)
465    meta.hist := final_gh
466    meta.predHist := if4_predHist.asTypeOf(new GlobalHistory)
467    meta.predTaken := if4_bp.takens(i)
468  })
469  fetchPacketWire.pd := if4_pd.pd
470  fetchPacketWire.ipf := if4_ipf
471  fetchPacketWire.acf := if4_acf
472  fetchPacketWire.crossPageIPFFix := if4_crossPageIPF
473
474  // predTaken Vec
475  fetchPacketWire.predTaken := if4_bp.taken
476
477  io.fetchPacket.bits := fetchPacketWire
478  io.fetchPacket.valid := fetchPacketValid
479
480//  if(IFUDebug) {
481    val predictor_s3 = RegEnable(Mux(if3_redirect, 1.U(log2Up(4).W), 0.U(log2Up(4).W)), if3_fire)
482    val predictor_s4 = Mux(if4_redirect, 2.U, predictor_s3)
483    val predictor = predictor_s4
484
485    fetchPacketWire.bpuMeta.map(_.predictor := predictor)
486 // }
487
488  // val predRight = cfiUpdate.valid && !cfiUpdate.bits.isMisPred && !cfiUpdate.bits.isReplay
489  // val predWrong = cfiUpdate.valid && cfiUpdate.bits.isMisPred && !cfiUpdate.bits.isReplay
490
491  // val ubtbRight = predRight && cfiUpdate.bits.bpuMeta.predictor === 0.U
492  // val ubtbWrong = predWrong && cfiUpdate.bits.bpuMeta.predictor === 0.U
493  // val btbRight  = predRight && cfiUpdate.bits.bpuMeta.predictor === 1.U
494  // val btbWrong  = predWrong && cfiUpdate.bits.bpuMeta.predictor === 1.U
495  // val tageRight = predRight && cfiUpdate.bits.bpuMeta.predictor === 2.U
496  // val tageWrong = predWrong && cfiUpdate.bits.bpuMeta.predictor === 2.U
497  // val loopRight = predRight && cfiUpdate.bits.bpuMeta.predictor === 3.U
498  // val loopWrong = predWrong && cfiUpdate.bits.bpuMeta.predictor === 3.U
499
500  // ExcitingUtils.addSource(ubtbRight, "perfCntubtbRight", Perf)
501  // ExcitingUtils.addSource(ubtbWrong, "perfCntubtbWrong", Perf)
502  // ExcitingUtils.addSource(btbRight, "perfCntbtbRight", Perf)
503  // ExcitingUtils.addSource(btbWrong, "perfCntbtbWrong", Perf)
504  // ExcitingUtils.addSource(tageRight, "perfCnttageRight", Perf)
505  // ExcitingUtils.addSource(tageWrong, "perfCnttageWrong", Perf)
506  // ExcitingUtils.addSource(loopRight, "perfCntloopRight", Perf)
507  // ExcitingUtils.addSource(loopWrong, "perfCntloopWrong", Perf)
508
509  // debug info
510  if (IFUDebug) {
511    XSDebug(RegNext(reset.asBool) && !reset.asBool, "Reseting...\n")
512    XSDebug(icache.io.flush(0).asBool, "Flush icache stage2...\n")
513    XSDebug(icache.io.flush(1).asBool, "Flush icache stage3...\n")
514    XSDebug(io.redirect.valid, p"Redirect from backend! target=${Hexadecimal(io.redirect.bits)}\n")
515
516    XSDebug("[IF1] v=%d     fire=%d  cango=%d          flush=%d pc=%x mask=%b\n", if1_valid, if1_fire,if1_can_go, if1_flush, if1_npc, mask(if1_npc))
517    XSDebug("[IF2] v=%d r=%d fire=%d redirect=%d flush=%d pc=%x snpc=%x\n", if2_valid, if2_ready, if2_fire, if2_redirect, if2_flush, if2_pc, if2_snpc)
518    XSDebug("[IF3] v=%d r=%d fire=%d redirect=%d flush=%d pc=%x crossPageIPF=%d sawNTBrs=%d\n", if3_valid, if3_ready, if3_fire, if3_redirect, if3_flush, if3_pc, crossPageIPF, if3_bp.hasNotTakenBrs)
519    XSDebug("[IF4] v=%d r=%d fire=%d redirect=%d flush=%d pc=%x crossPageIPF=%d sawNTBrs=%d\n", if4_valid, if4_ready, if4_fire, if4_redirect, if4_flush, if4_pc, if4_crossPageIPF, if4_bp.hasNotTakenBrs)
520    XSDebug("[predictor] predictor_s3=%d, predictor_s4=%d, predictor=%d\n", predictor_s3, predictor_s4, predictor)
521    XSDebug("[IF1][icacheReq] v=%d r=%d addr=%x\n", icache.io.req.valid, icache.io.req.ready, icache.io.req.bits.addr)
522    XSDebug("[IF1][ghr] hist=%b\n", if1_gh.asUInt)
523    XSDebug("[IF1][ghr] extHist=%b\n\n", if1_gh.asUInt)
524
525    XSDebug("[IF2][bp] taken=%d jmpIdx=%d hasNTBrs=%d target=%x saveHalfRVI=%d\n\n", if2_bp.taken, if2_bp.jmpIdx, if2_bp.hasNotTakenBrs, if2_bp.target, if2_bp.saveHalfRVI)
526    if2_gh.debug("if2")
527
528    XSDebug("[IF3][icacheResp] v=%d r=%d pc=%x mask=%b\n", icache.io.resp.valid, icache.io.resp.ready, icache.io.resp.bits.pc, icache.io.resp.bits.mask)
529    XSDebug("[IF3][bp] taken=%d jmpIdx=%d hasNTBrs=%d target=%x saveHalfRVI=%d\n", if3_bp.taken, if3_bp.jmpIdx, if3_bp.hasNotTakenBrs, if3_bp.target, if3_bp.saveHalfRVI)
530    XSDebug("[IF3][redirect]: v=%d, prevMet=%d, prevNMet=%d, predT=%d, predNT=%d\n", if3_redirect, if3_prevHalfMetRedirect, if3_prevHalfNotMetRedirect, if3_predTakenRedirect, if3_predNotTakenRedirect)
531    // XSDebug("[IF3][prevHalfInstr] v=%d redirect=%d fetchpc=%x idx=%d tgt=%x taken=%d instr=%x\n\n",
532    //   prev_half_valid, prev_half_redirect, prev_half_fetchpc, prev_half_idx, prev_half_tgt, prev_half_taken, prev_half_instr)
533    XSDebug("[IF3][if3_prevHalfInstr] v=%d taken=%d fetchpc=%x idx=%d pc=%x npc=%x tgt=%x instr=%x ipf=%d\n\n",
534    if3_prevHalfInstr.valid, if3_prevHalfInstr.bits.taken, if3_prevHalfInstr.bits.fetchpc, if3_prevHalfInstr.bits.idx, if3_prevHalfInstr.bits.pc, if3_prevHalfInstr.bits.npc, if3_prevHalfInstr.bits.target, if3_prevHalfInstr.bits.instr, if3_prevHalfInstr.bits.ipf)
535    if3_gh.debug("if3")
536
537    XSDebug("[IF4][predecode] mask=%b\n", if4_pd.mask)
538    XSDebug("[IF4][snpc]: %x, realMask=%b\n", if4_snpc, if4_mask)
539    XSDebug("[IF4][bp] taken=%d jmpIdx=%d hasNTBrs=%d target=%x saveHalfRVI=%d\n", if4_bp.taken, if4_bp.jmpIdx, if4_bp.hasNotTakenBrs, if4_bp.target, if4_bp.saveHalfRVI)
540    XSDebug("[IF4][redirect]: v=%d, prevNotMet=%d, predT=%d, predNT=%d\n", if4_redirect, if4_prevHalfNextNotMet, if4_predTakenRedirect, if4_predNotTakenRedirect)
541    XSDebug(if4_pd.pd(if4_bp.jmpIdx).isJal && if4_bp.taken, "[IF4] cfi is jal!  instr=%x target=%x\n", if4_instrs(if4_bp.jmpIdx), if4_jal_tgts(if4_bp.jmpIdx))
542    XSDebug("[IF4][ prevHalfInstrReq] v=%d taken=%d fetchpc=%x idx=%d pc=%x npc=%x tgt=%x instr=%x ipf=%d\n",
543      prevHalfInstrReq.valid, prevHalfInstrReq.bits.taken, prevHalfInstrReq.bits.fetchpc, prevHalfInstrReq.bits.idx, prevHalfInstrReq.bits.pc, prevHalfInstrReq.bits.npc, prevHalfInstrReq.bits.target, prevHalfInstrReq.bits.instr, prevHalfInstrReq.bits.ipf)
544    XSDebug("[IF4][if4_prevHalfInstr] v=%d taken=%d fetchpc=%x idx=%d pc=%x npc=%x tgt=%x instr=%x ipf=%d\n",
545      if4_prevHalfInstr.valid, if4_prevHalfInstr.bits.taken, if4_prevHalfInstr.bits.fetchpc, if4_prevHalfInstr.bits.idx, if4_prevHalfInstr.bits.pc, if4_prevHalfInstr.bits.npc, if4_prevHalfInstr.bits.target, if4_prevHalfInstr.bits.instr, if4_prevHalfInstr.bits.ipf)
546    if4_gh.debug("if4")
547    XSDebug(io.fetchPacket.fire(), "[IF4][fetchPacket] v=%d r=%d mask=%b ipf=%d acf=%d crossPageIPF=%d\n",
548      io.fetchPacket.valid, io.fetchPacket.ready, io.fetchPacket.bits.mask, io.fetchPacket.bits.ipf, io.fetchPacket.bits.acf, io.fetchPacket.bits.crossPageIPFFix)
549    for (i <- 0 until PredictWidth) {
550      XSDebug(io.fetchPacket.fire(), "[IF4][fetchPacket] %b %x pc=%x pnpc=%x pd: rvc=%d brType=%b call=%d ret=%d\n",
551        io.fetchPacket.bits.mask(i),
552        io.fetchPacket.bits.instrs(i),
553        io.fetchPacket.bits.pc(i),
554        io.fetchPacket.bits.pnpc(i),
555        io.fetchPacket.bits.pd(i).isRVC,
556        io.fetchPacket.bits.pd(i).brType,
557        io.fetchPacket.bits.pd(i).isCall,
558        io.fetchPacket.bits.pd(i).isRet
559      )
560    }
561  }
562}
563