xref: /XiangShan/src/main/scala/xiangshan/frontend/NewFtq.scala (revision f21bbcb2c32693a75e46ec8142a3d372a5c4efe5)
109c6f1ddSLingrui98/***************************************************************************************
209c6f1ddSLingrui98* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
309c6f1ddSLingrui98* Copyright (c) 2020-2021 Peng Cheng Laboratory
409c6f1ddSLingrui98*
509c6f1ddSLingrui98* XiangShan is licensed under Mulan PSL v2.
609c6f1ddSLingrui98* You can use this software according to the terms and conditions of the Mulan PSL v2.
709c6f1ddSLingrui98* You may obtain a copy of Mulan PSL v2 at:
809c6f1ddSLingrui98*          http://license.coscl.org.cn/MulanPSL2
909c6f1ddSLingrui98*
1009c6f1ddSLingrui98* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
1109c6f1ddSLingrui98* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
1209c6f1ddSLingrui98* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
1309c6f1ddSLingrui98*
1409c6f1ddSLingrui98* See the Mulan PSL v2 for more details.
1509c6f1ddSLingrui98***************************************************************************************/
1609c6f1ddSLingrui98
1709c6f1ddSLingrui98package xiangshan.frontend
1809c6f1ddSLingrui98
1909c6f1ddSLingrui98import chipsalliance.rocketchip.config.Parameters
2009c6f1ddSLingrui98import chisel3._
2109c6f1ddSLingrui98import chisel3.util._
221ca0e4f3SYinan Xuimport utils._
233c02ee8fSwakafaimport utility._
2409c6f1ddSLingrui98import xiangshan._
25e30430c2SJayimport xiangshan.frontend.icache._
261ca0e4f3SYinan Xuimport xiangshan.backend.CtrlToFtqIO
272e1be6e1SSteve Gouimport xiangshan.backend.decode.ImmUnion
283c02ee8fSwakafaimport utility.ChiselDB
2951532d8bSGuokai Chen
3051532d8bSGuokai Chenclass FtqDebugBundle extends Bundle {
3151532d8bSGuokai Chen  val pc = UInt(39.W)
3251532d8bSGuokai Chen  val target = UInt(39.W)
3351532d8bSGuokai Chen  val isBr = Bool()
3451532d8bSGuokai Chen  val isJmp = Bool()
3551532d8bSGuokai Chen  val isCall = Bool()
3651532d8bSGuokai Chen  val isRet = Bool()
3751532d8bSGuokai Chen  val misPred = Bool()
3851532d8bSGuokai Chen  val isTaken = Bool()
3951532d8bSGuokai Chen  val predStage = UInt(2.W)
4051532d8bSGuokai Chen}
4109c6f1ddSLingrui98
4209c6f1ddSLingrui98class FtqPtr(implicit p: Parameters) extends CircularQueuePtr[FtqPtr](
4309c6f1ddSLingrui98  p => p(XSCoreParamsKey).FtqSize
4409c6f1ddSLingrui98){
4509c6f1ddSLingrui98}
4609c6f1ddSLingrui98
4709c6f1ddSLingrui98object FtqPtr {
4809c6f1ddSLingrui98  def apply(f: Bool, v: UInt)(implicit p: Parameters): FtqPtr = {
4909c6f1ddSLingrui98    val ptr = Wire(new FtqPtr)
5009c6f1ddSLingrui98    ptr.flag := f
5109c6f1ddSLingrui98    ptr.value := v
5209c6f1ddSLingrui98    ptr
5309c6f1ddSLingrui98  }
5409c6f1ddSLingrui98  def inverse(ptr: FtqPtr)(implicit p: Parameters): FtqPtr = {
5509c6f1ddSLingrui98    apply(!ptr.flag, ptr.value)
5609c6f1ddSLingrui98  }
5709c6f1ddSLingrui98}
5809c6f1ddSLingrui98
5909c6f1ddSLingrui98class FtqNRSRAM[T <: Data](gen: T, numRead: Int)(implicit p: Parameters) extends XSModule {
6009c6f1ddSLingrui98
6109c6f1ddSLingrui98  val io = IO(new Bundle() {
6209c6f1ddSLingrui98    val raddr = Input(Vec(numRead, UInt(log2Up(FtqSize).W)))
6309c6f1ddSLingrui98    val ren = Input(Vec(numRead, Bool()))
6409c6f1ddSLingrui98    val rdata = Output(Vec(numRead, gen))
6509c6f1ddSLingrui98    val waddr = Input(UInt(log2Up(FtqSize).W))
6609c6f1ddSLingrui98    val wen = Input(Bool())
6709c6f1ddSLingrui98    val wdata = Input(gen)
6809c6f1ddSLingrui98  })
6909c6f1ddSLingrui98
7009c6f1ddSLingrui98  for(i <- 0 until numRead){
7109c6f1ddSLingrui98    val sram = Module(new SRAMTemplate(gen, FtqSize))
7209c6f1ddSLingrui98    sram.io.r.req.valid := io.ren(i)
7309c6f1ddSLingrui98    sram.io.r.req.bits.setIdx := io.raddr(i)
7409c6f1ddSLingrui98    io.rdata(i) := sram.io.r.resp.data(0)
7509c6f1ddSLingrui98    sram.io.w.req.valid := io.wen
7609c6f1ddSLingrui98    sram.io.w.req.bits.setIdx := io.waddr
7709c6f1ddSLingrui98    sram.io.w.req.bits.data := VecInit(io.wdata)
7809c6f1ddSLingrui98  }
7909c6f1ddSLingrui98
8009c6f1ddSLingrui98}
8109c6f1ddSLingrui98
8209c6f1ddSLingrui98class Ftq_RF_Components(implicit p: Parameters) extends XSBundle with BPUUtils {
8309c6f1ddSLingrui98  val startAddr = UInt(VAddrBits.W)
84b37e4b45SLingrui98  val nextLineAddr = UInt(VAddrBits.W)
8509c6f1ddSLingrui98  val isNextMask = Vec(PredictWidth, Bool())
86b37e4b45SLingrui98  val fallThruError = Bool()
87b37e4b45SLingrui98  // val carry = Bool()
8809c6f1ddSLingrui98  def getPc(offset: UInt) = {
8985215037SLingrui98    def getHigher(pc: UInt) = pc(VAddrBits-1, log2Ceil(PredictWidth)+instOffsetBits+1)
9085215037SLingrui98    def getOffset(pc: UInt) = pc(log2Ceil(PredictWidth)+instOffsetBits, instOffsetBits)
91b37e4b45SLingrui98    Cat(getHigher(Mux(isNextMask(offset) && startAddr(log2Ceil(PredictWidth)+instOffsetBits), nextLineAddr, startAddr)),
9209c6f1ddSLingrui98        getOffset(startAddr)+offset, 0.U(instOffsetBits.W))
9309c6f1ddSLingrui98  }
9409c6f1ddSLingrui98  def fromBranchPrediction(resp: BranchPredictionBundle) = {
95a229ab6cSLingrui98    def carryPos(addr: UInt) = addr(instOffsetBits+log2Ceil(PredictWidth)+1)
9609c6f1ddSLingrui98    this.startAddr := resp.pc
97a60a2901SLingrui98    this.nextLineAddr := resp.pc + (FetchWidth * 4 * 2).U // may be broken on other configs
9809c6f1ddSLingrui98    this.isNextMask := VecInit((0 until PredictWidth).map(i =>
9909c6f1ddSLingrui98      (resp.pc(log2Ceil(PredictWidth), 1) +& i.U)(log2Ceil(PredictWidth)).asBool()
10009c6f1ddSLingrui98    ))
101b37e4b45SLingrui98    this.fallThruError := resp.fallThruError
10209c6f1ddSLingrui98    this
10309c6f1ddSLingrui98  }
10409c6f1ddSLingrui98  override def toPrintable: Printable = {
105b37e4b45SLingrui98    p"startAddr:${Hexadecimal(startAddr)}"
10609c6f1ddSLingrui98  }
10709c6f1ddSLingrui98}
10809c6f1ddSLingrui98
10909c6f1ddSLingrui98class Ftq_pd_Entry(implicit p: Parameters) extends XSBundle {
11009c6f1ddSLingrui98  val brMask = Vec(PredictWidth, Bool())
11109c6f1ddSLingrui98  val jmpInfo = ValidUndirectioned(Vec(3, Bool()))
11209c6f1ddSLingrui98  val jmpOffset = UInt(log2Ceil(PredictWidth).W)
11309c6f1ddSLingrui98  val jalTarget = UInt(VAddrBits.W)
11409c6f1ddSLingrui98  val rvcMask = Vec(PredictWidth, Bool())
11509c6f1ddSLingrui98  def hasJal  = jmpInfo.valid && !jmpInfo.bits(0)
11609c6f1ddSLingrui98  def hasJalr = jmpInfo.valid && jmpInfo.bits(0)
11709c6f1ddSLingrui98  def hasCall = jmpInfo.valid && jmpInfo.bits(1)
11809c6f1ddSLingrui98  def hasRet  = jmpInfo.valid && jmpInfo.bits(2)
11909c6f1ddSLingrui98
12009c6f1ddSLingrui98  def fromPdWb(pdWb: PredecodeWritebackBundle) = {
12109c6f1ddSLingrui98    val pds = pdWb.pd
12209c6f1ddSLingrui98    this.brMask := VecInit(pds.map(pd => pd.isBr && pd.valid))
12309c6f1ddSLingrui98    this.jmpInfo.valid := VecInit(pds.map(pd => (pd.isJal || pd.isJalr) && pd.valid)).asUInt.orR
12409c6f1ddSLingrui98    this.jmpInfo.bits := ParallelPriorityMux(pds.map(pd => (pd.isJal || pd.isJalr) && pd.valid),
12509c6f1ddSLingrui98                                             pds.map(pd => VecInit(pd.isJalr, pd.isCall, pd.isRet)))
12609c6f1ddSLingrui98    this.jmpOffset := ParallelPriorityEncoder(pds.map(pd => (pd.isJal || pd.isJalr) && pd.valid))
12709c6f1ddSLingrui98    this.rvcMask := VecInit(pds.map(pd => pd.isRVC))
12809c6f1ddSLingrui98    this.jalTarget := pdWb.jalTarget
12909c6f1ddSLingrui98  }
13009c6f1ddSLingrui98
13109c6f1ddSLingrui98  def toPd(offset: UInt) = {
13209c6f1ddSLingrui98    require(offset.getWidth == log2Ceil(PredictWidth))
13309c6f1ddSLingrui98    val pd = Wire(new PreDecodeInfo)
13409c6f1ddSLingrui98    pd.valid := true.B
13509c6f1ddSLingrui98    pd.isRVC := rvcMask(offset)
13609c6f1ddSLingrui98    val isBr = brMask(offset)
13709c6f1ddSLingrui98    val isJalr = offset === jmpOffset && jmpInfo.valid && jmpInfo.bits(0)
13809c6f1ddSLingrui98    pd.brType := Cat(offset === jmpOffset && jmpInfo.valid, isJalr || isBr)
13909c6f1ddSLingrui98    pd.isCall := offset === jmpOffset && jmpInfo.valid && jmpInfo.bits(1)
14009c6f1ddSLingrui98    pd.isRet  := offset === jmpOffset && jmpInfo.valid && jmpInfo.bits(2)
14109c6f1ddSLingrui98    pd
14209c6f1ddSLingrui98  }
14309c6f1ddSLingrui98}
14409c6f1ddSLingrui98
14509c6f1ddSLingrui98
14609c6f1ddSLingrui98
147c2d1ec7dSLingrui98class Ftq_Redirect_SRAMEntry(implicit p: Parameters) extends SpeculativeInfo {}
14809c6f1ddSLingrui98
14909c6f1ddSLingrui98class Ftq_1R_SRAMEntry(implicit p: Parameters) extends XSBundle with HasBPUConst {
15009c6f1ddSLingrui98  val meta = UInt(MaxMetaLength.W)
15109c6f1ddSLingrui98}
15209c6f1ddSLingrui98
15309c6f1ddSLingrui98class Ftq_Pred_Info(implicit p: Parameters) extends XSBundle {
15409c6f1ddSLingrui98  val target = UInt(VAddrBits.W)
15509c6f1ddSLingrui98  val cfiIndex = ValidUndirectioned(UInt(log2Ceil(PredictWidth).W))
15609c6f1ddSLingrui98}
15709c6f1ddSLingrui98
15809c6f1ddSLingrui98
15909c6f1ddSLingrui98class FtqRead[T <: Data](private val gen: T)(implicit p: Parameters) extends XSBundle {
16009c6f1ddSLingrui98  val ptr = Output(new FtqPtr)
16109c6f1ddSLingrui98  val offset = Output(UInt(log2Ceil(PredictWidth).W))
16209c6f1ddSLingrui98  val data = Input(gen)
16309c6f1ddSLingrui98  def apply(ptr: FtqPtr, offset: UInt) = {
16409c6f1ddSLingrui98    this.ptr := ptr
16509c6f1ddSLingrui98    this.offset := offset
16609c6f1ddSLingrui98    this.data
16709c6f1ddSLingrui98  }
16809c6f1ddSLingrui98}
16909c6f1ddSLingrui98
17009c6f1ddSLingrui98
17109c6f1ddSLingrui98class FtqToBpuIO(implicit p: Parameters) extends XSBundle {
17209c6f1ddSLingrui98  val redirect = Valid(new BranchPredictionRedirect)
17309c6f1ddSLingrui98  val update = Valid(new BranchPredictionUpdate)
17409c6f1ddSLingrui98  val enq_ptr = Output(new FtqPtr)
17509c6f1ddSLingrui98}
17609c6f1ddSLingrui98
17709c6f1ddSLingrui98class FtqToIfuIO(implicit p: Parameters) extends XSBundle with HasCircularQueuePtrHelper {
17809c6f1ddSLingrui98  val req = Decoupled(new FetchRequestBundle)
17909c6f1ddSLingrui98  val redirect = Valid(new Redirect)
18009c6f1ddSLingrui98  val flushFromBpu = new Bundle {
18109c6f1ddSLingrui98    // when ifu pipeline is not stalled,
18209c6f1ddSLingrui98    // a packet from bpu s3 can reach f1 at most
18309c6f1ddSLingrui98    val s2 = Valid(new FtqPtr)
184cb4f77ceSLingrui98    val s3 = Valid(new FtqPtr)
18509c6f1ddSLingrui98    def shouldFlushBy(src: Valid[FtqPtr], idx_to_flush: FtqPtr) = {
18609c6f1ddSLingrui98      src.valid && !isAfter(src.bits, idx_to_flush)
18709c6f1ddSLingrui98    }
18809c6f1ddSLingrui98    def shouldFlushByStage2(idx: FtqPtr) = shouldFlushBy(s2, idx)
189cb4f77ceSLingrui98    def shouldFlushByStage3(idx: FtqPtr) = shouldFlushBy(s3, idx)
19009c6f1ddSLingrui98  }
19109c6f1ddSLingrui98}
19209c6f1ddSLingrui98
193c5c5edaeSJeniusclass FtqToICacheIO(implicit p: Parameters) extends XSBundle with HasCircularQueuePtrHelper {
194c5c5edaeSJenius  //NOTE: req.bits must be prepare in T cycle
195c5c5edaeSJenius  // while req.valid is set true in T + 1 cycle
196c5c5edaeSJenius  val req = Decoupled(new FtqToICacheRequestBundle)
197c5c5edaeSJenius}
198c5c5edaeSJenius
19909c6f1ddSLingrui98trait HasBackendRedirectInfo extends HasXSParameter {
2002e1be6e1SSteve Gou  def numRedirectPcRead = exuParameters.JmpCnt + exuParameters.AluCnt + 1
20109c6f1ddSLingrui98  def isLoadReplay(r: Valid[Redirect]) = r.bits.flushItself()
20209c6f1ddSLingrui98}
20309c6f1ddSLingrui98
20409c6f1ddSLingrui98class FtqToCtrlIO(implicit p: Parameters) extends XSBundle with HasBackendRedirectInfo {
205b56f947eSYinan Xu  // write to backend pc mem
206b56f947eSYinan Xu  val pc_mem_wen = Output(Bool())
207b56f947eSYinan Xu  val pc_mem_waddr = Output(UInt(log2Ceil(FtqSize).W))
208b56f947eSYinan Xu  val pc_mem_wdata = Output(new Ftq_RF_Components)
209873dc383SLingrui98  // newest target
210873dc383SLingrui98  val newest_entry_target = Output(UInt(VAddrBits.W))
211873dc383SLingrui98  val newest_entry_ptr = Output(new FtqPtr)
21209c6f1ddSLingrui98}
21309c6f1ddSLingrui98
21409c6f1ddSLingrui98
21509c6f1ddSLingrui98class FTBEntryGen(implicit p: Parameters) extends XSModule with HasBackendRedirectInfo with HasBPUParameter {
21609c6f1ddSLingrui98  val io = IO(new Bundle {
21709c6f1ddSLingrui98    val start_addr = Input(UInt(VAddrBits.W))
21809c6f1ddSLingrui98    val old_entry = Input(new FTBEntry)
21909c6f1ddSLingrui98    val pd = Input(new Ftq_pd_Entry)
22009c6f1ddSLingrui98    val cfiIndex = Flipped(Valid(UInt(log2Ceil(PredictWidth).W)))
22109c6f1ddSLingrui98    val target = Input(UInt(VAddrBits.W))
22209c6f1ddSLingrui98    val hit = Input(Bool())
22309c6f1ddSLingrui98    val mispredict_vec = Input(Vec(PredictWidth, Bool()))
22409c6f1ddSLingrui98
22509c6f1ddSLingrui98    val new_entry = Output(new FTBEntry)
22609c6f1ddSLingrui98    val new_br_insert_pos = Output(Vec(numBr, Bool()))
22709c6f1ddSLingrui98    val taken_mask = Output(Vec(numBr, Bool()))
228803124a6SLingrui98    val jmp_taken = Output(Bool())
22909c6f1ddSLingrui98    val mispred_mask = Output(Vec(numBr+1, Bool()))
23009c6f1ddSLingrui98
23109c6f1ddSLingrui98    // for perf counters
23209c6f1ddSLingrui98    val is_init_entry = Output(Bool())
23309c6f1ddSLingrui98    val is_old_entry = Output(Bool())
23409c6f1ddSLingrui98    val is_new_br = Output(Bool())
23509c6f1ddSLingrui98    val is_jalr_target_modified = Output(Bool())
23609c6f1ddSLingrui98    val is_always_taken_modified = Output(Bool())
23709c6f1ddSLingrui98    val is_br_full = Output(Bool())
23809c6f1ddSLingrui98  })
23909c6f1ddSLingrui98
24009c6f1ddSLingrui98  // no mispredictions detected at predecode
24109c6f1ddSLingrui98  val hit = io.hit
24209c6f1ddSLingrui98  val pd = io.pd
24309c6f1ddSLingrui98
24409c6f1ddSLingrui98  val init_entry = WireInit(0.U.asTypeOf(new FTBEntry))
24509c6f1ddSLingrui98
24609c6f1ddSLingrui98
24709c6f1ddSLingrui98  val cfi_is_br = pd.brMask(io.cfiIndex.bits) && io.cfiIndex.valid
24809c6f1ddSLingrui98  val entry_has_jmp = pd.jmpInfo.valid
24909c6f1ddSLingrui98  val new_jmp_is_jal  = entry_has_jmp && !pd.jmpInfo.bits(0) && io.cfiIndex.valid
25009c6f1ddSLingrui98  val new_jmp_is_jalr = entry_has_jmp &&  pd.jmpInfo.bits(0) && io.cfiIndex.valid
25109c6f1ddSLingrui98  val new_jmp_is_call = entry_has_jmp &&  pd.jmpInfo.bits(1) && io.cfiIndex.valid
25209c6f1ddSLingrui98  val new_jmp_is_ret  = entry_has_jmp &&  pd.jmpInfo.bits(2) && io.cfiIndex.valid
25309c6f1ddSLingrui98  val last_jmp_rvi = entry_has_jmp && pd.jmpOffset === (PredictWidth-1).U && !pd.rvcMask.last
254a60a2901SLingrui98  // val last_br_rvi = cfi_is_br && io.cfiIndex.bits === (PredictWidth-1).U && !pd.rvcMask.last
25509c6f1ddSLingrui98
25609c6f1ddSLingrui98  val cfi_is_jal = io.cfiIndex.bits === pd.jmpOffset && new_jmp_is_jal
25709c6f1ddSLingrui98  val cfi_is_jalr = io.cfiIndex.bits === pd.jmpOffset && new_jmp_is_jalr
25809c6f1ddSLingrui98
259a60a2901SLingrui98  def carryPos = log2Ceil(PredictWidth)+instOffsetBits
26009c6f1ddSLingrui98  def getLower(pc: UInt) = pc(carryPos-1, instOffsetBits)
26109c6f1ddSLingrui98  // if not hit, establish a new entry
26209c6f1ddSLingrui98  init_entry.valid := true.B
26309c6f1ddSLingrui98  // tag is left for ftb to assign
264eeb5ff92SLingrui98
265eeb5ff92SLingrui98  // case br
266eeb5ff92SLingrui98  val init_br_slot = init_entry.getSlotForBr(0)
267eeb5ff92SLingrui98  when (cfi_is_br) {
268eeb5ff92SLingrui98    init_br_slot.valid := true.B
269eeb5ff92SLingrui98    init_br_slot.offset := io.cfiIndex.bits
270b37e4b45SLingrui98    init_br_slot.setLowerStatByTarget(io.start_addr, io.target, numBr == 1)
271eeb5ff92SLingrui98    init_entry.always_taken(0) := true.B // set to always taken on init
272eeb5ff92SLingrui98  }
273eeb5ff92SLingrui98
274eeb5ff92SLingrui98  // case jmp
275eeb5ff92SLingrui98  when (entry_has_jmp) {
276eeb5ff92SLingrui98    init_entry.tailSlot.offset := pd.jmpOffset
277eeb5ff92SLingrui98    init_entry.tailSlot.valid := new_jmp_is_jal || new_jmp_is_jalr
278eeb5ff92SLingrui98    init_entry.tailSlot.setLowerStatByTarget(io.start_addr, Mux(cfi_is_jalr, io.target, pd.jalTarget), isShare=false)
279eeb5ff92SLingrui98  }
280eeb5ff92SLingrui98
28109c6f1ddSLingrui98  val jmpPft = getLower(io.start_addr) +& pd.jmpOffset +& Mux(pd.rvcMask(pd.jmpOffset), 1.U, 2.U)
282a60a2901SLingrui98  init_entry.pftAddr := Mux(entry_has_jmp && !last_jmp_rvi, jmpPft, getLower(io.start_addr))
283a60a2901SLingrui98  init_entry.carry   := Mux(entry_has_jmp && !last_jmp_rvi, jmpPft(carryPos-instOffsetBits), true.B)
28409c6f1ddSLingrui98  init_entry.isJalr := new_jmp_is_jalr
28509c6f1ddSLingrui98  init_entry.isCall := new_jmp_is_call
28609c6f1ddSLingrui98  init_entry.isRet  := new_jmp_is_ret
287f4ebc4b2SLingrui98  // that means fall thru points to the middle of an inst
288ae409b75SSteve Gou  init_entry.last_may_be_rvi_call := pd.jmpOffset === (PredictWidth-1).U && !pd.rvcMask(pd.jmpOffset)
28909c6f1ddSLingrui98
29009c6f1ddSLingrui98  // if hit, check whether a new cfi(only br is possible) is detected
29109c6f1ddSLingrui98  val oe = io.old_entry
292eeb5ff92SLingrui98  val br_recorded_vec = oe.getBrRecordedVec(io.cfiIndex.bits)
29309c6f1ddSLingrui98  val br_recorded = br_recorded_vec.asUInt.orR
29409c6f1ddSLingrui98  val is_new_br = cfi_is_br && !br_recorded
29509c6f1ddSLingrui98  val new_br_offset = io.cfiIndex.bits
29609c6f1ddSLingrui98  // vec(i) means new br will be inserted BEFORE old br(i)
297eeb5ff92SLingrui98  val allBrSlotsVec = oe.allSlotsForBr
29809c6f1ddSLingrui98  val new_br_insert_onehot = VecInit((0 until numBr).map{
29909c6f1ddSLingrui98    i => i match {
300eeb5ff92SLingrui98      case 0 =>
301eeb5ff92SLingrui98        !allBrSlotsVec(0).valid || new_br_offset < allBrSlotsVec(0).offset
302eeb5ff92SLingrui98      case idx =>
303eeb5ff92SLingrui98        allBrSlotsVec(idx-1).valid && new_br_offset > allBrSlotsVec(idx-1).offset &&
304eeb5ff92SLingrui98        (!allBrSlotsVec(idx).valid || new_br_offset < allBrSlotsVec(idx).offset)
30509c6f1ddSLingrui98    }
30609c6f1ddSLingrui98  })
30709c6f1ddSLingrui98
30809c6f1ddSLingrui98  val old_entry_modified = WireInit(io.old_entry)
30909c6f1ddSLingrui98  for (i <- 0 until numBr) {
310eeb5ff92SLingrui98    val slot = old_entry_modified.allSlotsForBr(i)
311eeb5ff92SLingrui98    when (new_br_insert_onehot(i)) {
312eeb5ff92SLingrui98      slot.valid := true.B
313eeb5ff92SLingrui98      slot.offset := new_br_offset
314b37e4b45SLingrui98      slot.setLowerStatByTarget(io.start_addr, io.target, i == numBr-1)
315eeb5ff92SLingrui98      old_entry_modified.always_taken(i) := true.B
316eeb5ff92SLingrui98    }.elsewhen (new_br_offset > oe.allSlotsForBr(i).offset) {
317eeb5ff92SLingrui98      old_entry_modified.always_taken(i) := false.B
318eeb5ff92SLingrui98      // all other fields remain unchanged
319eeb5ff92SLingrui98    }.otherwise {
320eeb5ff92SLingrui98      // case i == 0, remain unchanged
321eeb5ff92SLingrui98      if (i != 0) {
322b37e4b45SLingrui98        val noNeedToMoveFromFormerSlot = (i == numBr-1).B && !oe.brSlots.last.valid
323eeb5ff92SLingrui98        when (!noNeedToMoveFromFormerSlot) {
324eeb5ff92SLingrui98          slot.fromAnotherSlot(oe.allSlotsForBr(i-1))
325eeb5ff92SLingrui98          old_entry_modified.always_taken(i) := oe.always_taken(i)
32609c6f1ddSLingrui98        }
327eeb5ff92SLingrui98      }
328eeb5ff92SLingrui98    }
329eeb5ff92SLingrui98  }
33009c6f1ddSLingrui98
331eeb5ff92SLingrui98  // two circumstances:
332eeb5ff92SLingrui98  // 1. oe: | br | j  |, new br should be in front of j, thus addr of j should be new pft
333eeb5ff92SLingrui98  // 2. oe: | br | br |, new br could be anywhere between, thus new pft is the addr of either
334eeb5ff92SLingrui98  //        the previous last br or the new br
335eeb5ff92SLingrui98  val may_have_to_replace = oe.noEmptySlotForNewBr
336eeb5ff92SLingrui98  val pft_need_to_change = is_new_br && may_have_to_replace
33709c6f1ddSLingrui98  // it should either be the given last br or the new br
33809c6f1ddSLingrui98  when (pft_need_to_change) {
339eeb5ff92SLingrui98    val new_pft_offset =
340710a8720SLingrui98      Mux(!new_br_insert_onehot.asUInt.orR,
341710a8720SLingrui98        new_br_offset, oe.allSlotsForBr.last.offset)
342eeb5ff92SLingrui98
343710a8720SLingrui98    // set jmp to invalid
34409c6f1ddSLingrui98    old_entry_modified.pftAddr := getLower(io.start_addr) + new_pft_offset
34509c6f1ddSLingrui98    old_entry_modified.carry := (getLower(io.start_addr) +& new_pft_offset).head(1).asBool
346f4ebc4b2SLingrui98    old_entry_modified.last_may_be_rvi_call := false.B
34709c6f1ddSLingrui98    old_entry_modified.isCall := false.B
34809c6f1ddSLingrui98    old_entry_modified.isRet := false.B
349eeb5ff92SLingrui98    old_entry_modified.isJalr := false.B
35009c6f1ddSLingrui98  }
35109c6f1ddSLingrui98
35209c6f1ddSLingrui98  val old_entry_jmp_target_modified = WireInit(oe)
353710a8720SLingrui98  val old_target = oe.tailSlot.getTarget(io.start_addr) // may be wrong because we store only 20 lowest bits
354b37e4b45SLingrui98  val old_tail_is_jmp = !oe.tailSlot.sharing
355eeb5ff92SLingrui98  val jalr_target_modified = cfi_is_jalr && (old_target =/= io.target) && old_tail_is_jmp // TODO: pass full jalr target
3563bcae573SLingrui98  when (jalr_target_modified) {
35709c6f1ddSLingrui98    old_entry_jmp_target_modified.setByJmpTarget(io.start_addr, io.target)
35809c6f1ddSLingrui98    old_entry_jmp_target_modified.always_taken := 0.U.asTypeOf(Vec(numBr, Bool()))
35909c6f1ddSLingrui98  }
36009c6f1ddSLingrui98
36109c6f1ddSLingrui98  val old_entry_always_taken = WireInit(oe)
36209c6f1ddSLingrui98  val always_taken_modified_vec = Wire(Vec(numBr, Bool())) // whether modified or not
36309c6f1ddSLingrui98  for (i <- 0 until numBr) {
36409c6f1ddSLingrui98    old_entry_always_taken.always_taken(i) :=
36509c6f1ddSLingrui98      oe.always_taken(i) && io.cfiIndex.valid && oe.brValids(i) && io.cfiIndex.bits === oe.brOffset(i)
366710a8720SLingrui98    always_taken_modified_vec(i) := oe.always_taken(i) && !old_entry_always_taken.always_taken(i)
36709c6f1ddSLingrui98  }
36809c6f1ddSLingrui98  val always_taken_modified = always_taken_modified_vec.reduce(_||_)
36909c6f1ddSLingrui98
37009c6f1ddSLingrui98
37109c6f1ddSLingrui98
37209c6f1ddSLingrui98  val derived_from_old_entry =
37309c6f1ddSLingrui98    Mux(is_new_br, old_entry_modified,
3743bcae573SLingrui98      Mux(jalr_target_modified, old_entry_jmp_target_modified, old_entry_always_taken))
37509c6f1ddSLingrui98
37609c6f1ddSLingrui98
37709c6f1ddSLingrui98  io.new_entry := Mux(!hit, init_entry, derived_from_old_entry)
37809c6f1ddSLingrui98
37909c6f1ddSLingrui98  io.new_br_insert_pos := new_br_insert_onehot
38009c6f1ddSLingrui98  io.taken_mask := VecInit((io.new_entry.brOffset zip io.new_entry.brValids).map{
38109c6f1ddSLingrui98    case (off, v) => io.cfiIndex.bits === off && io.cfiIndex.valid && v
38209c6f1ddSLingrui98  })
383803124a6SLingrui98  io.jmp_taken := io.new_entry.jmpValid && io.new_entry.tailSlot.offset === io.cfiIndex.bits
38409c6f1ddSLingrui98  for (i <- 0 until numBr) {
38509c6f1ddSLingrui98    io.mispred_mask(i) := io.new_entry.brValids(i) && io.mispredict_vec(io.new_entry.brOffset(i))
38609c6f1ddSLingrui98  }
38709c6f1ddSLingrui98  io.mispred_mask.last := io.new_entry.jmpValid && io.mispredict_vec(pd.jmpOffset)
38809c6f1ddSLingrui98
38909c6f1ddSLingrui98  // for perf counters
39009c6f1ddSLingrui98  io.is_init_entry := !hit
3913bcae573SLingrui98  io.is_old_entry := hit && !is_new_br && !jalr_target_modified && !always_taken_modified
39209c6f1ddSLingrui98  io.is_new_br := hit && is_new_br
3933bcae573SLingrui98  io.is_jalr_target_modified := hit && jalr_target_modified
39409c6f1ddSLingrui98  io.is_always_taken_modified := hit && always_taken_modified
395eeb5ff92SLingrui98  io.is_br_full := hit && is_new_br && may_have_to_replace
39609c6f1ddSLingrui98}
39709c6f1ddSLingrui98
398c5c5edaeSJeniusclass FtqPcMemWrapper(numOtherReads: Int)(implicit p: Parameters) extends XSModule with HasBackendRedirectInfo {
399c5c5edaeSJenius  val io = IO(new Bundle {
400c5c5edaeSJenius    val ifuPtr_w       = Input(new FtqPtr)
401c5c5edaeSJenius    val ifuPtrPlus1_w  = Input(new FtqPtr)
4026bf9b30dSLingrui98    val ifuPtrPlus2_w  = Input(new FtqPtr)
403c5c5edaeSJenius    val commPtr_w      = Input(new FtqPtr)
4046bf9b30dSLingrui98    val commPtrPlus1_w = Input(new FtqPtr)
405c5c5edaeSJenius    val ifuPtr_rdata       = Output(new Ftq_RF_Components)
406c5c5edaeSJenius    val ifuPtrPlus1_rdata  = Output(new Ftq_RF_Components)
4076bf9b30dSLingrui98    val ifuPtrPlus2_rdata  = Output(new Ftq_RF_Components)
408c5c5edaeSJenius    val commPtr_rdata      = Output(new Ftq_RF_Components)
4096bf9b30dSLingrui98    val commPtrPlus1_rdata = Output(new Ftq_RF_Components)
410c5c5edaeSJenius
411c5c5edaeSJenius    val other_raddrs = Input(Vec(numOtherReads, UInt(log2Ceil(FtqSize).W)))
412c5c5edaeSJenius    val other_rdatas = Output(Vec(numOtherReads, new Ftq_RF_Components))
413c5c5edaeSJenius
414c5c5edaeSJenius    val wen = Input(Bool())
415c5c5edaeSJenius    val waddr = Input(UInt(log2Ceil(FtqSize).W))
416c5c5edaeSJenius    val wdata = Input(new Ftq_RF_Components)
417c5c5edaeSJenius  })
418c5c5edaeSJenius
4196bf9b30dSLingrui98  val num_pc_read = numOtherReads + 5
420c5c5edaeSJenius  val mem = Module(new SyncDataModuleTemplate(new Ftq_RF_Components, FtqSize,
42128f2cf58SLingrui98    num_pc_read, 1, "FtqPC"))
422c5c5edaeSJenius  mem.io.wen(0)   := io.wen
423c5c5edaeSJenius  mem.io.waddr(0) := io.waddr
424c5c5edaeSJenius  mem.io.wdata(0) := io.wdata
425c5c5edaeSJenius
4266bf9b30dSLingrui98  // read one cycle ahead for ftq local reads
427c5c5edaeSJenius  val raddr_vec = VecInit(io.other_raddrs ++
42888bc4f90SLingrui98    Seq(io.ifuPtr_w.value, io.ifuPtrPlus1_w.value, io.ifuPtrPlus2_w.value, io.commPtrPlus1_w.value, io.commPtr_w.value))
429c5c5edaeSJenius
430c5c5edaeSJenius  mem.io.raddr := raddr_vec
431c5c5edaeSJenius
4326bf9b30dSLingrui98  io.other_rdatas       := mem.io.rdata.dropRight(5)
4336bf9b30dSLingrui98  io.ifuPtr_rdata       := mem.io.rdata.dropRight(4).last
4346bf9b30dSLingrui98  io.ifuPtrPlus1_rdata  := mem.io.rdata.dropRight(3).last
4356bf9b30dSLingrui98  io.ifuPtrPlus2_rdata  := mem.io.rdata.dropRight(2).last
4366bf9b30dSLingrui98  io.commPtrPlus1_rdata := mem.io.rdata.dropRight(1).last
437c5c5edaeSJenius  io.commPtr_rdata      := mem.io.rdata.last
438c5c5edaeSJenius}
439c5c5edaeSJenius
44009c6f1ddSLingrui98class Ftq(implicit p: Parameters) extends XSModule with HasCircularQueuePtrHelper
441e30430c2SJay  with HasBackendRedirectInfo with BPUUtils with HasBPUConst with HasPerfEvents
442e30430c2SJay  with HasICacheParameters{
44309c6f1ddSLingrui98  val io = IO(new Bundle {
44409c6f1ddSLingrui98    val fromBpu = Flipped(new BpuToFtqIO)
44509c6f1ddSLingrui98    val fromIfu = Flipped(new IfuToFtqIO)
44609c6f1ddSLingrui98    val fromBackend = Flipped(new CtrlToFtqIO)
44709c6f1ddSLingrui98
44809c6f1ddSLingrui98    val toBpu = new FtqToBpuIO
44909c6f1ddSLingrui98    val toIfu = new FtqToIfuIO
450c5c5edaeSJenius    val toICache = new FtqToICacheIO
45109c6f1ddSLingrui98    val toBackend = new FtqToCtrlIO
45209c6f1ddSLingrui98
4537052722fSJay    val toPrefetch = new FtqPrefechBundle
4547052722fSJay
45509c6f1ddSLingrui98    val bpuInfo = new Bundle {
45609c6f1ddSLingrui98      val bpRight = Output(UInt(XLEN.W))
45709c6f1ddSLingrui98      val bpWrong = Output(UInt(XLEN.W))
45809c6f1ddSLingrui98    }
4591d1e6d4dSJenius
4601d1e6d4dSJenius    val mmioCommitRead = Flipped(new mmioCommitRead)
46109c6f1ddSLingrui98  })
46209c6f1ddSLingrui98  io.bpuInfo := DontCare
46309c6f1ddSLingrui98
4642e1be6e1SSteve Gou  val backendRedirect = Wire(Valid(new Redirect))
4652e1be6e1SSteve Gou  val backendRedirectReg = RegNext(backendRedirect)
46609c6f1ddSLingrui98
467df5b4b8eSYinan Xu  val stage2Flush = backendRedirect.valid
46809c6f1ddSLingrui98  val backendFlush = stage2Flush || RegNext(stage2Flush)
46909c6f1ddSLingrui98  val ifuFlush = Wire(Bool())
47009c6f1ddSLingrui98
47109c6f1ddSLingrui98  val flush = stage2Flush || RegNext(stage2Flush)
47209c6f1ddSLingrui98
47309c6f1ddSLingrui98  val allowBpuIn, allowToIfu = WireInit(false.B)
47409c6f1ddSLingrui98  val flushToIfu = !allowToIfu
475df5b4b8eSYinan Xu  allowBpuIn := !ifuFlush && !backendRedirect.valid && !backendRedirectReg.valid
476df5b4b8eSYinan Xu  allowToIfu := !ifuFlush && !backendRedirect.valid && !backendRedirectReg.valid
47709c6f1ddSLingrui98
478f56177cbSJenius  def copyNum = 5
479e30430c2SJay  val bpuPtr, ifuPtr, ifuWbPtr, commPtr = RegInit(FtqPtr(false.B, 0.U))
480c9bc5480SLingrui98  val ifuPtrPlus1 = RegInit(FtqPtr(false.B, 1.U))
4816bf9b30dSLingrui98  val ifuPtrPlus2 = RegInit(FtqPtr(false.B, 2.U))
4826bf9b30dSLingrui98  val commPtrPlus1 = RegInit(FtqPtr(false.B, 1.U))
483f56177cbSJenius  val copied_ifu_ptr = Seq.fill(copyNum)(RegInit(FtqPtr(false.B, 0.U)))
484dc270d3bSJenius  val copied_bpu_ptr = Seq.fill(copyNum)(RegInit(FtqPtr(false.B, 0.U)))
4856bf9b30dSLingrui98  require(FtqSize >= 4)
486c5c5edaeSJenius  val ifuPtr_write       = WireInit(ifuPtr)
487c5c5edaeSJenius  val ifuPtrPlus1_write  = WireInit(ifuPtrPlus1)
4886bf9b30dSLingrui98  val ifuPtrPlus2_write  = WireInit(ifuPtrPlus2)
489c5c5edaeSJenius  val ifuWbPtr_write     = WireInit(ifuWbPtr)
490c5c5edaeSJenius  val commPtr_write      = WireInit(commPtr)
4916bf9b30dSLingrui98  val commPtrPlus1_write = WireInit(commPtrPlus1)
492c5c5edaeSJenius  ifuPtr       := ifuPtr_write
493c5c5edaeSJenius  ifuPtrPlus1  := ifuPtrPlus1_write
4946bf9b30dSLingrui98  ifuPtrPlus2  := ifuPtrPlus2_write
495c5c5edaeSJenius  ifuWbPtr     := ifuWbPtr_write
496c5c5edaeSJenius  commPtr      := commPtr_write
497f83ef67eSLingrui98  commPtrPlus1 := commPtrPlus1_write
498f56177cbSJenius  copied_ifu_ptr.map{ptr =>
499f56177cbSJenius    ptr := ifuPtr_write
500f56177cbSJenius    dontTouch(ptr)
501f56177cbSJenius  }
50209c6f1ddSLingrui98  val validEntries = distanceBetween(bpuPtr, commPtr)
50309c6f1ddSLingrui98
50409c6f1ddSLingrui98  // **********************************************************************
50509c6f1ddSLingrui98  // **************************** enq from bpu ****************************
50609c6f1ddSLingrui98  // **********************************************************************
50709c6f1ddSLingrui98  val new_entry_ready = validEntries < FtqSize.U
50809c6f1ddSLingrui98  io.fromBpu.resp.ready := new_entry_ready
50909c6f1ddSLingrui98
51009c6f1ddSLingrui98  val bpu_s2_resp = io.fromBpu.resp.bits.s2
511cb4f77ceSLingrui98  val bpu_s3_resp = io.fromBpu.resp.bits.s3
51209c6f1ddSLingrui98  val bpu_s2_redirect = bpu_s2_resp.valid && bpu_s2_resp.hasRedirect
513cb4f77ceSLingrui98  val bpu_s3_redirect = bpu_s3_resp.valid && bpu_s3_resp.hasRedirect
51409c6f1ddSLingrui98
51509c6f1ddSLingrui98  io.toBpu.enq_ptr := bpuPtr
51609c6f1ddSLingrui98  val enq_fire = io.fromBpu.resp.fire() && allowBpuIn // from bpu s1
517cb4f77ceSLingrui98  val bpu_in_fire = (io.fromBpu.resp.fire() || bpu_s2_redirect || bpu_s3_redirect) && allowBpuIn
51809c6f1ddSLingrui98
519b37e4b45SLingrui98  val bpu_in_resp = io.fromBpu.resp.bits.selectedResp
520b37e4b45SLingrui98  val bpu_in_stage = io.fromBpu.resp.bits.selectedRespIdx
52109c6f1ddSLingrui98  val bpu_in_resp_ptr = Mux(bpu_in_stage === BP_S1, bpuPtr, bpu_in_resp.ftq_idx)
52209c6f1ddSLingrui98  val bpu_in_resp_idx = bpu_in_resp_ptr.value
52309c6f1ddSLingrui98
524378f00d9SJenius  // read ports:      prefetchReq ++  ifuReq1 + ifuReq2 + ifuReq3 + commitUpdate2 + commitUpdate
525378f00d9SJenius  val ftq_pc_mem = Module(new FtqPcMemWrapper(1))
5266bf9b30dSLingrui98  // resp from uBTB
527c5c5edaeSJenius  ftq_pc_mem.io.wen := bpu_in_fire
528c5c5edaeSJenius  ftq_pc_mem.io.waddr := bpu_in_resp_idx
529c5c5edaeSJenius  ftq_pc_mem.io.wdata.fromBranchPrediction(bpu_in_resp)
53009c6f1ddSLingrui98
53109c6f1ddSLingrui98  //                                                            ifuRedirect + backendRedirect + commit
53209c6f1ddSLingrui98  val ftq_redirect_sram = Module(new FtqNRSRAM(new Ftq_Redirect_SRAMEntry, 1+1+1))
53309c6f1ddSLingrui98  // these info is intended to enq at the last stage of bpu
53409c6f1ddSLingrui98  ftq_redirect_sram.io.wen := io.fromBpu.resp.bits.lastStage.valid
53509c6f1ddSLingrui98  ftq_redirect_sram.io.waddr := io.fromBpu.resp.bits.lastStage.ftq_idx.value
536c2d1ec7dSLingrui98  ftq_redirect_sram.io.wdata := io.fromBpu.resp.bits.last_stage_spec_info
53749cbc998SLingrui98  println(f"ftq redirect SRAM: entry ${ftq_redirect_sram.io.wdata.getWidth} * ${FtqSize} * 3")
53849cbc998SLingrui98  println(f"ftq redirect SRAM: ahead fh ${ftq_redirect_sram.io.wdata.afhob.getWidth} * ${FtqSize} * 3")
53909c6f1ddSLingrui98
54009c6f1ddSLingrui98  val ftq_meta_1r_sram = Module(new FtqNRSRAM(new Ftq_1R_SRAMEntry, 1))
54109c6f1ddSLingrui98  // these info is intended to enq at the last stage of bpu
54209c6f1ddSLingrui98  ftq_meta_1r_sram.io.wen := io.fromBpu.resp.bits.lastStage.valid
54309c6f1ddSLingrui98  ftq_meta_1r_sram.io.waddr := io.fromBpu.resp.bits.lastStage.ftq_idx.value
544c2d1ec7dSLingrui98  ftq_meta_1r_sram.io.wdata.meta := io.fromBpu.resp.bits.last_stage_meta
54509c6f1ddSLingrui98  //                                                            ifuRedirect + backendRedirect + commit
54609c6f1ddSLingrui98  val ftb_entry_mem = Module(new SyncDataModuleTemplate(new FTBEntry, FtqSize, 1+1+1, 1))
54709c6f1ddSLingrui98  ftb_entry_mem.io.wen(0) := io.fromBpu.resp.bits.lastStage.valid
54809c6f1ddSLingrui98  ftb_entry_mem.io.waddr(0) := io.fromBpu.resp.bits.lastStage.ftq_idx.value
549c2d1ec7dSLingrui98  ftb_entry_mem.io.wdata(0) := io.fromBpu.resp.bits.last_stage_ftb_entry
55009c6f1ddSLingrui98
55109c6f1ddSLingrui98
55209c6f1ddSLingrui98  // multi-write
553b0ed7239SLingrui98  val update_target = Reg(Vec(FtqSize, UInt(VAddrBits.W))) // could be taken target or fallThrough //TODO: remove this
5546bf9b30dSLingrui98  val newest_entry_target = Reg(UInt(VAddrBits.W))
5556bf9b30dSLingrui98  val newest_entry_ptr = Reg(new FtqPtr)
55609c6f1ddSLingrui98  val cfiIndex_vec = Reg(Vec(FtqSize, ValidUndirectioned(UInt(log2Ceil(PredictWidth).W))))
55709c6f1ddSLingrui98  val mispredict_vec = Reg(Vec(FtqSize, Vec(PredictWidth, Bool())))
55809c6f1ddSLingrui98  val pred_stage = Reg(Vec(FtqSize, UInt(2.W)))
55909c6f1ddSLingrui98
560b5808fc2Ssfencevma  val c_invalid :: c_valid :: c_commited :: Nil = Enum(3)
56109c6f1ddSLingrui98  val commitStateQueue = RegInit(VecInit(Seq.fill(FtqSize) {
56209c6f1ddSLingrui98    VecInit(Seq.fill(PredictWidth)(c_invalid))
56309c6f1ddSLingrui98  }))
56409c6f1ddSLingrui98
56509c6f1ddSLingrui98  val f_to_send :: f_sent :: Nil = Enum(2)
56609c6f1ddSLingrui98  val entry_fetch_status = RegInit(VecInit(Seq.fill(FtqSize)(f_sent)))
56709c6f1ddSLingrui98
56809c6f1ddSLingrui98  val h_not_hit :: h_false_hit :: h_hit :: Nil = Enum(3)
56909c6f1ddSLingrui98  val entry_hit_status = RegInit(VecInit(Seq.fill(FtqSize)(h_not_hit)))
57009c6f1ddSLingrui98
571f63797a4SLingrui98  // modify registers one cycle later to cut critical path
572f63797a4SLingrui98  val last_cycle_bpu_in = RegNext(bpu_in_fire)
5736bf9b30dSLingrui98  val last_cycle_bpu_in_ptr = RegNext(bpu_in_resp_ptr)
5746bf9b30dSLingrui98  val last_cycle_bpu_in_idx = last_cycle_bpu_in_ptr.value
5756bf9b30dSLingrui98  val last_cycle_bpu_target = RegNext(bpu_in_resp.getTarget)
576f63797a4SLingrui98  val last_cycle_cfiIndex = RegNext(bpu_in_resp.cfiIndex)
577f63797a4SLingrui98  val last_cycle_bpu_in_stage = RegNext(bpu_in_stage)
578f56177cbSJenius
5797be982afSLingrui98  def extra_copyNum_for_commitStateQueue = 2
5807be982afSLingrui98  val copied_last_cycle_bpu_in = VecInit(Seq.fill(copyNum+extra_copyNum_for_commitStateQueue)(RegNext(bpu_in_fire)))
5817be982afSLingrui98  val copied_last_cycle_bpu_in_ptr_for_ftq = VecInit(Seq.fill(extra_copyNum_for_commitStateQueue)(RegNext(bpu_in_resp_ptr)))
582f56177cbSJenius
583f63797a4SLingrui98  when (last_cycle_bpu_in) {
584f63797a4SLingrui98    entry_fetch_status(last_cycle_bpu_in_idx) := f_to_send
585f63797a4SLingrui98    cfiIndex_vec(last_cycle_bpu_in_idx) := last_cycle_cfiIndex
586f63797a4SLingrui98    pred_stage(last_cycle_bpu_in_idx) := last_cycle_bpu_in_stage
5876bf9b30dSLingrui98
588b0ed7239SLingrui98    update_target(last_cycle_bpu_in_idx) := last_cycle_bpu_target // TODO: remove this
5896bf9b30dSLingrui98    newest_entry_target := last_cycle_bpu_target
5906bf9b30dSLingrui98    newest_entry_ptr := last_cycle_bpu_in_ptr
59109c6f1ddSLingrui98  }
59209c6f1ddSLingrui98
5937be982afSLingrui98  // reduce fanout by delay write for a cycle
5947be982afSLingrui98  when (RegNext(last_cycle_bpu_in)) {
5957be982afSLingrui98    mispredict_vec(RegNext(last_cycle_bpu_in_idx)) := WireInit(VecInit(Seq.fill(PredictWidth)(false.B)))
5967be982afSLingrui98  }
5977be982afSLingrui98
5987be982afSLingrui98  // reduce fanout using copied last_cycle_bpu_in and copied last_cycle_bpu_in_ptr
5997be982afSLingrui98  val copied_last_cycle_bpu_in_for_ftq = copied_last_cycle_bpu_in.takeRight(extra_copyNum_for_commitStateQueue)
6007be982afSLingrui98  copied_last_cycle_bpu_in_for_ftq.zip(copied_last_cycle_bpu_in_ptr_for_ftq).zipWithIndex.map {
6017be982afSLingrui98    case ((in, ptr), i) =>
6027be982afSLingrui98      when (in) {
6037be982afSLingrui98        val perSetEntries = FtqSize / extra_copyNum_for_commitStateQueue // 32
6047be982afSLingrui98        require(FtqSize % extra_copyNum_for_commitStateQueue == 0)
6057be982afSLingrui98        for (j <- 0 until perSetEntries) {
6069361b0c5SLingrui98          when (ptr.value === (i*perSetEntries+j).U) {
6077be982afSLingrui98            commitStateQueue(i*perSetEntries+j) := VecInit(Seq.fill(PredictWidth)(c_invalid))
6087be982afSLingrui98          }
6097be982afSLingrui98        }
6107be982afSLingrui98      }
6119361b0c5SLingrui98  }
6127be982afSLingrui98
613873dc383SLingrui98  // num cycle is fixed
614873dc383SLingrui98  io.toBackend.newest_entry_ptr := RegNext(newest_entry_ptr)
615873dc383SLingrui98  io.toBackend.newest_entry_target := RegNext(newest_entry_target)
616873dc383SLingrui98
617f63797a4SLingrui98
61809c6f1ddSLingrui98  bpuPtr := bpuPtr + enq_fire
619dc270d3bSJenius  copied_bpu_ptr.map(_ := bpuPtr + enq_fire)
620c9bc5480SLingrui98  when (io.toIfu.req.fire && allowToIfu) {
621c5c5edaeSJenius    ifuPtr_write := ifuPtrPlus1
6226bf9b30dSLingrui98    ifuPtrPlus1_write := ifuPtrPlus2
6236bf9b30dSLingrui98    ifuPtrPlus2_write := ifuPtrPlus2 + 1.U
624c9bc5480SLingrui98  }
62509c6f1ddSLingrui98
62609c6f1ddSLingrui98  // only use ftb result to assign hit status
62709c6f1ddSLingrui98  when (bpu_s2_resp.valid) {
628b37e4b45SLingrui98    entry_hit_status(bpu_s2_resp.ftq_idx.value) := Mux(bpu_s2_resp.full_pred.hit, h_hit, h_not_hit)
62909c6f1ddSLingrui98  }
63009c6f1ddSLingrui98
63109c6f1ddSLingrui98
6322f4a3aa4SLingrui98  io.toIfu.flushFromBpu.s2.valid := bpu_s2_redirect
63309c6f1ddSLingrui98  io.toIfu.flushFromBpu.s2.bits := bpu_s2_resp.ftq_idx
63409c6f1ddSLingrui98  when (bpu_s2_resp.valid && bpu_s2_resp.hasRedirect) {
63509c6f1ddSLingrui98    bpuPtr := bpu_s2_resp.ftq_idx + 1.U
636dc270d3bSJenius    copied_bpu_ptr.map(_ := bpu_s2_resp.ftq_idx + 1.U)
63709c6f1ddSLingrui98    // only when ifuPtr runs ahead of bpu s2 resp should we recover it
63809c6f1ddSLingrui98    when (!isBefore(ifuPtr, bpu_s2_resp.ftq_idx)) {
639c5c5edaeSJenius      ifuPtr_write := bpu_s2_resp.ftq_idx
640c5c5edaeSJenius      ifuPtrPlus1_write := bpu_s2_resp.ftq_idx + 1.U
6416bf9b30dSLingrui98      ifuPtrPlus2_write := bpu_s2_resp.ftq_idx + 2.U
64209c6f1ddSLingrui98    }
64309c6f1ddSLingrui98  }
64409c6f1ddSLingrui98
645cb4f77ceSLingrui98  io.toIfu.flushFromBpu.s3.valid := bpu_s3_redirect
646cb4f77ceSLingrui98  io.toIfu.flushFromBpu.s3.bits := bpu_s3_resp.ftq_idx
647cb4f77ceSLingrui98  when (bpu_s3_resp.valid && bpu_s3_resp.hasRedirect) {
648cb4f77ceSLingrui98    bpuPtr := bpu_s3_resp.ftq_idx + 1.U
649dc270d3bSJenius    copied_bpu_ptr.map(_ := bpu_s3_resp.ftq_idx + 1.U)
650cb4f77ceSLingrui98    // only when ifuPtr runs ahead of bpu s2 resp should we recover it
651cb4f77ceSLingrui98    when (!isBefore(ifuPtr, bpu_s3_resp.ftq_idx)) {
652c5c5edaeSJenius      ifuPtr_write := bpu_s3_resp.ftq_idx
653c5c5edaeSJenius      ifuPtrPlus1_write := bpu_s3_resp.ftq_idx + 1.U
6546bf9b30dSLingrui98      ifuPtrPlus2_write := bpu_s3_resp.ftq_idx + 2.U
655cb4f77ceSLingrui98    }
656cb4f77ceSLingrui98  }
657cb4f77ceSLingrui98
65809c6f1ddSLingrui98  XSError(isBefore(bpuPtr, ifuPtr) && !isFull(bpuPtr, ifuPtr), "\nifuPtr is before bpuPtr!\n")
6592448f137SGuokai Chen  XSError(isBefore(ifuWbPtr, commPtr) && !isFull(ifuWbPtr, commPtr), "\ncommPtr is before ifuWbPtr!\n")
66009c6f1ddSLingrui98
661dc270d3bSJenius  (0 until copyNum).map{i =>
662dc270d3bSJenius    XSError(copied_bpu_ptr(i) =/= bpuPtr, "\ncopiedBpuPtr is different from bpuPtr!\n")
663dc270d3bSJenius  }
664dc270d3bSJenius
66509c6f1ddSLingrui98  // ****************************************************************
66609c6f1ddSLingrui98  // **************************** to ifu ****************************
66709c6f1ddSLingrui98  // ****************************************************************
668f22cf846SJenius  // 0  for ifu, and 1-4 for ICache
669f56177cbSJenius  val bpu_in_bypass_buf = RegEnable(ftq_pc_mem.io.wdata, enable=bpu_in_fire)
670f56177cbSJenius  val copied_bpu_in_bypass_buf = VecInit(Seq.fill(copyNum)(RegEnable(ftq_pc_mem.io.wdata, enable=bpu_in_fire)))
671f56177cbSJenius  val bpu_in_bypass_buf_for_ifu = bpu_in_bypass_buf
67209c6f1ddSLingrui98  val bpu_in_bypass_ptr = RegNext(bpu_in_resp_ptr)
67309c6f1ddSLingrui98  val last_cycle_to_ifu_fire = RegNext(io.toIfu.req.fire)
67409c6f1ddSLingrui98
675f56177cbSJenius  val copied_bpu_in_bypass_ptr = VecInit(Seq.fill(copyNum)(RegNext(bpu_in_resp_ptr)))
676f56177cbSJenius  val copied_last_cycle_to_ifu_fire = VecInit(Seq.fill(copyNum)(RegNext(io.toIfu.req.fire)))
67788bc4f90SLingrui98
67809c6f1ddSLingrui98  // read pc and target
6796bf9b30dSLingrui98  ftq_pc_mem.io.ifuPtr_w       := ifuPtr_write
6806bf9b30dSLingrui98  ftq_pc_mem.io.ifuPtrPlus1_w  := ifuPtrPlus1_write
6816bf9b30dSLingrui98  ftq_pc_mem.io.ifuPtrPlus2_w  := ifuPtrPlus2_write
6826bf9b30dSLingrui98  ftq_pc_mem.io.commPtr_w      := commPtr_write
6836bf9b30dSLingrui98  ftq_pc_mem.io.commPtrPlus1_w := commPtrPlus1_write
684c5c5edaeSJenius
68509c6f1ddSLingrui98
6865ff19bd8SLingrui98  io.toIfu.req.bits.ftqIdx := ifuPtr
687f63797a4SLingrui98
688f56177cbSJenius  val toICachePcBundle = Wire(Vec(copyNum,new Ftq_RF_Components))
689dc270d3bSJenius  val toICacheEntryToSend = Wire(Vec(copyNum,Bool()))
690b37e4b45SLingrui98  val toIfuPcBundle = Wire(new Ftq_RF_Components)
691f63797a4SLingrui98  val entry_is_to_send = WireInit(entry_fetch_status(ifuPtr.value) === f_to_send)
692f63797a4SLingrui98  val entry_ftq_offset = WireInit(cfiIndex_vec(ifuPtr.value))
6936bf9b30dSLingrui98  val entry_next_addr  = Wire(UInt(VAddrBits.W))
694b004fa13SJenius
695f56177cbSJenius  val pc_mem_ifu_ptr_rdata   = VecInit(Seq.fill(copyNum)(RegNext(ftq_pc_mem.io.ifuPtr_rdata)))
696f56177cbSJenius  val pc_mem_ifu_plus1_rdata = VecInit(Seq.fill(copyNum)(RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata)))
697b0ed7239SLingrui98  val diff_entry_next_addr = WireInit(update_target(ifuPtr.value)) //TODO: remove this
698f63797a4SLingrui98
699dc270d3bSJenius  val copied_ifu_plus1_to_send = VecInit(Seq.fill(copyNum)(RegNext(entry_fetch_status(ifuPtrPlus1.value) === f_to_send) || RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1))))
700dc270d3bSJenius  val copied_ifu_ptr_to_send   = VecInit(Seq.fill(copyNum)(RegNext(entry_fetch_status(ifuPtr.value) === f_to_send) || RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr)))
701dc270d3bSJenius
702f56177cbSJenius  for(i <- 0 until copyNum){
703f56177cbSJenius    when(copied_last_cycle_bpu_in(i) && copied_bpu_in_bypass_ptr(i) === copied_ifu_ptr(i)){
704f56177cbSJenius      toICachePcBundle(i) := copied_bpu_in_bypass_buf(i)
705dc270d3bSJenius      toICacheEntryToSend(i)   := true.B
706f56177cbSJenius    }.elsewhen(copied_last_cycle_to_ifu_fire(i)){
707f56177cbSJenius      toICachePcBundle(i) := pc_mem_ifu_plus1_rdata(i)
708dc270d3bSJenius      toICacheEntryToSend(i)   := copied_ifu_plus1_to_send(i)
709f56177cbSJenius    }.otherwise{
710f56177cbSJenius      toICachePcBundle(i) := pc_mem_ifu_ptr_rdata(i)
711dc270d3bSJenius      toICacheEntryToSend(i)   := copied_ifu_ptr_to_send(i)
712f56177cbSJenius    }
713f56177cbSJenius  }
714f56177cbSJenius
715873dc383SLingrui98  // TODO: reconsider target address bypass logic
71609c6f1ddSLingrui98  when (last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr) {
71788bc4f90SLingrui98    toIfuPcBundle := bpu_in_bypass_buf_for_ifu
718f678dd91SSteve Gou    entry_is_to_send := true.B
7196bf9b30dSLingrui98    entry_next_addr := last_cycle_bpu_target
720f63797a4SLingrui98    entry_ftq_offset := last_cycle_cfiIndex
721b0ed7239SLingrui98    diff_entry_next_addr := last_cycle_bpu_target // TODO: remove this
72209c6f1ddSLingrui98  }.elsewhen (last_cycle_to_ifu_fire) {
723c5c5edaeSJenius    toIfuPcBundle := RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata)
724c5c5edaeSJenius    entry_is_to_send := RegNext(entry_fetch_status(ifuPtrPlus1.value) === f_to_send) ||
725c5c5edaeSJenius                        RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1)) // reduce potential bubbles
726ed434d67SLingrui98    entry_next_addr := Mux(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1),
72788bc4f90SLingrui98                          bpu_in_bypass_buf_for_ifu.startAddr,
728fef810c0SLingrui98                          Mux(ifuPtr === newest_entry_ptr,
7296bf9b30dSLingrui98                            newest_entry_target,
730f83ef67eSLingrui98                            RegNext(ftq_pc_mem.io.ifuPtrPlus2_rdata.startAddr))) // ifuPtr+2
731c5c5edaeSJenius  }.otherwise {
732c5c5edaeSJenius    toIfuPcBundle := RegNext(ftq_pc_mem.io.ifuPtr_rdata)
73328f2cf58SLingrui98    entry_is_to_send := RegNext(entry_fetch_status(ifuPtr.value) === f_to_send) ||
73428f2cf58SLingrui98                        RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr) // reduce potential bubbles
7356bf9b30dSLingrui98    entry_next_addr := Mux(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1),
73688bc4f90SLingrui98                          bpu_in_bypass_buf_for_ifu.startAddr,
737fef810c0SLingrui98                          Mux(ifuPtr === newest_entry_ptr,
7386bf9b30dSLingrui98                            newest_entry_target,
739f83ef67eSLingrui98                            RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata.startAddr))) // ifuPtr+1
74009c6f1ddSLingrui98  }
74109c6f1ddSLingrui98
742f678dd91SSteve Gou  io.toIfu.req.valid := entry_is_to_send && ifuPtr =/= bpuPtr
743f63797a4SLingrui98  io.toIfu.req.bits.nextStartAddr := entry_next_addr
744f63797a4SLingrui98  io.toIfu.req.bits.ftqOffset := entry_ftq_offset
745b37e4b45SLingrui98  io.toIfu.req.bits.fromFtqPcBundle(toIfuPcBundle)
746c5c5edaeSJenius
747c5c5edaeSJenius  io.toICache.req.valid := entry_is_to_send && ifuPtr =/= bpuPtr
748dc270d3bSJenius  io.toICache.req.bits.readValid.zipWithIndex.map{case(copy, i) => copy := toICacheEntryToSend(i) && copied_ifu_ptr(i) =/= copied_bpu_ptr(i)}
749b004fa13SJenius  io.toICache.req.bits.pcMemRead.zipWithIndex.map{case(copy,i) => copy.fromFtqPcBundle(toICachePcBundle(i))}
750b004fa13SJenius  // io.toICache.req.bits.bypassSelect := last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr
751b004fa13SJenius  // io.toICache.req.bits.bpuBypassWrite.zipWithIndex.map{case(bypassWrtie, i) =>
752b004fa13SJenius  //   bypassWrtie.startAddr := bpu_in_bypass_buf.tail(i).startAddr
753b004fa13SJenius  //   bypassWrtie.nextlineStart := bpu_in_bypass_buf.tail(i).nextLineAddr
754b004fa13SJenius  // }
755f22cf846SJenius
756b0ed7239SLingrui98  // TODO: remove this
757b0ed7239SLingrui98  XSError(io.toIfu.req.valid && diff_entry_next_addr =/= entry_next_addr,
7585a674179SLingrui98          p"\nifu_req_target wrong! ifuPtr: ${ifuPtr}, entry_next_addr: ${Hexadecimal(entry_next_addr)} diff_entry_next_addr: ${Hexadecimal(diff_entry_next_addr)}\n")
759b0ed7239SLingrui98
76009c6f1ddSLingrui98  // when fall through is smaller in value than start address, there must be a false hit
761b37e4b45SLingrui98  when (toIfuPcBundle.fallThruError && entry_hit_status(ifuPtr.value) === h_hit) {
76209c6f1ddSLingrui98    when (io.toIfu.req.fire &&
763cb4f77ceSLingrui98      !(bpu_s2_redirect && bpu_s2_resp.ftq_idx === ifuPtr) &&
764cb4f77ceSLingrui98      !(bpu_s3_redirect && bpu_s3_resp.ftq_idx === ifuPtr)
76509c6f1ddSLingrui98    ) {
76609c6f1ddSLingrui98      entry_hit_status(ifuPtr.value) := h_false_hit
767352db50aSLingrui98      // XSError(true.B, "FTB false hit by fallThroughError, startAddr: %x, fallTHru: %x\n", io.toIfu.req.bits.startAddr, io.toIfu.req.bits.nextStartAddr)
76809c6f1ddSLingrui98    }
769b37e4b45SLingrui98    XSDebug(true.B, "fallThruError! start:%x, fallThru:%x\n", io.toIfu.req.bits.startAddr, io.toIfu.req.bits.nextStartAddr)
77009c6f1ddSLingrui98  }
77109c6f1ddSLingrui98
772a60a2901SLingrui98  XSPerfAccumulate(f"fall_through_error_to_ifu", toIfuPcBundle.fallThruError && entry_hit_status(ifuPtr.value) === h_hit &&
773a60a2901SLingrui98    io.toIfu.req.fire && !(bpu_s2_redirect && bpu_s2_resp.ftq_idx === ifuPtr) && !(bpu_s3_redirect && bpu_s3_resp.ftq_idx === ifuPtr))
774a60a2901SLingrui98
77509c6f1ddSLingrui98  val ifu_req_should_be_flushed =
776cb4f77ceSLingrui98    io.toIfu.flushFromBpu.shouldFlushByStage2(io.toIfu.req.bits.ftqIdx) ||
777cb4f77ceSLingrui98    io.toIfu.flushFromBpu.shouldFlushByStage3(io.toIfu.req.bits.ftqIdx)
77809c6f1ddSLingrui98
77909c6f1ddSLingrui98    when (io.toIfu.req.fire && !ifu_req_should_be_flushed) {
78009c6f1ddSLingrui98      entry_fetch_status(ifuPtr.value) := f_sent
78109c6f1ddSLingrui98    }
78209c6f1ddSLingrui98
78309c6f1ddSLingrui98  // *********************************************************************
78409c6f1ddSLingrui98  // **************************** wb from ifu ****************************
78509c6f1ddSLingrui98  // *********************************************************************
78609c6f1ddSLingrui98  val pdWb = io.fromIfu.pdWb
78709c6f1ddSLingrui98  val pds = pdWb.bits.pd
78809c6f1ddSLingrui98  val ifu_wb_valid = pdWb.valid
78909c6f1ddSLingrui98  val ifu_wb_idx = pdWb.bits.ftqIdx.value
79009c6f1ddSLingrui98  // read ports:                                                         commit update
79109c6f1ddSLingrui98  val ftq_pd_mem = Module(new SyncDataModuleTemplate(new Ftq_pd_Entry, FtqSize, 1, 1))
79209c6f1ddSLingrui98  ftq_pd_mem.io.wen(0) := ifu_wb_valid
79309c6f1ddSLingrui98  ftq_pd_mem.io.waddr(0) := pdWb.bits.ftqIdx.value
79409c6f1ddSLingrui98  ftq_pd_mem.io.wdata(0).fromPdWb(pdWb.bits)
79509c6f1ddSLingrui98
79609c6f1ddSLingrui98  val hit_pd_valid = entry_hit_status(ifu_wb_idx) === h_hit && ifu_wb_valid
79709c6f1ddSLingrui98  val hit_pd_mispred = hit_pd_valid && pdWb.bits.misOffset.valid
79809c6f1ddSLingrui98  val hit_pd_mispred_reg = RegNext(hit_pd_mispred, init=false.B)
799005e809bSJiuyang Liu  val pd_reg       = RegEnable(pds,             pdWb.valid)
800005e809bSJiuyang Liu  val start_pc_reg = RegEnable(pdWb.bits.pc(0), pdWb.valid)
801005e809bSJiuyang Liu  val wb_idx_reg   = RegEnable(ifu_wb_idx,      pdWb.valid)
80209c6f1ddSLingrui98
80309c6f1ddSLingrui98  when (ifu_wb_valid) {
80409c6f1ddSLingrui98    val comm_stq_wen = VecInit(pds.map(_.valid).zip(pdWb.bits.instrRange).map{
80509c6f1ddSLingrui98      case (v, inRange) => v && inRange
80609c6f1ddSLingrui98    })
80709c6f1ddSLingrui98    (commitStateQueue(ifu_wb_idx) zip comm_stq_wen).map{
80809c6f1ddSLingrui98      case (qe, v) => when (v) { qe := c_valid }
80909c6f1ddSLingrui98    }
81009c6f1ddSLingrui98  }
81109c6f1ddSLingrui98
812c5c5edaeSJenius  when (ifu_wb_valid) {
813c5c5edaeSJenius    ifuWbPtr_write := ifuWbPtr + 1.U
814c5c5edaeSJenius  }
81509c6f1ddSLingrui98
816*f21bbcb2SGuokai Chen  XSError(ifu_wb_valid && isAfter(pdWb.bits.ftqIdx, ifuPtr), "IFU returned a predecode before its req, check IFU")
817*f21bbcb2SGuokai Chen
81809c6f1ddSLingrui98  ftb_entry_mem.io.raddr.head := ifu_wb_idx
81909c6f1ddSLingrui98  val has_false_hit = WireInit(false.B)
82009c6f1ddSLingrui98  when (RegNext(hit_pd_valid)) {
82109c6f1ddSLingrui98    // check for false hit
82209c6f1ddSLingrui98    val pred_ftb_entry = ftb_entry_mem.io.rdata.head
823eeb5ff92SLingrui98    val brSlots = pred_ftb_entry.brSlots
824eeb5ff92SLingrui98    val tailSlot = pred_ftb_entry.tailSlot
82509c6f1ddSLingrui98    // we check cfis that bpu predicted
82609c6f1ddSLingrui98
827eeb5ff92SLingrui98    // bpu predicted branches but denied by predecode
828eeb5ff92SLingrui98    val br_false_hit =
829eeb5ff92SLingrui98      brSlots.map{
830eeb5ff92SLingrui98        s => s.valid && !(pd_reg(s.offset).valid && pd_reg(s.offset).isBr)
831eeb5ff92SLingrui98      }.reduce(_||_) ||
832b37e4b45SLingrui98      (tailSlot.valid && pred_ftb_entry.tailSlot.sharing &&
833eeb5ff92SLingrui98        !(pd_reg(tailSlot.offset).valid && pd_reg(tailSlot.offset).isBr))
834eeb5ff92SLingrui98
835eeb5ff92SLingrui98    val jmpOffset = tailSlot.offset
83609c6f1ddSLingrui98    val jmp_pd = pd_reg(jmpOffset)
83709c6f1ddSLingrui98    val jal_false_hit = pred_ftb_entry.jmpValid &&
83809c6f1ddSLingrui98      ((pred_ftb_entry.isJal  && !(jmp_pd.valid && jmp_pd.isJal)) ||
83909c6f1ddSLingrui98       (pred_ftb_entry.isJalr && !(jmp_pd.valid && jmp_pd.isJalr)) ||
84009c6f1ddSLingrui98       (pred_ftb_entry.isCall && !(jmp_pd.valid && jmp_pd.isCall)) ||
84109c6f1ddSLingrui98       (pred_ftb_entry.isRet  && !(jmp_pd.valid && jmp_pd.isRet))
84209c6f1ddSLingrui98      )
84309c6f1ddSLingrui98
84409c6f1ddSLingrui98    has_false_hit := br_false_hit || jal_false_hit || hit_pd_mispred_reg
84565fddcf0Szoujr    XSDebug(has_false_hit, "FTB false hit by br or jal or hit_pd, startAddr: %x\n", pdWb.bits.pc(0))
84665fddcf0Szoujr
847352db50aSLingrui98    // assert(!has_false_hit)
84809c6f1ddSLingrui98  }
84909c6f1ddSLingrui98
85009c6f1ddSLingrui98  when (has_false_hit) {
85109c6f1ddSLingrui98    entry_hit_status(wb_idx_reg) := h_false_hit
85209c6f1ddSLingrui98  }
85309c6f1ddSLingrui98
85409c6f1ddSLingrui98
85509c6f1ddSLingrui98  // **********************************************************************
856b56f947eSYinan Xu  // ***************************** to backend *****************************
85709c6f1ddSLingrui98  // **********************************************************************
858b56f947eSYinan Xu  // to backend pc mem / target
859b56f947eSYinan Xu  io.toBackend.pc_mem_wen   := RegNext(last_cycle_bpu_in)
860b56f947eSYinan Xu  io.toBackend.pc_mem_waddr := RegNext(last_cycle_bpu_in_idx)
86188bc4f90SLingrui98  io.toBackend.pc_mem_wdata := RegNext(bpu_in_bypass_buf_for_ifu)
86209c6f1ddSLingrui98
86309c6f1ddSLingrui98  // *******************************************************************************
86409c6f1ddSLingrui98  // **************************** redirect from backend ****************************
86509c6f1ddSLingrui98  // *******************************************************************************
86609c6f1ddSLingrui98
86709c6f1ddSLingrui98  // redirect read cfiInfo, couples to redirectGen s2
8682e1be6e1SSteve Gou  ftq_redirect_sram.io.ren.init.last := backendRedirect.valid
8692e1be6e1SSteve Gou  ftq_redirect_sram.io.raddr.init.last := backendRedirect.bits.ftqIdx.value
87009c6f1ddSLingrui98
8712e1be6e1SSteve Gou  ftb_entry_mem.io.raddr.init.last := backendRedirect.bits.ftqIdx.value
87209c6f1ddSLingrui98
87309c6f1ddSLingrui98  val stage3CfiInfo = ftq_redirect_sram.io.rdata.init.last
874df5b4b8eSYinan Xu  val fromBackendRedirect = WireInit(backendRedirectReg)
87509c6f1ddSLingrui98  val backendRedirectCfi = fromBackendRedirect.bits.cfiUpdate
87609c6f1ddSLingrui98  backendRedirectCfi.fromFtqRedirectSram(stage3CfiInfo)
87709c6f1ddSLingrui98
87809c6f1ddSLingrui98  val r_ftb_entry = ftb_entry_mem.io.rdata.init.last
87909c6f1ddSLingrui98  val r_ftqOffset = fromBackendRedirect.bits.ftqOffset
88009c6f1ddSLingrui98
88109c6f1ddSLingrui98  when (entry_hit_status(fromBackendRedirect.bits.ftqIdx.value) === h_hit) {
88209c6f1ddSLingrui98    backendRedirectCfi.shift := PopCount(r_ftb_entry.getBrMaskByOffset(r_ftqOffset)) +&
88309c6f1ddSLingrui98      (backendRedirectCfi.pd.isBr && !r_ftb_entry.brIsSaved(r_ftqOffset) &&
884eeb5ff92SLingrui98      !r_ftb_entry.newBrCanNotInsert(r_ftqOffset))
88509c6f1ddSLingrui98
88609c6f1ddSLingrui98    backendRedirectCfi.addIntoHist := backendRedirectCfi.pd.isBr && (r_ftb_entry.brIsSaved(r_ftqOffset) ||
887eeb5ff92SLingrui98        !r_ftb_entry.newBrCanNotInsert(r_ftqOffset))
88809c6f1ddSLingrui98  }.otherwise {
88909c6f1ddSLingrui98    backendRedirectCfi.shift := (backendRedirectCfi.pd.isBr && backendRedirectCfi.taken).asUInt
89009c6f1ddSLingrui98    backendRedirectCfi.addIntoHist := backendRedirectCfi.pd.isBr.asUInt
89109c6f1ddSLingrui98  }
89209c6f1ddSLingrui98
89309c6f1ddSLingrui98
89409c6f1ddSLingrui98  // ***************************************************************************
89509c6f1ddSLingrui98  // **************************** redirect from ifu ****************************
89609c6f1ddSLingrui98  // ***************************************************************************
89709c6f1ddSLingrui98  val fromIfuRedirect = WireInit(0.U.asTypeOf(Valid(new Redirect)))
89809c6f1ddSLingrui98  fromIfuRedirect.valid := pdWb.valid && pdWb.bits.misOffset.valid && !backendFlush
89909c6f1ddSLingrui98  fromIfuRedirect.bits.ftqIdx := pdWb.bits.ftqIdx
90009c6f1ddSLingrui98  fromIfuRedirect.bits.ftqOffset := pdWb.bits.misOffset.bits
90109c6f1ddSLingrui98  fromIfuRedirect.bits.level := RedirectLevel.flushAfter
90209c6f1ddSLingrui98
90309c6f1ddSLingrui98  val ifuRedirectCfiUpdate = fromIfuRedirect.bits.cfiUpdate
90409c6f1ddSLingrui98  ifuRedirectCfiUpdate.pc := pdWb.bits.pc(pdWb.bits.misOffset.bits)
90509c6f1ddSLingrui98  ifuRedirectCfiUpdate.pd := pdWb.bits.pd(pdWb.bits.misOffset.bits)
90609c6f1ddSLingrui98  ifuRedirectCfiUpdate.predTaken := cfiIndex_vec(pdWb.bits.ftqIdx.value).valid
90709c6f1ddSLingrui98  ifuRedirectCfiUpdate.target := pdWb.bits.target
90809c6f1ddSLingrui98  ifuRedirectCfiUpdate.taken := pdWb.bits.cfiOffset.valid
90909c6f1ddSLingrui98  ifuRedirectCfiUpdate.isMisPred := pdWb.bits.misOffset.valid
91009c6f1ddSLingrui98
91109c6f1ddSLingrui98  val ifuRedirectReg = RegNext(fromIfuRedirect, init=0.U.asTypeOf(Valid(new Redirect)))
91209c6f1ddSLingrui98  val ifuRedirectToBpu = WireInit(ifuRedirectReg)
91309c6f1ddSLingrui98  ifuFlush := fromIfuRedirect.valid || ifuRedirectToBpu.valid
91409c6f1ddSLingrui98
91509c6f1ddSLingrui98  ftq_redirect_sram.io.ren.head := fromIfuRedirect.valid
91609c6f1ddSLingrui98  ftq_redirect_sram.io.raddr.head := fromIfuRedirect.bits.ftqIdx.value
91709c6f1ddSLingrui98
91809c6f1ddSLingrui98  ftb_entry_mem.io.raddr.head := fromIfuRedirect.bits.ftqIdx.value
91909c6f1ddSLingrui98
92009c6f1ddSLingrui98  val toBpuCfi = ifuRedirectToBpu.bits.cfiUpdate
92109c6f1ddSLingrui98  toBpuCfi.fromFtqRedirectSram(ftq_redirect_sram.io.rdata.head)
92209c6f1ddSLingrui98  when (ifuRedirectReg.bits.cfiUpdate.pd.isRet) {
92309c6f1ddSLingrui98    toBpuCfi.target := toBpuCfi.rasEntry.retAddr
92409c6f1ddSLingrui98  }
92509c6f1ddSLingrui98
92609c6f1ddSLingrui98  // *********************************************************************
92709c6f1ddSLingrui98  // **************************** wb from exu ****************************
92809c6f1ddSLingrui98  // *********************************************************************
92909c6f1ddSLingrui98
930b56f947eSYinan Xu  backendRedirect := io.fromBackend.redirect
9312e1be6e1SSteve Gou
93209c6f1ddSLingrui98  def extractRedirectInfo(wb: Valid[Redirect]) = {
9336bf9b30dSLingrui98    val ftqPtr = wb.bits.ftqIdx
93409c6f1ddSLingrui98    val ftqOffset = wb.bits.ftqOffset
93509c6f1ddSLingrui98    val taken = wb.bits.cfiUpdate.taken
93609c6f1ddSLingrui98    val mispred = wb.bits.cfiUpdate.isMisPred
9376bf9b30dSLingrui98    (wb.valid, ftqPtr, ftqOffset, taken, mispred)
93809c6f1ddSLingrui98  }
93909c6f1ddSLingrui98
94009c6f1ddSLingrui98  // fix mispredict entry
94109c6f1ddSLingrui98  val lastIsMispredict = RegNext(
942df5b4b8eSYinan Xu    backendRedirect.valid && backendRedirect.bits.level === RedirectLevel.flushAfter, init = false.B
94309c6f1ddSLingrui98  )
94409c6f1ddSLingrui98
94509c6f1ddSLingrui98  def updateCfiInfo(redirect: Valid[Redirect], isBackend: Boolean = true) = {
9466bf9b30dSLingrui98    val (r_valid, r_ptr, r_offset, r_taken, r_mispred) = extractRedirectInfo(redirect)
9476bf9b30dSLingrui98    val r_idx = r_ptr.value
94809c6f1ddSLingrui98    val cfiIndex_bits_wen = r_valid && r_taken && r_offset < cfiIndex_vec(r_idx).bits
94909c6f1ddSLingrui98    val cfiIndex_valid_wen = r_valid && r_offset === cfiIndex_vec(r_idx).bits
95009c6f1ddSLingrui98    when (cfiIndex_bits_wen || cfiIndex_valid_wen) {
95109c6f1ddSLingrui98      cfiIndex_vec(r_idx).valid := cfiIndex_bits_wen || cfiIndex_valid_wen && r_taken
9523f88c020SGuokai Chen    } .elsewhen (r_valid && !r_taken && r_offset =/= cfiIndex_vec(r_idx).bits) {
9533f88c020SGuokai Chen      cfiIndex_vec(r_idx).valid :=false.B
95409c6f1ddSLingrui98    }
95509c6f1ddSLingrui98    when (cfiIndex_bits_wen) {
95609c6f1ddSLingrui98      cfiIndex_vec(r_idx).bits := r_offset
95709c6f1ddSLingrui98    }
9586bf9b30dSLingrui98    newest_entry_target := redirect.bits.cfiUpdate.target
959873dc383SLingrui98    newest_entry_ptr := r_ptr
960b0ed7239SLingrui98    update_target(r_idx) := redirect.bits.cfiUpdate.target // TODO: remove this
96109c6f1ddSLingrui98    if (isBackend) {
96209c6f1ddSLingrui98      mispredict_vec(r_idx)(r_offset) := r_mispred
96309c6f1ddSLingrui98    }
96409c6f1ddSLingrui98  }
96509c6f1ddSLingrui98
96681e362d8SLingrui98  when(backendRedirectReg.valid) {
967df5b4b8eSYinan Xu    updateCfiInfo(backendRedirectReg)
96809c6f1ddSLingrui98  }.elsewhen (ifuRedirectToBpu.valid) {
96909c6f1ddSLingrui98    updateCfiInfo(ifuRedirectToBpu, isBackend=false)
97009c6f1ddSLingrui98  }
97109c6f1ddSLingrui98
97209c6f1ddSLingrui98  // ***********************************************************************************
97309c6f1ddSLingrui98  // **************************** flush ptr and state queue ****************************
97409c6f1ddSLingrui98  // ***********************************************************************************
97509c6f1ddSLingrui98
976df5b4b8eSYinan Xu  val redirectVec = VecInit(backendRedirect, fromIfuRedirect)
97709c6f1ddSLingrui98
97809c6f1ddSLingrui98  // when redirect, we should reset ptrs and status queues
97909c6f1ddSLingrui98  when(redirectVec.map(r => r.valid).reduce(_||_)){
9802f4a3aa4SLingrui98    val r = PriorityMux(redirectVec.map(r => (r.valid -> r.bits)))
98109c6f1ddSLingrui98    val notIfu = redirectVec.dropRight(1).map(r => r.valid).reduce(_||_)
9822f4a3aa4SLingrui98    val (idx, offset, flushItSelf) = (r.ftqIdx, r.ftqOffset, RedirectLevel.flushItself(r.level))
98309c6f1ddSLingrui98    val next = idx + 1.U
98409c6f1ddSLingrui98    bpuPtr := next
985dc270d3bSJenius    copied_bpu_ptr.map(_ := next)
986c5c5edaeSJenius    ifuPtr_write := next
987c5c5edaeSJenius    ifuWbPtr_write := next
988c5c5edaeSJenius    ifuPtrPlus1_write := idx + 2.U
9896bf9b30dSLingrui98    ifuPtrPlus2_write := idx + 3.U
9903f88c020SGuokai Chen
9913f88c020SGuokai Chen  }
9923f88c020SGuokai Chen  when(RegNext(redirectVec.map(r => r.valid).reduce(_||_))){
9933f88c020SGuokai Chen    val r = PriorityMux(redirectVec.map(r => (r.valid -> r.bits)))
9943f88c020SGuokai Chen    val notIfu = redirectVec.dropRight(1).map(r => r.valid).reduce(_||_)
9953f88c020SGuokai Chen    val (idx, offset, flushItSelf) = (r.ftqIdx, r.ftqOffset, RedirectLevel.flushItself(r.level))
9963f88c020SGuokai Chen    when (RegNext(notIfu)) {
9973f88c020SGuokai Chen      commitStateQueue(RegNext(idx.value)).zipWithIndex.foreach({ case (s, i) =>
9983f88c020SGuokai Chen        when(i.U > RegNext(offset) || i.U === RegNext(offset) && RegNext(flushItSelf)){
999b5808fc2Ssfencevma          s := c_invalid
100009c6f1ddSLingrui98        }
100109c6f1ddSLingrui98      })
100209c6f1ddSLingrui98    }
100309c6f1ddSLingrui98  }
100409c6f1ddSLingrui98
10053f88c020SGuokai Chen
100609c6f1ddSLingrui98  // only the valid bit is actually needed
1007df5b4b8eSYinan Xu  io.toIfu.redirect.bits    := backendRedirect.bits
100809c6f1ddSLingrui98  io.toIfu.redirect.valid   := stage2Flush
100909c6f1ddSLingrui98
101009c6f1ddSLingrui98  // commit
10119aca92b9SYinan Xu  for (c <- io.fromBackend.rob_commits) {
101209c6f1ddSLingrui98    when(c.valid) {
101309c6f1ddSLingrui98      commitStateQueue(c.bits.ftqIdx.value)(c.bits.ftqOffset) := c_commited
101488825c5cSYinan Xu      // TODO: remove this
101588825c5cSYinan Xu      // For instruction fusions, we also update the next instruction
1016c3abb8b6SYinan Xu      when (c.bits.commitType === 4.U) {
101788825c5cSYinan Xu        commitStateQueue(c.bits.ftqIdx.value)(c.bits.ftqOffset + 1.U) := c_commited
1018c3abb8b6SYinan Xu      }.elsewhen(c.bits.commitType === 5.U) {
101988825c5cSYinan Xu        commitStateQueue(c.bits.ftqIdx.value)(c.bits.ftqOffset + 2.U) := c_commited
1020c3abb8b6SYinan Xu      }.elsewhen(c.bits.commitType === 6.U) {
102188825c5cSYinan Xu        val index = (c.bits.ftqIdx + 1.U).value
102288825c5cSYinan Xu        commitStateQueue(index)(0) := c_commited
1023c3abb8b6SYinan Xu      }.elsewhen(c.bits.commitType === 7.U) {
102488825c5cSYinan Xu        val index = (c.bits.ftqIdx + 1.U).value
102588825c5cSYinan Xu        commitStateQueue(index)(1) := c_commited
102688825c5cSYinan Xu      }
102709c6f1ddSLingrui98    }
102809c6f1ddSLingrui98  }
102909c6f1ddSLingrui98
103009c6f1ddSLingrui98  // ****************************************************************
103109c6f1ddSLingrui98  // **************************** to bpu ****************************
103209c6f1ddSLingrui98  // ****************************************************************
103309c6f1ddSLingrui98
103451981c77SbugGenerator  io.toBpu.redirect := Mux(fromBackendRedirect.valid, fromBackendRedirect, ifuRedirectToBpu)
103509c6f1ddSLingrui98
1036*f21bbcb2SGuokai Chen  XSError(io.toBpu.redirect.valid && isBefore(io.toBpu.redirect.bits.ftqIdx, commPtr), "Ftq received a redirect after its commit, check backend or replay")
1037*f21bbcb2SGuokai Chen
103802f21c16SLingrui98  val may_have_stall_from_bpu = Wire(Bool())
103902f21c16SLingrui98  val bpu_ftb_update_stall = RegInit(0.U(2.W)) // 2-cycle stall, so we need 3 states
104002f21c16SLingrui98  may_have_stall_from_bpu := bpu_ftb_update_stall =/= 0.U
1041b5808fc2Ssfencevma  val canCommit = commPtr =/= ifuWbPtr && !may_have_stall_from_bpu &&
104209c6f1ddSLingrui98    Cat(commitStateQueue(commPtr.value).map(s => {
1043b5808fc2Ssfencevma      s === c_invalid || s === c_commited
1044b5808fc2Ssfencevma    })).andR()
104509c6f1ddSLingrui98
10461d1e6d4dSJenius  val mmioReadPtr = io.mmioCommitRead.mmioFtqPtr
10471d1e6d4dSJenius  val mmioLastCommit = isBefore(commPtr, mmioReadPtr) && (isAfter(ifuPtr,mmioReadPtr)  ||  mmioReadPtr ===   ifuPtr) &&
1048b5808fc2Ssfencevma                       Cat(commitStateQueue(mmioReadPtr.value).map(s => { s === c_invalid || s === c_commited})).andR()
10491d1e6d4dSJenius  io.mmioCommitRead.mmioLastCommit := RegNext(mmioLastCommit)
10501d1e6d4dSJenius
105109c6f1ddSLingrui98  // commit reads
1052c5c5edaeSJenius  val commit_pc_bundle = RegNext(ftq_pc_mem.io.commPtr_rdata)
105381101dc4SLingrui98  val commit_target =
105434cf890eSLingrui98    Mux(RegNext(commPtr === newest_entry_ptr),
105534cf890eSLingrui98      RegNext(newest_entry_target),
105681101dc4SLingrui98      RegNext(ftq_pc_mem.io.commPtrPlus1_rdata.startAddr))
105709c6f1ddSLingrui98  ftq_pd_mem.io.raddr.last := commPtr.value
105809c6f1ddSLingrui98  val commit_pd = ftq_pd_mem.io.rdata.last
105909c6f1ddSLingrui98  ftq_redirect_sram.io.ren.last := canCommit
106009c6f1ddSLingrui98  ftq_redirect_sram.io.raddr.last := commPtr.value
106109c6f1ddSLingrui98  val commit_spec_meta = ftq_redirect_sram.io.rdata.last
106209c6f1ddSLingrui98  ftq_meta_1r_sram.io.ren(0) := canCommit
106309c6f1ddSLingrui98  ftq_meta_1r_sram.io.raddr(0) := commPtr.value
106409c6f1ddSLingrui98  val commit_meta = ftq_meta_1r_sram.io.rdata(0)
106509c6f1ddSLingrui98  ftb_entry_mem.io.raddr.last := commPtr.value
106609c6f1ddSLingrui98  val commit_ftb_entry = ftb_entry_mem.io.rdata.last
106709c6f1ddSLingrui98
106809c6f1ddSLingrui98  // need one cycle to read mem and srams
106909c6f1ddSLingrui98  val do_commit_ptr = RegNext(commPtr)
10705371700eSzoujr  val do_commit = RegNext(canCommit, init=false.B)
10716bf9b30dSLingrui98  when (canCommit) {
10726bf9b30dSLingrui98    commPtr_write := commPtrPlus1
10736bf9b30dSLingrui98    commPtrPlus1_write := commPtrPlus1 + 1.U
10746bf9b30dSLingrui98  }
107509c6f1ddSLingrui98  val commit_state = RegNext(commitStateQueue(commPtr.value))
10765371700eSzoujr  val can_commit_cfi = WireInit(cfiIndex_vec(commPtr.value))
10773f88c020SGuokai Chen  //
10783f88c020SGuokai Chen  //when (commitStateQueue(commPtr.value)(can_commit_cfi.bits) =/= c_commited) {
10793f88c020SGuokai Chen  //  can_commit_cfi.valid := false.B
10803f88c020SGuokai Chen  //}
10815371700eSzoujr  val commit_cfi = RegNext(can_commit_cfi)
10823f88c020SGuokai Chen  val debug_cfi = RegNext(commitStateQueue(commPtr.value)(can_commit_cfi.bits) =/= c_commited && can_commit_cfi.valid)
108309c6f1ddSLingrui98
108409c6f1ddSLingrui98  val commit_mispredict = VecInit((RegNext(mispredict_vec(commPtr.value)) zip commit_state).map {
108509c6f1ddSLingrui98    case (mis, state) => mis && state === c_commited
108609c6f1ddSLingrui98  })
10875371700eSzoujr  val can_commit_hit = entry_hit_status(commPtr.value)
10885371700eSzoujr  val commit_hit = RegNext(can_commit_hit)
10895fa3df0dSLingrui98  val diff_commit_target = RegNext(update_target(commPtr.value)) // TODO: remove this
1090edc18578SLingrui98  val commit_stage = RegNext(pred_stage(commPtr.value))
109109c6f1ddSLingrui98  val commit_valid = commit_hit === h_hit || commit_cfi.valid // hit or taken
109209c6f1ddSLingrui98
10935371700eSzoujr  val to_bpu_hit = can_commit_hit === h_hit || can_commit_hit === h_false_hit
109402f21c16SLingrui98  switch (bpu_ftb_update_stall) {
109502f21c16SLingrui98    is (0.U) {
109602f21c16SLingrui98      when (can_commit_cfi.valid && !to_bpu_hit && canCommit) {
109702f21c16SLingrui98        bpu_ftb_update_stall := 2.U // 2-cycle stall
109802f21c16SLingrui98      }
109902f21c16SLingrui98    }
110002f21c16SLingrui98    is (2.U) {
110102f21c16SLingrui98      bpu_ftb_update_stall := 1.U
110202f21c16SLingrui98    }
110302f21c16SLingrui98    is (1.U) {
110402f21c16SLingrui98      bpu_ftb_update_stall := 0.U
110502f21c16SLingrui98    }
110602f21c16SLingrui98    is (3.U) {
110702f21c16SLingrui98      XSError(true.B, "bpu_ftb_update_stall should be 0, 1 or 2")
110802f21c16SLingrui98    }
110902f21c16SLingrui98  }
111009c6f1ddSLingrui98
1111b0ed7239SLingrui98  // TODO: remove this
1112b0ed7239SLingrui98  XSError(do_commit && diff_commit_target =/= commit_target, "\ncommit target should be the same as update target\n")
1113b0ed7239SLingrui98
111409c6f1ddSLingrui98  io.toBpu.update := DontCare
111509c6f1ddSLingrui98  io.toBpu.update.valid := commit_valid && do_commit
111609c6f1ddSLingrui98  val update = io.toBpu.update.bits
111709c6f1ddSLingrui98  update.false_hit   := commit_hit === h_false_hit
111809c6f1ddSLingrui98  update.pc          := commit_pc_bundle.startAddr
111909c6f1ddSLingrui98  update.meta        := commit_meta.meta
1120803124a6SLingrui98  update.cfi_idx     := commit_cfi
11218ffcd86aSLingrui98  update.full_target := commit_target
1122edc18578SLingrui98  update.from_stage  := commit_stage
1123c2d1ec7dSLingrui98  update.spec_info   := commit_spec_meta
11243f88c020SGuokai Chen  XSError(commit_valid && do_commit && debug_cfi, "\ncommit cfi can be non c_commited\n")
112509c6f1ddSLingrui98
112609c6f1ddSLingrui98  val commit_real_hit = commit_hit === h_hit
112709c6f1ddSLingrui98  val update_ftb_entry = update.ftb_entry
112809c6f1ddSLingrui98
112909c6f1ddSLingrui98  val ftbEntryGen = Module(new FTBEntryGen).io
113009c6f1ddSLingrui98  ftbEntryGen.start_addr     := commit_pc_bundle.startAddr
113109c6f1ddSLingrui98  ftbEntryGen.old_entry      := commit_ftb_entry
113209c6f1ddSLingrui98  ftbEntryGen.pd             := commit_pd
113309c6f1ddSLingrui98  ftbEntryGen.cfiIndex       := commit_cfi
113409c6f1ddSLingrui98  ftbEntryGen.target         := commit_target
113509c6f1ddSLingrui98  ftbEntryGen.hit            := commit_real_hit
113609c6f1ddSLingrui98  ftbEntryGen.mispredict_vec := commit_mispredict
113709c6f1ddSLingrui98
113809c6f1ddSLingrui98  update_ftb_entry         := ftbEntryGen.new_entry
113909c6f1ddSLingrui98  update.new_br_insert_pos := ftbEntryGen.new_br_insert_pos
114009c6f1ddSLingrui98  update.mispred_mask      := ftbEntryGen.mispred_mask
114109c6f1ddSLingrui98  update.old_entry         := ftbEntryGen.is_old_entry
1142edc18578SLingrui98  update.pred_hit          := commit_hit === h_hit || commit_hit === h_false_hit
1143803124a6SLingrui98  update.br_taken_mask     := ftbEntryGen.taken_mask
1144803124a6SLingrui98  update.jmp_taken         := ftbEntryGen.jmp_taken
1145b37e4b45SLingrui98
1146803124a6SLingrui98  // update.full_pred.fromFtbEntry(ftbEntryGen.new_entry, update.pc)
1147803124a6SLingrui98  // update.full_pred.jalr_target := commit_target
1148803124a6SLingrui98  // update.full_pred.hit := true.B
1149803124a6SLingrui98  // when (update.full_pred.is_jalr) {
1150803124a6SLingrui98  //   update.full_pred.targets.last := commit_target
1151803124a6SLingrui98  // }
115209c6f1ddSLingrui98
1153e30430c2SJay  // ****************************************************************
1154e30430c2SJay  // *********************** to prefetch ****************************
1155e30430c2SJay  // ****************************************************************
1156e30430c2SJay
11579c8f16f2SJenius  ftq_pc_mem.io.other_raddrs(0) := DontCare
1158e30430c2SJay  if(cacheParams.hasPrefetch){
1159e30430c2SJay    val prefetchPtr = RegInit(FtqPtr(false.B, 0.U))
1160378f00d9SJenius    val diff_prefetch_addr = WireInit(update_target(prefetchPtr.value)) //TODO: remove this
1161378f00d9SJenius
1162e30430c2SJay    prefetchPtr := prefetchPtr + io.toPrefetch.req.fire()
1163e30430c2SJay
1164378f00d9SJenius    ftq_pc_mem.io.other_raddrs(0) := prefetchPtr.value
1165378f00d9SJenius
1166e30430c2SJay    when (bpu_s2_resp.valid && bpu_s2_resp.hasRedirect && !isBefore(prefetchPtr, bpu_s2_resp.ftq_idx)) {
1167e30430c2SJay      prefetchPtr := bpu_s2_resp.ftq_idx
1168e30430c2SJay    }
1169e30430c2SJay
1170cb4f77ceSLingrui98    when (bpu_s3_resp.valid && bpu_s3_resp.hasRedirect && !isBefore(prefetchPtr, bpu_s3_resp.ftq_idx)) {
1171cb4f77ceSLingrui98      prefetchPtr := bpu_s3_resp.ftq_idx
1172a3c55791SJinYue      // XSError(true.B, "\ns3_redirect mechanism not implemented!\n")
1173cb4f77ceSLingrui98    }
1174de7689fcSJay
1175f63797a4SLingrui98
1176f63797a4SLingrui98    val prefetch_is_to_send = WireInit(entry_fetch_status(prefetchPtr.value) === f_to_send)
1177f56177cbSJenius    val prefetch_addr = Wire(UInt(VAddrBits.W))
1178f63797a4SLingrui98
1179f63797a4SLingrui98    when (last_cycle_bpu_in && bpu_in_bypass_ptr === prefetchPtr) {
1180f63797a4SLingrui98      prefetch_is_to_send := true.B
11816bf9b30dSLingrui98      prefetch_addr := last_cycle_bpu_target
1182378f00d9SJenius      diff_prefetch_addr := last_cycle_bpu_target // TODO: remove this
1183f56177cbSJenius    }.otherwise{
1184f56177cbSJenius      prefetch_addr := RegNext( ftq_pc_mem.io.other_rdatas(0).startAddr)
1185f63797a4SLingrui98    }
1186f63797a4SLingrui98    io.toPrefetch.req.valid := prefetchPtr =/= bpuPtr && prefetch_is_to_send
1187f63797a4SLingrui98    io.toPrefetch.req.bits.target := prefetch_addr
1188de7689fcSJay
1189de7689fcSJay    when(redirectVec.map(r => r.valid).reduce(_||_)){
1190de7689fcSJay      val r = PriorityMux(redirectVec.map(r => (r.valid -> r.bits)))
1191de7689fcSJay      val next = r.ftqIdx + 1.U
1192de7689fcSJay      prefetchPtr := next
1193de7689fcSJay    }
1194de7689fcSJay
1195378f00d9SJenius    // TODO: remove this
119610f8eea3SLingrui98    // XSError(io.toPrefetch.req.valid && diff_prefetch_addr =/= prefetch_addr,
119710f8eea3SLingrui98    //         f"\nprefetch_req_target wrong! prefetchPtr: ${prefetchPtr}, prefetch_addr: ${Hexadecimal(prefetch_addr)} diff_prefetch_addr: ${Hexadecimal(diff_prefetch_addr)}\n")
1198378f00d9SJenius
1199378f00d9SJenius
1200de7689fcSJay    XSError(isBefore(bpuPtr, prefetchPtr) && !isFull(bpuPtr, prefetchPtr), "\nprefetchPtr is before bpuPtr!\n")
1201e8747464SJenius    XSError(isBefore(prefetchPtr, ifuPtr) && !isFull(ifuPtr, prefetchPtr), "\nifuPtr is before prefetchPtr!\n")
1202de7689fcSJay  }
1203de7689fcSJay  else {
1204de7689fcSJay    io.toPrefetch.req <> DontCare
1205de7689fcSJay  }
1206de7689fcSJay
120709c6f1ddSLingrui98  // ******************************************************************************
120809c6f1ddSLingrui98  // **************************** commit perf counters ****************************
120909c6f1ddSLingrui98  // ******************************************************************************
121009c6f1ddSLingrui98
121109c6f1ddSLingrui98  val commit_inst_mask    = VecInit(commit_state.map(c => c === c_commited && do_commit)).asUInt
121209c6f1ddSLingrui98  val commit_mispred_mask = commit_mispredict.asUInt
121309c6f1ddSLingrui98  val commit_not_mispred_mask = ~commit_mispred_mask
121409c6f1ddSLingrui98
121509c6f1ddSLingrui98  val commit_br_mask = commit_pd.brMask.asUInt
121609c6f1ddSLingrui98  val commit_jmp_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.jmpInfo.valid.asTypeOf(UInt(1.W)))
121709c6f1ddSLingrui98  val commit_cfi_mask = (commit_br_mask | commit_jmp_mask)
121809c6f1ddSLingrui98
121909c6f1ddSLingrui98  val mbpInstrs = commit_inst_mask & commit_cfi_mask
122009c6f1ddSLingrui98
122109c6f1ddSLingrui98  val mbpRights = mbpInstrs & commit_not_mispred_mask
122209c6f1ddSLingrui98  val mbpWrongs = mbpInstrs & commit_mispred_mask
122309c6f1ddSLingrui98
122409c6f1ddSLingrui98  io.bpuInfo.bpRight := PopCount(mbpRights)
122509c6f1ddSLingrui98  io.bpuInfo.bpWrong := PopCount(mbpWrongs)
122609c6f1ddSLingrui98
1227da3bf434SMaxpicca-Li  val isWriteFTQTable = WireInit(Constantin.createRecord("isWriteFTQTable" + p(XSCoreParamsKey).HartId.toString))
122851532d8bSGuokai Chen  val ftqBranchTraceDB = ChiselDB.createTable("FTQTable" + p(XSCoreParamsKey).HartId.toString, new FtqDebugBundle)
122909c6f1ddSLingrui98  // Cfi Info
123009c6f1ddSLingrui98  for (i <- 0 until PredictWidth) {
123109c6f1ddSLingrui98    val pc = commit_pc_bundle.startAddr + (i * instBytes).U
123209c6f1ddSLingrui98    val v = commit_state(i) === c_commited
123309c6f1ddSLingrui98    val isBr = commit_pd.brMask(i)
123409c6f1ddSLingrui98    val isJmp = commit_pd.jmpInfo.valid && commit_pd.jmpOffset === i.U
123509c6f1ddSLingrui98    val isCfi = isBr || isJmp
123609c6f1ddSLingrui98    val isTaken = commit_cfi.valid && commit_cfi.bits === i.U
123709c6f1ddSLingrui98    val misPred = commit_mispredict(i)
1238c2ad24ebSLingrui98    // val ghist = commit_spec_meta.ghist.predHist
1239c2ad24ebSLingrui98    val histPtr = commit_spec_meta.histPtr
124009c6f1ddSLingrui98    val predCycle = commit_meta.meta(63, 0)
124109c6f1ddSLingrui98    val target = commit_target
124209c6f1ddSLingrui98
124309c6f1ddSLingrui98    val brIdx = OHToUInt(Reverse(Cat(update_ftb_entry.brValids.zip(update_ftb_entry.brOffset).map{case(v, offset) => v && offset === i.U})))
124409c6f1ddSLingrui98    val inFtbEntry = update_ftb_entry.brValids.zip(update_ftb_entry.brOffset).map{case(v, offset) => v && offset === i.U}.reduce(_||_)
124509c6f1ddSLingrui98    val addIntoHist = ((commit_hit === h_hit) && inFtbEntry) || ((!(commit_hit === h_hit) && i.U === commit_cfi.bits && isBr && commit_cfi.valid))
124609c6f1ddSLingrui98    XSDebug(v && do_commit && isCfi, p"cfi_update: isBr(${isBr}) pc(${Hexadecimal(pc)}) " +
1247c2ad24ebSLingrui98    p"taken(${isTaken}) mispred(${misPred}) cycle($predCycle) hist(${histPtr.value}) " +
124809c6f1ddSLingrui98    p"startAddr(${Hexadecimal(commit_pc_bundle.startAddr)}) AddIntoHist(${addIntoHist}) " +
124909c6f1ddSLingrui98    p"brInEntry(${inFtbEntry}) brIdx(${brIdx}) target(${Hexadecimal(target)})\n")
125051532d8bSGuokai Chen
125151532d8bSGuokai Chen    val logbundle = Wire(new FtqDebugBundle)
125251532d8bSGuokai Chen    logbundle.pc := pc
125351532d8bSGuokai Chen    logbundle.target := target
125451532d8bSGuokai Chen    logbundle.isBr := isBr
125551532d8bSGuokai Chen    logbundle.isJmp := isJmp
125651532d8bSGuokai Chen    logbundle.isCall := isJmp && commit_pd.hasCall
125751532d8bSGuokai Chen    logbundle.isRet := isJmp && commit_pd.hasRet
125851532d8bSGuokai Chen    logbundle.misPred := misPred
125951532d8bSGuokai Chen    logbundle.isTaken := isTaken
126051532d8bSGuokai Chen    logbundle.predStage := commit_stage
126151532d8bSGuokai Chen
126251532d8bSGuokai Chen    ftqBranchTraceDB.log(
126351532d8bSGuokai Chen      data = logbundle /* hardware of type T */,
1264da3bf434SMaxpicca-Li      en = isWriteFTQTable.orR && v && do_commit && isCfi,
126551532d8bSGuokai Chen      site = "FTQ" + p(XSCoreParamsKey).HartId.toString,
126651532d8bSGuokai Chen      clock = clock,
126751532d8bSGuokai Chen      reset = reset
126851532d8bSGuokai Chen    )
126909c6f1ddSLingrui98  }
127009c6f1ddSLingrui98
127109c6f1ddSLingrui98  val enq = io.fromBpu.resp
12722e1be6e1SSteve Gou  val perf_redirect = backendRedirect
127309c6f1ddSLingrui98
127409c6f1ddSLingrui98  XSPerfAccumulate("entry", validEntries)
127509c6f1ddSLingrui98  XSPerfAccumulate("bpu_to_ftq_stall", enq.valid && !enq.ready)
127609c6f1ddSLingrui98  XSPerfAccumulate("mispredictRedirect", perf_redirect.valid && RedirectLevel.flushAfter === perf_redirect.bits.level)
127709c6f1ddSLingrui98  XSPerfAccumulate("replayRedirect", perf_redirect.valid && RedirectLevel.flushItself(perf_redirect.bits.level))
127809c6f1ddSLingrui98  XSPerfAccumulate("predecodeRedirect", fromIfuRedirect.valid)
127909c6f1ddSLingrui98
128009c6f1ddSLingrui98  XSPerfAccumulate("to_ifu_bubble", io.toIfu.req.ready && !io.toIfu.req.valid)
128109c6f1ddSLingrui98
128209c6f1ddSLingrui98  XSPerfAccumulate("to_ifu_stall", io.toIfu.req.valid && !io.toIfu.req.ready)
128309c6f1ddSLingrui98  XSPerfAccumulate("from_bpu_real_bubble", !enq.valid && enq.ready && allowBpuIn)
128412cedb6fSLingrui98  XSPerfAccumulate("bpu_to_ifu_bubble", bpuPtr === ifuPtr)
128509c6f1ddSLingrui98
128609c6f1ddSLingrui98  val from_bpu = io.fromBpu.resp.bits
1287c2d1ec7dSLingrui98  def in_entry_len_map_gen(resp: BpuToFtqBundle)(stage: String) = {
1288c2d1ec7dSLingrui98    val entry_len = (resp.last_stage_ftb_entry.getFallThrough(resp.s3.pc) - resp.s3.pc) >> instOffsetBits
128909c6f1ddSLingrui98    val entry_len_recording_vec = (1 to PredictWidth+1).map(i => entry_len === i.U)
129009c6f1ddSLingrui98    val entry_len_map = (1 to PredictWidth+1).map(i =>
1291c2d1ec7dSLingrui98      f"${stage}_ftb_entry_len_$i" -> (entry_len_recording_vec(i-1) && resp.s3.valid)
129209c6f1ddSLingrui98    ).foldLeft(Map[String, UInt]())(_+_)
129309c6f1ddSLingrui98    entry_len_map
129409c6f1ddSLingrui98  }
1295c2d1ec7dSLingrui98  val s3_entry_len_map = in_entry_len_map_gen(from_bpu)("s3")
129609c6f1ddSLingrui98
129709c6f1ddSLingrui98  val to_ifu = io.toIfu.req.bits
129809c6f1ddSLingrui98
129909c6f1ddSLingrui98
130009c6f1ddSLingrui98
130109c6f1ddSLingrui98  val commit_num_inst_recording_vec = (1 to PredictWidth).map(i => PopCount(commit_inst_mask) === i.U)
130209c6f1ddSLingrui98  val commit_num_inst_map = (1 to PredictWidth).map(i =>
130309c6f1ddSLingrui98    f"commit_num_inst_$i" -> (commit_num_inst_recording_vec(i-1) && do_commit)
130409c6f1ddSLingrui98  ).foldLeft(Map[String, UInt]())(_+_)
130509c6f1ddSLingrui98
130609c6f1ddSLingrui98
130709c6f1ddSLingrui98
130809c6f1ddSLingrui98  val commit_jal_mask  = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasJal.asTypeOf(UInt(1.W)))
130909c6f1ddSLingrui98  val commit_jalr_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasJalr.asTypeOf(UInt(1.W)))
131009c6f1ddSLingrui98  val commit_call_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasCall.asTypeOf(UInt(1.W)))
131109c6f1ddSLingrui98  val commit_ret_mask  = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasRet.asTypeOf(UInt(1.W)))
131209c6f1ddSLingrui98
131309c6f1ddSLingrui98
131409c6f1ddSLingrui98  val mbpBRights = mbpRights & commit_br_mask
131509c6f1ddSLingrui98  val mbpJRights = mbpRights & commit_jal_mask
131609c6f1ddSLingrui98  val mbpIRights = mbpRights & commit_jalr_mask
131709c6f1ddSLingrui98  val mbpCRights = mbpRights & commit_call_mask
131809c6f1ddSLingrui98  val mbpRRights = mbpRights & commit_ret_mask
131909c6f1ddSLingrui98
132009c6f1ddSLingrui98  val mbpBWrongs = mbpWrongs & commit_br_mask
132109c6f1ddSLingrui98  val mbpJWrongs = mbpWrongs & commit_jal_mask
132209c6f1ddSLingrui98  val mbpIWrongs = mbpWrongs & commit_jalr_mask
132309c6f1ddSLingrui98  val mbpCWrongs = mbpWrongs & commit_call_mask
132409c6f1ddSLingrui98  val mbpRWrongs = mbpWrongs & commit_ret_mask
132509c6f1ddSLingrui98
13261d7e5011SLingrui98  val commit_pred_stage = RegNext(pred_stage(commPtr.value))
13271d7e5011SLingrui98
13281d7e5011SLingrui98  def pred_stage_map(src: UInt, name: String) = {
13291d7e5011SLingrui98    (0 until numBpStages).map(i =>
13301d7e5011SLingrui98      f"${name}_stage_${i+1}" -> PopCount(src.asBools.map(_ && commit_pred_stage === BP_STAGES(i)))
13311d7e5011SLingrui98    ).foldLeft(Map[String, UInt]())(_+_)
13321d7e5011SLingrui98  }
13331d7e5011SLingrui98
13341d7e5011SLingrui98  val mispred_stage_map      = pred_stage_map(mbpWrongs,  "mispredict")
13351d7e5011SLingrui98  val br_mispred_stage_map   = pred_stage_map(mbpBWrongs, "br_mispredict")
13361d7e5011SLingrui98  val jalr_mispred_stage_map = pred_stage_map(mbpIWrongs, "jalr_mispredict")
13371d7e5011SLingrui98  val correct_stage_map      = pred_stage_map(mbpRights,  "correct")
13381d7e5011SLingrui98  val br_correct_stage_map   = pred_stage_map(mbpBRights, "br_correct")
13391d7e5011SLingrui98  val jalr_correct_stage_map = pred_stage_map(mbpIRights, "jalr_correct")
13401d7e5011SLingrui98
134109c6f1ddSLingrui98  val update_valid = io.toBpu.update.valid
134209c6f1ddSLingrui98  def u(cond: Bool) = update_valid && cond
134309c6f1ddSLingrui98  val ftb_false_hit = u(update.false_hit)
134465fddcf0Szoujr  // assert(!ftb_false_hit)
134509c6f1ddSLingrui98  val ftb_hit = u(commit_hit === h_hit)
134609c6f1ddSLingrui98
134709c6f1ddSLingrui98  val ftb_new_entry = u(ftbEntryGen.is_init_entry)
1348b37e4b45SLingrui98  val ftb_new_entry_only_br = ftb_new_entry && !update_ftb_entry.jmpValid
1349b37e4b45SLingrui98  val ftb_new_entry_only_jmp = ftb_new_entry && !update_ftb_entry.brValids(0)
1350b37e4b45SLingrui98  val ftb_new_entry_has_br_and_jmp = ftb_new_entry && update_ftb_entry.brValids(0) && update_ftb_entry.jmpValid
135109c6f1ddSLingrui98
135209c6f1ddSLingrui98  val ftb_old_entry = u(ftbEntryGen.is_old_entry)
135309c6f1ddSLingrui98
135409c6f1ddSLingrui98  val ftb_modified_entry = u(ftbEntryGen.is_new_br || ftbEntryGen.is_jalr_target_modified || ftbEntryGen.is_always_taken_modified)
135509c6f1ddSLingrui98  val ftb_modified_entry_new_br = u(ftbEntryGen.is_new_br)
135609c6f1ddSLingrui98  val ftb_modified_entry_jalr_target_modified = u(ftbEntryGen.is_jalr_target_modified)
135709c6f1ddSLingrui98  val ftb_modified_entry_br_full = ftb_modified_entry && ftbEntryGen.is_br_full
135809c6f1ddSLingrui98  val ftb_modified_entry_always_taken = ftb_modified_entry && ftbEntryGen.is_always_taken_modified
135909c6f1ddSLingrui98
136009c6f1ddSLingrui98  val ftb_entry_len = (ftbEntryGen.new_entry.getFallThrough(update.pc) - update.pc) >> instOffsetBits
136109c6f1ddSLingrui98  val ftb_entry_len_recording_vec = (1 to PredictWidth+1).map(i => ftb_entry_len === i.U)
136209c6f1ddSLingrui98  val ftb_init_entry_len_map = (1 to PredictWidth+1).map(i =>
136309c6f1ddSLingrui98    f"ftb_init_entry_len_$i" -> (ftb_entry_len_recording_vec(i-1) && ftb_new_entry)
136409c6f1ddSLingrui98  ).foldLeft(Map[String, UInt]())(_+_)
136509c6f1ddSLingrui98  val ftb_modified_entry_len_map = (1 to PredictWidth+1).map(i =>
136609c6f1ddSLingrui98    f"ftb_modified_entry_len_$i" -> (ftb_entry_len_recording_vec(i-1) && ftb_modified_entry)
136709c6f1ddSLingrui98  ).foldLeft(Map[String, UInt]())(_+_)
136809c6f1ddSLingrui98
136909c6f1ddSLingrui98  val ftq_occupancy_map = (0 to FtqSize).map(i =>
137009c6f1ddSLingrui98    f"ftq_has_entry_$i" ->( validEntries === i.U)
137109c6f1ddSLingrui98  ).foldLeft(Map[String, UInt]())(_+_)
137209c6f1ddSLingrui98
137309c6f1ddSLingrui98  val perfCountsMap = Map(
137409c6f1ddSLingrui98    "BpInstr" -> PopCount(mbpInstrs),
137509c6f1ddSLingrui98    "BpBInstr" -> PopCount(mbpBRights | mbpBWrongs),
137609c6f1ddSLingrui98    "BpRight"  -> PopCount(mbpRights),
137709c6f1ddSLingrui98    "BpWrong"  -> PopCount(mbpWrongs),
137809c6f1ddSLingrui98    "BpBRight" -> PopCount(mbpBRights),
137909c6f1ddSLingrui98    "BpBWrong" -> PopCount(mbpBWrongs),
138009c6f1ddSLingrui98    "BpJRight" -> PopCount(mbpJRights),
138109c6f1ddSLingrui98    "BpJWrong" -> PopCount(mbpJWrongs),
138209c6f1ddSLingrui98    "BpIRight" -> PopCount(mbpIRights),
138309c6f1ddSLingrui98    "BpIWrong" -> PopCount(mbpIWrongs),
138409c6f1ddSLingrui98    "BpCRight" -> PopCount(mbpCRights),
138509c6f1ddSLingrui98    "BpCWrong" -> PopCount(mbpCWrongs),
138609c6f1ddSLingrui98    "BpRRight" -> PopCount(mbpRRights),
138709c6f1ddSLingrui98    "BpRWrong" -> PopCount(mbpRWrongs),
138809c6f1ddSLingrui98
138909c6f1ddSLingrui98    "ftb_false_hit"                -> PopCount(ftb_false_hit),
139009c6f1ddSLingrui98    "ftb_hit"                      -> PopCount(ftb_hit),
139109c6f1ddSLingrui98    "ftb_new_entry"                -> PopCount(ftb_new_entry),
139209c6f1ddSLingrui98    "ftb_new_entry_only_br"        -> PopCount(ftb_new_entry_only_br),
139309c6f1ddSLingrui98    "ftb_new_entry_only_jmp"       -> PopCount(ftb_new_entry_only_jmp),
139409c6f1ddSLingrui98    "ftb_new_entry_has_br_and_jmp" -> PopCount(ftb_new_entry_has_br_and_jmp),
139509c6f1ddSLingrui98    "ftb_old_entry"                -> PopCount(ftb_old_entry),
139609c6f1ddSLingrui98    "ftb_modified_entry"           -> PopCount(ftb_modified_entry),
139709c6f1ddSLingrui98    "ftb_modified_entry_new_br"    -> PopCount(ftb_modified_entry_new_br),
139809c6f1ddSLingrui98    "ftb_jalr_target_modified"     -> PopCount(ftb_modified_entry_jalr_target_modified),
139909c6f1ddSLingrui98    "ftb_modified_entry_br_full"   -> PopCount(ftb_modified_entry_br_full),
140009c6f1ddSLingrui98    "ftb_modified_entry_always_taken" -> PopCount(ftb_modified_entry_always_taken)
1401c2d1ec7dSLingrui98  ) ++ ftb_init_entry_len_map ++ ftb_modified_entry_len_map ++
1402cb4f77ceSLingrui98  s3_entry_len_map ++ commit_num_inst_map ++ ftq_occupancy_map ++
14031d7e5011SLingrui98  mispred_stage_map ++ br_mispred_stage_map ++ jalr_mispred_stage_map ++
14041d7e5011SLingrui98  correct_stage_map ++ br_correct_stage_map ++ jalr_correct_stage_map
140509c6f1ddSLingrui98
140609c6f1ddSLingrui98  for((key, value) <- perfCountsMap) {
140709c6f1ddSLingrui98    XSPerfAccumulate(key, value)
140809c6f1ddSLingrui98  }
140909c6f1ddSLingrui98
141009c6f1ddSLingrui98  // --------------------------- Debug --------------------------------
141109c6f1ddSLingrui98  // XSDebug(enq_fire, p"enq! " + io.fromBpu.resp.bits.toPrintable)
141209c6f1ddSLingrui98  XSDebug(io.toIfu.req.fire, p"fire to ifu " + io.toIfu.req.bits.toPrintable)
141309c6f1ddSLingrui98  XSDebug(do_commit, p"deq! [ptr] $do_commit_ptr\n")
141409c6f1ddSLingrui98  XSDebug(true.B, p"[bpuPtr] $bpuPtr, [ifuPtr] $ifuPtr, [ifuWbPtr] $ifuWbPtr [commPtr] $commPtr\n")
141509c6f1ddSLingrui98  XSDebug(true.B, p"[in] v:${io.fromBpu.resp.valid} r:${io.fromBpu.resp.ready} " +
141609c6f1ddSLingrui98    p"[out] v:${io.toIfu.req.valid} r:${io.toIfu.req.ready}\n")
141709c6f1ddSLingrui98  XSDebug(do_commit, p"[deq info] cfiIndex: $commit_cfi, $commit_pc_bundle, target: ${Hexadecimal(commit_target)}\n")
141809c6f1ddSLingrui98
141909c6f1ddSLingrui98  //   def ubtbCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
142009c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
142109c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
142209c6f1ddSLingrui98  //       Mux(valid && pd.isBr,
142309c6f1ddSLingrui98  //         isWrong ^ Mux(ans.hit.asBool,
142409c6f1ddSLingrui98  //           Mux(ans.taken.asBool, taken && ans.target === commitEntry.target,
142509c6f1ddSLingrui98  //           !taken),
142609c6f1ddSLingrui98  //         !taken),
142709c6f1ddSLingrui98  //       false.B)
142809c6f1ddSLingrui98  //     }
142909c6f1ddSLingrui98  //   }
143009c6f1ddSLingrui98
143109c6f1ddSLingrui98  //   def btbCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
143209c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
143309c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
143409c6f1ddSLingrui98  //       Mux(valid && pd.isBr,
143509c6f1ddSLingrui98  //         isWrong ^ Mux(ans.hit.asBool,
143609c6f1ddSLingrui98  //           Mux(ans.taken.asBool, taken && ans.target === commitEntry.target,
143709c6f1ddSLingrui98  //           !taken),
143809c6f1ddSLingrui98  //         !taken),
143909c6f1ddSLingrui98  //       false.B)
144009c6f1ddSLingrui98  //     }
144109c6f1ddSLingrui98  //   }
144209c6f1ddSLingrui98
144309c6f1ddSLingrui98  //   def tageCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
144409c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
144509c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
144609c6f1ddSLingrui98  //       Mux(valid && pd.isBr,
144709c6f1ddSLingrui98  //         isWrong ^ (ans.taken.asBool === taken),
144809c6f1ddSLingrui98  //       false.B)
144909c6f1ddSLingrui98  //     }
145009c6f1ddSLingrui98  //   }
145109c6f1ddSLingrui98
145209c6f1ddSLingrui98  //   def loopCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
145309c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
145409c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
145509c6f1ddSLingrui98  //       Mux(valid && (pd.isBr) && ans.hit.asBool,
145609c6f1ddSLingrui98  //         isWrong ^ (!taken),
145709c6f1ddSLingrui98  //           false.B)
145809c6f1ddSLingrui98  //     }
145909c6f1ddSLingrui98  //   }
146009c6f1ddSLingrui98
146109c6f1ddSLingrui98  //   def rasCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
146209c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
146309c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
146409c6f1ddSLingrui98  //       Mux(valid && pd.isRet.asBool /*&& taken*/ && ans.hit.asBool,
146509c6f1ddSLingrui98  //         isWrong ^ (ans.target === commitEntry.target),
146609c6f1ddSLingrui98  //           false.B)
146709c6f1ddSLingrui98  //     }
146809c6f1ddSLingrui98  //   }
146909c6f1ddSLingrui98
147009c6f1ddSLingrui98  //   val ubtbRights = ubtbCheck(commitEntry, commitEntry.metas.map(_.ubtbAns), false.B)
147109c6f1ddSLingrui98  //   val ubtbWrongs = ubtbCheck(commitEntry, commitEntry.metas.map(_.ubtbAns), true.B)
147209c6f1ddSLingrui98  //   // btb and ubtb pred jal and jalr as well
147309c6f1ddSLingrui98  //   val btbRights = btbCheck(commitEntry, commitEntry.metas.map(_.btbAns), false.B)
147409c6f1ddSLingrui98  //   val btbWrongs = btbCheck(commitEntry, commitEntry.metas.map(_.btbAns), true.B)
147509c6f1ddSLingrui98  //   val tageRights = tageCheck(commitEntry, commitEntry.metas.map(_.tageAns), false.B)
147609c6f1ddSLingrui98  //   val tageWrongs = tageCheck(commitEntry, commitEntry.metas.map(_.tageAns), true.B)
147709c6f1ddSLingrui98
147809c6f1ddSLingrui98  //   val loopRights = loopCheck(commitEntry, commitEntry.metas.map(_.loopAns), false.B)
147909c6f1ddSLingrui98  //   val loopWrongs = loopCheck(commitEntry, commitEntry.metas.map(_.loopAns), true.B)
148009c6f1ddSLingrui98
148109c6f1ddSLingrui98  //   val rasRights = rasCheck(commitEntry, commitEntry.metas.map(_.rasAns), false.B)
148209c6f1ddSLingrui98  //   val rasWrongs = rasCheck(commitEntry, commitEntry.metas.map(_.rasAns), true.B)
14831ca0e4f3SYinan Xu
1484cd365d4cSrvcoresjw  val perfEvents = Seq(
1485cd365d4cSrvcoresjw    ("bpu_s2_redirect        ", bpu_s2_redirect                                                             ),
1486cb4f77ceSLingrui98    ("bpu_s3_redirect        ", bpu_s3_redirect                                                             ),
1487cd365d4cSrvcoresjw    ("bpu_to_ftq_stall       ", enq.valid && ~enq.ready                                                     ),
1488cd365d4cSrvcoresjw    ("mispredictRedirect     ", perf_redirect.valid && RedirectLevel.flushAfter === perf_redirect.bits.level),
1489cd365d4cSrvcoresjw    ("replayRedirect         ", perf_redirect.valid && RedirectLevel.flushItself(perf_redirect.bits.level)  ),
1490cd365d4cSrvcoresjw    ("predecodeRedirect      ", fromIfuRedirect.valid                                                       ),
1491cd365d4cSrvcoresjw    ("to_ifu_bubble          ", io.toIfu.req.ready && !io.toIfu.req.valid                                   ),
1492cd365d4cSrvcoresjw    ("from_bpu_real_bubble   ", !enq.valid && enq.ready && allowBpuIn                                       ),
1493cd365d4cSrvcoresjw    ("BpInstr                ", PopCount(mbpInstrs)                                                         ),
1494cd365d4cSrvcoresjw    ("BpBInstr               ", PopCount(mbpBRights | mbpBWrongs)                                           ),
1495cd365d4cSrvcoresjw    ("BpRight                ", PopCount(mbpRights)                                                         ),
1496cd365d4cSrvcoresjw    ("BpWrong                ", PopCount(mbpWrongs)                                                         ),
1497cd365d4cSrvcoresjw    ("BpBRight               ", PopCount(mbpBRights)                                                        ),
1498cd365d4cSrvcoresjw    ("BpBWrong               ", PopCount(mbpBWrongs)                                                        ),
1499cd365d4cSrvcoresjw    ("BpJRight               ", PopCount(mbpJRights)                                                        ),
1500cd365d4cSrvcoresjw    ("BpJWrong               ", PopCount(mbpJWrongs)                                                        ),
1501cd365d4cSrvcoresjw    ("BpIRight               ", PopCount(mbpIRights)                                                        ),
1502cd365d4cSrvcoresjw    ("BpIWrong               ", PopCount(mbpIWrongs)                                                        ),
1503cd365d4cSrvcoresjw    ("BpCRight               ", PopCount(mbpCRights)                                                        ),
1504cd365d4cSrvcoresjw    ("BpCWrong               ", PopCount(mbpCWrongs)                                                        ),
1505cd365d4cSrvcoresjw    ("BpRRight               ", PopCount(mbpRRights)                                                        ),
1506cd365d4cSrvcoresjw    ("BpRWrong               ", PopCount(mbpRWrongs)                                                        ),
1507cd365d4cSrvcoresjw    ("ftb_false_hit          ", PopCount(ftb_false_hit)                                                     ),
1508cd365d4cSrvcoresjw    ("ftb_hit                ", PopCount(ftb_hit)                                                           ),
1509cd365d4cSrvcoresjw  )
15101ca0e4f3SYinan Xu  generatePerfEvent()
151109c6f1ddSLingrui98}