xref: /XiangShan/src/main/scala/xiangshan/frontend/NewFtq.scala (revision da3bf434d2eaa53cd07e3992eb63aefb88a6f0da)
109c6f1ddSLingrui98/***************************************************************************************
209c6f1ddSLingrui98* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
309c6f1ddSLingrui98* Copyright (c) 2020-2021 Peng Cheng Laboratory
409c6f1ddSLingrui98*
509c6f1ddSLingrui98* XiangShan is licensed under Mulan PSL v2.
609c6f1ddSLingrui98* You can use this software according to the terms and conditions of the Mulan PSL v2.
709c6f1ddSLingrui98* You may obtain a copy of Mulan PSL v2 at:
809c6f1ddSLingrui98*          http://license.coscl.org.cn/MulanPSL2
909c6f1ddSLingrui98*
1009c6f1ddSLingrui98* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
1109c6f1ddSLingrui98* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
1209c6f1ddSLingrui98* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
1309c6f1ddSLingrui98*
1409c6f1ddSLingrui98* See the Mulan PSL v2 for more details.
1509c6f1ddSLingrui98***************************************************************************************/
1609c6f1ddSLingrui98
1709c6f1ddSLingrui98package xiangshan.frontend
1809c6f1ddSLingrui98
1909c6f1ddSLingrui98import chipsalliance.rocketchip.config.Parameters
2009c6f1ddSLingrui98import chisel3._
2109c6f1ddSLingrui98import chisel3.util._
221ca0e4f3SYinan Xuimport utils._
233c02ee8fSwakafaimport utility._
2409c6f1ddSLingrui98import xiangshan._
25e30430c2SJayimport xiangshan.frontend.icache._
261ca0e4f3SYinan Xuimport xiangshan.backend.CtrlToFtqIO
272e1be6e1SSteve Gouimport xiangshan.backend.decode.ImmUnion
283c02ee8fSwakafaimport utility.ChiselDB
2951532d8bSGuokai Chen
3051532d8bSGuokai Chenclass FtqDebugBundle extends Bundle {
3151532d8bSGuokai Chen  val pc = UInt(39.W)
3251532d8bSGuokai Chen  val target = UInt(39.W)
3351532d8bSGuokai Chen  val isBr = Bool()
3451532d8bSGuokai Chen  val isJmp = Bool()
3551532d8bSGuokai Chen  val isCall = Bool()
3651532d8bSGuokai Chen  val isRet = Bool()
3751532d8bSGuokai Chen  val misPred = Bool()
3851532d8bSGuokai Chen  val isTaken = Bool()
3951532d8bSGuokai Chen  val predStage = UInt(2.W)
4051532d8bSGuokai Chen}
4109c6f1ddSLingrui98
4209c6f1ddSLingrui98class FtqPtr(implicit p: Parameters) extends CircularQueuePtr[FtqPtr](
4309c6f1ddSLingrui98  p => p(XSCoreParamsKey).FtqSize
4409c6f1ddSLingrui98){
4509c6f1ddSLingrui98}
4609c6f1ddSLingrui98
4709c6f1ddSLingrui98object FtqPtr {
4809c6f1ddSLingrui98  def apply(f: Bool, v: UInt)(implicit p: Parameters): FtqPtr = {
4909c6f1ddSLingrui98    val ptr = Wire(new FtqPtr)
5009c6f1ddSLingrui98    ptr.flag := f
5109c6f1ddSLingrui98    ptr.value := v
5209c6f1ddSLingrui98    ptr
5309c6f1ddSLingrui98  }
5409c6f1ddSLingrui98  def inverse(ptr: FtqPtr)(implicit p: Parameters): FtqPtr = {
5509c6f1ddSLingrui98    apply(!ptr.flag, ptr.value)
5609c6f1ddSLingrui98  }
5709c6f1ddSLingrui98}
5809c6f1ddSLingrui98
5909c6f1ddSLingrui98class FtqNRSRAM[T <: Data](gen: T, numRead: Int)(implicit p: Parameters) extends XSModule {
6009c6f1ddSLingrui98
6109c6f1ddSLingrui98  val io = IO(new Bundle() {
6209c6f1ddSLingrui98    val raddr = Input(Vec(numRead, UInt(log2Up(FtqSize).W)))
6309c6f1ddSLingrui98    val ren = Input(Vec(numRead, Bool()))
6409c6f1ddSLingrui98    val rdata = Output(Vec(numRead, gen))
6509c6f1ddSLingrui98    val waddr = Input(UInt(log2Up(FtqSize).W))
6609c6f1ddSLingrui98    val wen = Input(Bool())
6709c6f1ddSLingrui98    val wdata = Input(gen)
6809c6f1ddSLingrui98  })
6909c6f1ddSLingrui98
7009c6f1ddSLingrui98  for(i <- 0 until numRead){
7109c6f1ddSLingrui98    val sram = Module(new SRAMTemplate(gen, FtqSize))
7209c6f1ddSLingrui98    sram.io.r.req.valid := io.ren(i)
7309c6f1ddSLingrui98    sram.io.r.req.bits.setIdx := io.raddr(i)
7409c6f1ddSLingrui98    io.rdata(i) := sram.io.r.resp.data(0)
7509c6f1ddSLingrui98    sram.io.w.req.valid := io.wen
7609c6f1ddSLingrui98    sram.io.w.req.bits.setIdx := io.waddr
7709c6f1ddSLingrui98    sram.io.w.req.bits.data := VecInit(io.wdata)
7809c6f1ddSLingrui98  }
7909c6f1ddSLingrui98
8009c6f1ddSLingrui98}
8109c6f1ddSLingrui98
8209c6f1ddSLingrui98class Ftq_RF_Components(implicit p: Parameters) extends XSBundle with BPUUtils {
8309c6f1ddSLingrui98  val startAddr = UInt(VAddrBits.W)
84b37e4b45SLingrui98  val nextLineAddr = UInt(VAddrBits.W)
8509c6f1ddSLingrui98  val isNextMask = Vec(PredictWidth, Bool())
86b37e4b45SLingrui98  val fallThruError = Bool()
87b37e4b45SLingrui98  // val carry = Bool()
8809c6f1ddSLingrui98  def getPc(offset: UInt) = {
8985215037SLingrui98    def getHigher(pc: UInt) = pc(VAddrBits-1, log2Ceil(PredictWidth)+instOffsetBits+1)
9085215037SLingrui98    def getOffset(pc: UInt) = pc(log2Ceil(PredictWidth)+instOffsetBits, instOffsetBits)
91b37e4b45SLingrui98    Cat(getHigher(Mux(isNextMask(offset) && startAddr(log2Ceil(PredictWidth)+instOffsetBits), nextLineAddr, startAddr)),
9209c6f1ddSLingrui98        getOffset(startAddr)+offset, 0.U(instOffsetBits.W))
9309c6f1ddSLingrui98  }
9409c6f1ddSLingrui98  def fromBranchPrediction(resp: BranchPredictionBundle) = {
95a229ab6cSLingrui98    def carryPos(addr: UInt) = addr(instOffsetBits+log2Ceil(PredictWidth)+1)
9609c6f1ddSLingrui98    this.startAddr := resp.pc
97a60a2901SLingrui98    this.nextLineAddr := resp.pc + (FetchWidth * 4 * 2).U // may be broken on other configs
9809c6f1ddSLingrui98    this.isNextMask := VecInit((0 until PredictWidth).map(i =>
9909c6f1ddSLingrui98      (resp.pc(log2Ceil(PredictWidth), 1) +& i.U)(log2Ceil(PredictWidth)).asBool()
10009c6f1ddSLingrui98    ))
101b37e4b45SLingrui98    this.fallThruError := resp.fallThruError
10209c6f1ddSLingrui98    this
10309c6f1ddSLingrui98  }
10409c6f1ddSLingrui98  override def toPrintable: Printable = {
105b37e4b45SLingrui98    p"startAddr:${Hexadecimal(startAddr)}"
10609c6f1ddSLingrui98  }
10709c6f1ddSLingrui98}
10809c6f1ddSLingrui98
10909c6f1ddSLingrui98class Ftq_pd_Entry(implicit p: Parameters) extends XSBundle {
11009c6f1ddSLingrui98  val brMask = Vec(PredictWidth, Bool())
11109c6f1ddSLingrui98  val jmpInfo = ValidUndirectioned(Vec(3, Bool()))
11209c6f1ddSLingrui98  val jmpOffset = UInt(log2Ceil(PredictWidth).W)
11309c6f1ddSLingrui98  val jalTarget = UInt(VAddrBits.W)
11409c6f1ddSLingrui98  val rvcMask = Vec(PredictWidth, Bool())
11509c6f1ddSLingrui98  def hasJal  = jmpInfo.valid && !jmpInfo.bits(0)
11609c6f1ddSLingrui98  def hasJalr = jmpInfo.valid && jmpInfo.bits(0)
11709c6f1ddSLingrui98  def hasCall = jmpInfo.valid && jmpInfo.bits(1)
11809c6f1ddSLingrui98  def hasRet  = jmpInfo.valid && jmpInfo.bits(2)
11909c6f1ddSLingrui98
12009c6f1ddSLingrui98  def fromPdWb(pdWb: PredecodeWritebackBundle) = {
12109c6f1ddSLingrui98    val pds = pdWb.pd
12209c6f1ddSLingrui98    this.brMask := VecInit(pds.map(pd => pd.isBr && pd.valid))
12309c6f1ddSLingrui98    this.jmpInfo.valid := VecInit(pds.map(pd => (pd.isJal || pd.isJalr) && pd.valid)).asUInt.orR
12409c6f1ddSLingrui98    this.jmpInfo.bits := ParallelPriorityMux(pds.map(pd => (pd.isJal || pd.isJalr) && pd.valid),
12509c6f1ddSLingrui98                                             pds.map(pd => VecInit(pd.isJalr, pd.isCall, pd.isRet)))
12609c6f1ddSLingrui98    this.jmpOffset := ParallelPriorityEncoder(pds.map(pd => (pd.isJal || pd.isJalr) && pd.valid))
12709c6f1ddSLingrui98    this.rvcMask := VecInit(pds.map(pd => pd.isRVC))
12809c6f1ddSLingrui98    this.jalTarget := pdWb.jalTarget
12909c6f1ddSLingrui98  }
13009c6f1ddSLingrui98
13109c6f1ddSLingrui98  def toPd(offset: UInt) = {
13209c6f1ddSLingrui98    require(offset.getWidth == log2Ceil(PredictWidth))
13309c6f1ddSLingrui98    val pd = Wire(new PreDecodeInfo)
13409c6f1ddSLingrui98    pd.valid := true.B
13509c6f1ddSLingrui98    pd.isRVC := rvcMask(offset)
13609c6f1ddSLingrui98    val isBr = brMask(offset)
13709c6f1ddSLingrui98    val isJalr = offset === jmpOffset && jmpInfo.valid && jmpInfo.bits(0)
13809c6f1ddSLingrui98    pd.brType := Cat(offset === jmpOffset && jmpInfo.valid, isJalr || isBr)
13909c6f1ddSLingrui98    pd.isCall := offset === jmpOffset && jmpInfo.valid && jmpInfo.bits(1)
14009c6f1ddSLingrui98    pd.isRet  := offset === jmpOffset && jmpInfo.valid && jmpInfo.bits(2)
14109c6f1ddSLingrui98    pd
14209c6f1ddSLingrui98  }
14309c6f1ddSLingrui98}
14409c6f1ddSLingrui98
14509c6f1ddSLingrui98
14609c6f1ddSLingrui98
147c2d1ec7dSLingrui98class Ftq_Redirect_SRAMEntry(implicit p: Parameters) extends SpeculativeInfo {}
14809c6f1ddSLingrui98
14909c6f1ddSLingrui98class Ftq_1R_SRAMEntry(implicit p: Parameters) extends XSBundle with HasBPUConst {
15009c6f1ddSLingrui98  val meta = UInt(MaxMetaLength.W)
15109c6f1ddSLingrui98}
15209c6f1ddSLingrui98
15309c6f1ddSLingrui98class Ftq_Pred_Info(implicit p: Parameters) extends XSBundle {
15409c6f1ddSLingrui98  val target = UInt(VAddrBits.W)
15509c6f1ddSLingrui98  val cfiIndex = ValidUndirectioned(UInt(log2Ceil(PredictWidth).W))
15609c6f1ddSLingrui98}
15709c6f1ddSLingrui98
15809c6f1ddSLingrui98
15909c6f1ddSLingrui98class FtqRead[T <: Data](private val gen: T)(implicit p: Parameters) extends XSBundle {
16009c6f1ddSLingrui98  val ptr = Output(new FtqPtr)
16109c6f1ddSLingrui98  val offset = Output(UInt(log2Ceil(PredictWidth).W))
16209c6f1ddSLingrui98  val data = Input(gen)
16309c6f1ddSLingrui98  def apply(ptr: FtqPtr, offset: UInt) = {
16409c6f1ddSLingrui98    this.ptr := ptr
16509c6f1ddSLingrui98    this.offset := offset
16609c6f1ddSLingrui98    this.data
16709c6f1ddSLingrui98  }
16809c6f1ddSLingrui98}
16909c6f1ddSLingrui98
17009c6f1ddSLingrui98
17109c6f1ddSLingrui98class FtqToBpuIO(implicit p: Parameters) extends XSBundle {
17209c6f1ddSLingrui98  val redirect = Valid(new BranchPredictionRedirect)
17309c6f1ddSLingrui98  val update = Valid(new BranchPredictionUpdate)
17409c6f1ddSLingrui98  val enq_ptr = Output(new FtqPtr)
17509c6f1ddSLingrui98}
17609c6f1ddSLingrui98
17709c6f1ddSLingrui98class FtqToIfuIO(implicit p: Parameters) extends XSBundle with HasCircularQueuePtrHelper {
17809c6f1ddSLingrui98  val req = Decoupled(new FetchRequestBundle)
17909c6f1ddSLingrui98  val redirect = Valid(new Redirect)
18009c6f1ddSLingrui98  val flushFromBpu = new Bundle {
18109c6f1ddSLingrui98    // when ifu pipeline is not stalled,
18209c6f1ddSLingrui98    // a packet from bpu s3 can reach f1 at most
18309c6f1ddSLingrui98    val s2 = Valid(new FtqPtr)
184cb4f77ceSLingrui98    val s3 = Valid(new FtqPtr)
18509c6f1ddSLingrui98    def shouldFlushBy(src: Valid[FtqPtr], idx_to_flush: FtqPtr) = {
18609c6f1ddSLingrui98      src.valid && !isAfter(src.bits, idx_to_flush)
18709c6f1ddSLingrui98    }
18809c6f1ddSLingrui98    def shouldFlushByStage2(idx: FtqPtr) = shouldFlushBy(s2, idx)
189cb4f77ceSLingrui98    def shouldFlushByStage3(idx: FtqPtr) = shouldFlushBy(s3, idx)
19009c6f1ddSLingrui98  }
19109c6f1ddSLingrui98}
19209c6f1ddSLingrui98
193c5c5edaeSJeniusclass FtqToICacheIO(implicit p: Parameters) extends XSBundle with HasCircularQueuePtrHelper {
194c5c5edaeSJenius  //NOTE: req.bits must be prepare in T cycle
195c5c5edaeSJenius  // while req.valid is set true in T + 1 cycle
196c5c5edaeSJenius  val req = Decoupled(new FtqToICacheRequestBundle)
197c5c5edaeSJenius}
198c5c5edaeSJenius
19909c6f1ddSLingrui98trait HasBackendRedirectInfo extends HasXSParameter {
2002e1be6e1SSteve Gou  def numRedirectPcRead = exuParameters.JmpCnt + exuParameters.AluCnt + 1
20109c6f1ddSLingrui98  def isLoadReplay(r: Valid[Redirect]) = r.bits.flushItself()
20209c6f1ddSLingrui98}
20309c6f1ddSLingrui98
20409c6f1ddSLingrui98class FtqToCtrlIO(implicit p: Parameters) extends XSBundle with HasBackendRedirectInfo {
205b56f947eSYinan Xu  // write to backend pc mem
206b56f947eSYinan Xu  val pc_mem_wen = Output(Bool())
207b56f947eSYinan Xu  val pc_mem_waddr = Output(UInt(log2Ceil(FtqSize).W))
208b56f947eSYinan Xu  val pc_mem_wdata = Output(new Ftq_RF_Components)
209873dc383SLingrui98  // newest target
210873dc383SLingrui98  val newest_entry_target = Output(UInt(VAddrBits.W))
211873dc383SLingrui98  val newest_entry_ptr = Output(new FtqPtr)
21209c6f1ddSLingrui98}
21309c6f1ddSLingrui98
21409c6f1ddSLingrui98
21509c6f1ddSLingrui98class FTBEntryGen(implicit p: Parameters) extends XSModule with HasBackendRedirectInfo with HasBPUParameter {
21609c6f1ddSLingrui98  val io = IO(new Bundle {
21709c6f1ddSLingrui98    val start_addr = Input(UInt(VAddrBits.W))
21809c6f1ddSLingrui98    val old_entry = Input(new FTBEntry)
21909c6f1ddSLingrui98    val pd = Input(new Ftq_pd_Entry)
22009c6f1ddSLingrui98    val cfiIndex = Flipped(Valid(UInt(log2Ceil(PredictWidth).W)))
22109c6f1ddSLingrui98    val target = Input(UInt(VAddrBits.W))
22209c6f1ddSLingrui98    val hit = Input(Bool())
22309c6f1ddSLingrui98    val mispredict_vec = Input(Vec(PredictWidth, Bool()))
22409c6f1ddSLingrui98
22509c6f1ddSLingrui98    val new_entry = Output(new FTBEntry)
22609c6f1ddSLingrui98    val new_br_insert_pos = Output(Vec(numBr, Bool()))
22709c6f1ddSLingrui98    val taken_mask = Output(Vec(numBr, Bool()))
228803124a6SLingrui98    val jmp_taken = Output(Bool())
22909c6f1ddSLingrui98    val mispred_mask = Output(Vec(numBr+1, Bool()))
23009c6f1ddSLingrui98
23109c6f1ddSLingrui98    // for perf counters
23209c6f1ddSLingrui98    val is_init_entry = Output(Bool())
23309c6f1ddSLingrui98    val is_old_entry = Output(Bool())
23409c6f1ddSLingrui98    val is_new_br = Output(Bool())
23509c6f1ddSLingrui98    val is_jalr_target_modified = Output(Bool())
23609c6f1ddSLingrui98    val is_always_taken_modified = Output(Bool())
23709c6f1ddSLingrui98    val is_br_full = Output(Bool())
23809c6f1ddSLingrui98  })
23909c6f1ddSLingrui98
24009c6f1ddSLingrui98  // no mispredictions detected at predecode
24109c6f1ddSLingrui98  val hit = io.hit
24209c6f1ddSLingrui98  val pd = io.pd
24309c6f1ddSLingrui98
24409c6f1ddSLingrui98  val init_entry = WireInit(0.U.asTypeOf(new FTBEntry))
24509c6f1ddSLingrui98
24609c6f1ddSLingrui98
24709c6f1ddSLingrui98  val cfi_is_br = pd.brMask(io.cfiIndex.bits) && io.cfiIndex.valid
24809c6f1ddSLingrui98  val entry_has_jmp = pd.jmpInfo.valid
24909c6f1ddSLingrui98  val new_jmp_is_jal  = entry_has_jmp && !pd.jmpInfo.bits(0) && io.cfiIndex.valid
25009c6f1ddSLingrui98  val new_jmp_is_jalr = entry_has_jmp &&  pd.jmpInfo.bits(0) && io.cfiIndex.valid
25109c6f1ddSLingrui98  val new_jmp_is_call = entry_has_jmp &&  pd.jmpInfo.bits(1) && io.cfiIndex.valid
25209c6f1ddSLingrui98  val new_jmp_is_ret  = entry_has_jmp &&  pd.jmpInfo.bits(2) && io.cfiIndex.valid
25309c6f1ddSLingrui98  val last_jmp_rvi = entry_has_jmp && pd.jmpOffset === (PredictWidth-1).U && !pd.rvcMask.last
254a60a2901SLingrui98  // val last_br_rvi = cfi_is_br && io.cfiIndex.bits === (PredictWidth-1).U && !pd.rvcMask.last
25509c6f1ddSLingrui98
25609c6f1ddSLingrui98  val cfi_is_jal = io.cfiIndex.bits === pd.jmpOffset && new_jmp_is_jal
25709c6f1ddSLingrui98  val cfi_is_jalr = io.cfiIndex.bits === pd.jmpOffset && new_jmp_is_jalr
25809c6f1ddSLingrui98
259a60a2901SLingrui98  def carryPos = log2Ceil(PredictWidth)+instOffsetBits
26009c6f1ddSLingrui98  def getLower(pc: UInt) = pc(carryPos-1, instOffsetBits)
26109c6f1ddSLingrui98  // if not hit, establish a new entry
26209c6f1ddSLingrui98  init_entry.valid := true.B
26309c6f1ddSLingrui98  // tag is left for ftb to assign
264eeb5ff92SLingrui98
265eeb5ff92SLingrui98  // case br
266eeb5ff92SLingrui98  val init_br_slot = init_entry.getSlotForBr(0)
267eeb5ff92SLingrui98  when (cfi_is_br) {
268eeb5ff92SLingrui98    init_br_slot.valid := true.B
269eeb5ff92SLingrui98    init_br_slot.offset := io.cfiIndex.bits
270b37e4b45SLingrui98    init_br_slot.setLowerStatByTarget(io.start_addr, io.target, numBr == 1)
271eeb5ff92SLingrui98    init_entry.always_taken(0) := true.B // set to always taken on init
272eeb5ff92SLingrui98  }
273eeb5ff92SLingrui98
274eeb5ff92SLingrui98  // case jmp
275eeb5ff92SLingrui98  when (entry_has_jmp) {
276eeb5ff92SLingrui98    init_entry.tailSlot.offset := pd.jmpOffset
277eeb5ff92SLingrui98    init_entry.tailSlot.valid := new_jmp_is_jal || new_jmp_is_jalr
278eeb5ff92SLingrui98    init_entry.tailSlot.setLowerStatByTarget(io.start_addr, Mux(cfi_is_jalr, io.target, pd.jalTarget), isShare=false)
279eeb5ff92SLingrui98  }
280eeb5ff92SLingrui98
28109c6f1ddSLingrui98  val jmpPft = getLower(io.start_addr) +& pd.jmpOffset +& Mux(pd.rvcMask(pd.jmpOffset), 1.U, 2.U)
282a60a2901SLingrui98  init_entry.pftAddr := Mux(entry_has_jmp && !last_jmp_rvi, jmpPft, getLower(io.start_addr))
283a60a2901SLingrui98  init_entry.carry   := Mux(entry_has_jmp && !last_jmp_rvi, jmpPft(carryPos-instOffsetBits), true.B)
28409c6f1ddSLingrui98  init_entry.isJalr := new_jmp_is_jalr
28509c6f1ddSLingrui98  init_entry.isCall := new_jmp_is_call
28609c6f1ddSLingrui98  init_entry.isRet  := new_jmp_is_ret
287f4ebc4b2SLingrui98  // that means fall thru points to the middle of an inst
288ae409b75SSteve Gou  init_entry.last_may_be_rvi_call := pd.jmpOffset === (PredictWidth-1).U && !pd.rvcMask(pd.jmpOffset)
28909c6f1ddSLingrui98
29009c6f1ddSLingrui98  // if hit, check whether a new cfi(only br is possible) is detected
29109c6f1ddSLingrui98  val oe = io.old_entry
292eeb5ff92SLingrui98  val br_recorded_vec = oe.getBrRecordedVec(io.cfiIndex.bits)
29309c6f1ddSLingrui98  val br_recorded = br_recorded_vec.asUInt.orR
29409c6f1ddSLingrui98  val is_new_br = cfi_is_br && !br_recorded
29509c6f1ddSLingrui98  val new_br_offset = io.cfiIndex.bits
29609c6f1ddSLingrui98  // vec(i) means new br will be inserted BEFORE old br(i)
297eeb5ff92SLingrui98  val allBrSlotsVec = oe.allSlotsForBr
29809c6f1ddSLingrui98  val new_br_insert_onehot = VecInit((0 until numBr).map{
29909c6f1ddSLingrui98    i => i match {
300eeb5ff92SLingrui98      case 0 =>
301eeb5ff92SLingrui98        !allBrSlotsVec(0).valid || new_br_offset < allBrSlotsVec(0).offset
302eeb5ff92SLingrui98      case idx =>
303eeb5ff92SLingrui98        allBrSlotsVec(idx-1).valid && new_br_offset > allBrSlotsVec(idx-1).offset &&
304eeb5ff92SLingrui98        (!allBrSlotsVec(idx).valid || new_br_offset < allBrSlotsVec(idx).offset)
30509c6f1ddSLingrui98    }
30609c6f1ddSLingrui98  })
30709c6f1ddSLingrui98
30809c6f1ddSLingrui98  val old_entry_modified = WireInit(io.old_entry)
30909c6f1ddSLingrui98  for (i <- 0 until numBr) {
310eeb5ff92SLingrui98    val slot = old_entry_modified.allSlotsForBr(i)
311eeb5ff92SLingrui98    when (new_br_insert_onehot(i)) {
312eeb5ff92SLingrui98      slot.valid := true.B
313eeb5ff92SLingrui98      slot.offset := new_br_offset
314b37e4b45SLingrui98      slot.setLowerStatByTarget(io.start_addr, io.target, i == numBr-1)
315eeb5ff92SLingrui98      old_entry_modified.always_taken(i) := true.B
316eeb5ff92SLingrui98    }.elsewhen (new_br_offset > oe.allSlotsForBr(i).offset) {
317eeb5ff92SLingrui98      old_entry_modified.always_taken(i) := false.B
318eeb5ff92SLingrui98      // all other fields remain unchanged
319eeb5ff92SLingrui98    }.otherwise {
320eeb5ff92SLingrui98      // case i == 0, remain unchanged
321eeb5ff92SLingrui98      if (i != 0) {
322b37e4b45SLingrui98        val noNeedToMoveFromFormerSlot = (i == numBr-1).B && !oe.brSlots.last.valid
323eeb5ff92SLingrui98        when (!noNeedToMoveFromFormerSlot) {
324eeb5ff92SLingrui98          slot.fromAnotherSlot(oe.allSlotsForBr(i-1))
325eeb5ff92SLingrui98          old_entry_modified.always_taken(i) := oe.always_taken(i)
32609c6f1ddSLingrui98        }
327eeb5ff92SLingrui98      }
328eeb5ff92SLingrui98    }
329eeb5ff92SLingrui98  }
33009c6f1ddSLingrui98
331eeb5ff92SLingrui98  // two circumstances:
332eeb5ff92SLingrui98  // 1. oe: | br | j  |, new br should be in front of j, thus addr of j should be new pft
333eeb5ff92SLingrui98  // 2. oe: | br | br |, new br could be anywhere between, thus new pft is the addr of either
334eeb5ff92SLingrui98  //        the previous last br or the new br
335eeb5ff92SLingrui98  val may_have_to_replace = oe.noEmptySlotForNewBr
336eeb5ff92SLingrui98  val pft_need_to_change = is_new_br && may_have_to_replace
33709c6f1ddSLingrui98  // it should either be the given last br or the new br
33809c6f1ddSLingrui98  when (pft_need_to_change) {
339eeb5ff92SLingrui98    val new_pft_offset =
340710a8720SLingrui98      Mux(!new_br_insert_onehot.asUInt.orR,
341710a8720SLingrui98        new_br_offset, oe.allSlotsForBr.last.offset)
342eeb5ff92SLingrui98
343710a8720SLingrui98    // set jmp to invalid
34409c6f1ddSLingrui98    old_entry_modified.pftAddr := getLower(io.start_addr) + new_pft_offset
34509c6f1ddSLingrui98    old_entry_modified.carry := (getLower(io.start_addr) +& new_pft_offset).head(1).asBool
346f4ebc4b2SLingrui98    old_entry_modified.last_may_be_rvi_call := false.B
34709c6f1ddSLingrui98    old_entry_modified.isCall := false.B
34809c6f1ddSLingrui98    old_entry_modified.isRet := false.B
349eeb5ff92SLingrui98    old_entry_modified.isJalr := false.B
35009c6f1ddSLingrui98  }
35109c6f1ddSLingrui98
35209c6f1ddSLingrui98  val old_entry_jmp_target_modified = WireInit(oe)
353710a8720SLingrui98  val old_target = oe.tailSlot.getTarget(io.start_addr) // may be wrong because we store only 20 lowest bits
354b37e4b45SLingrui98  val old_tail_is_jmp = !oe.tailSlot.sharing
355eeb5ff92SLingrui98  val jalr_target_modified = cfi_is_jalr && (old_target =/= io.target) && old_tail_is_jmp // TODO: pass full jalr target
3563bcae573SLingrui98  when (jalr_target_modified) {
35709c6f1ddSLingrui98    old_entry_jmp_target_modified.setByJmpTarget(io.start_addr, io.target)
35809c6f1ddSLingrui98    old_entry_jmp_target_modified.always_taken := 0.U.asTypeOf(Vec(numBr, Bool()))
35909c6f1ddSLingrui98  }
36009c6f1ddSLingrui98
36109c6f1ddSLingrui98  val old_entry_always_taken = WireInit(oe)
36209c6f1ddSLingrui98  val always_taken_modified_vec = Wire(Vec(numBr, Bool())) // whether modified or not
36309c6f1ddSLingrui98  for (i <- 0 until numBr) {
36409c6f1ddSLingrui98    old_entry_always_taken.always_taken(i) :=
36509c6f1ddSLingrui98      oe.always_taken(i) && io.cfiIndex.valid && oe.brValids(i) && io.cfiIndex.bits === oe.brOffset(i)
366710a8720SLingrui98    always_taken_modified_vec(i) := oe.always_taken(i) && !old_entry_always_taken.always_taken(i)
36709c6f1ddSLingrui98  }
36809c6f1ddSLingrui98  val always_taken_modified = always_taken_modified_vec.reduce(_||_)
36909c6f1ddSLingrui98
37009c6f1ddSLingrui98
37109c6f1ddSLingrui98
37209c6f1ddSLingrui98  val derived_from_old_entry =
37309c6f1ddSLingrui98    Mux(is_new_br, old_entry_modified,
3743bcae573SLingrui98      Mux(jalr_target_modified, old_entry_jmp_target_modified, old_entry_always_taken))
37509c6f1ddSLingrui98
37609c6f1ddSLingrui98
37709c6f1ddSLingrui98  io.new_entry := Mux(!hit, init_entry, derived_from_old_entry)
37809c6f1ddSLingrui98
37909c6f1ddSLingrui98  io.new_br_insert_pos := new_br_insert_onehot
38009c6f1ddSLingrui98  io.taken_mask := VecInit((io.new_entry.brOffset zip io.new_entry.brValids).map{
38109c6f1ddSLingrui98    case (off, v) => io.cfiIndex.bits === off && io.cfiIndex.valid && v
38209c6f1ddSLingrui98  })
383803124a6SLingrui98  io.jmp_taken := io.new_entry.jmpValid && io.new_entry.tailSlot.offset === io.cfiIndex.bits
38409c6f1ddSLingrui98  for (i <- 0 until numBr) {
38509c6f1ddSLingrui98    io.mispred_mask(i) := io.new_entry.brValids(i) && io.mispredict_vec(io.new_entry.brOffset(i))
38609c6f1ddSLingrui98  }
38709c6f1ddSLingrui98  io.mispred_mask.last := io.new_entry.jmpValid && io.mispredict_vec(pd.jmpOffset)
38809c6f1ddSLingrui98
38909c6f1ddSLingrui98  // for perf counters
39009c6f1ddSLingrui98  io.is_init_entry := !hit
3913bcae573SLingrui98  io.is_old_entry := hit && !is_new_br && !jalr_target_modified && !always_taken_modified
39209c6f1ddSLingrui98  io.is_new_br := hit && is_new_br
3933bcae573SLingrui98  io.is_jalr_target_modified := hit && jalr_target_modified
39409c6f1ddSLingrui98  io.is_always_taken_modified := hit && always_taken_modified
395eeb5ff92SLingrui98  io.is_br_full := hit && is_new_br && may_have_to_replace
39609c6f1ddSLingrui98}
39709c6f1ddSLingrui98
398c5c5edaeSJeniusclass FtqPcMemWrapper(numOtherReads: Int)(implicit p: Parameters) extends XSModule with HasBackendRedirectInfo {
399c5c5edaeSJenius  val io = IO(new Bundle {
400c5c5edaeSJenius    val ifuPtr_w       = Input(new FtqPtr)
401c5c5edaeSJenius    val ifuPtrPlus1_w  = Input(new FtqPtr)
4026bf9b30dSLingrui98    val ifuPtrPlus2_w  = Input(new FtqPtr)
403c5c5edaeSJenius    val commPtr_w      = Input(new FtqPtr)
4046bf9b30dSLingrui98    val commPtrPlus1_w = Input(new FtqPtr)
405c5c5edaeSJenius    val ifuPtr_rdata       = Output(new Ftq_RF_Components)
406c5c5edaeSJenius    val ifuPtrPlus1_rdata  = Output(new Ftq_RF_Components)
4076bf9b30dSLingrui98    val ifuPtrPlus2_rdata  = Output(new Ftq_RF_Components)
408c5c5edaeSJenius    val commPtr_rdata      = Output(new Ftq_RF_Components)
4096bf9b30dSLingrui98    val commPtrPlus1_rdata = Output(new Ftq_RF_Components)
410c5c5edaeSJenius
411c5c5edaeSJenius    val other_raddrs = Input(Vec(numOtherReads, UInt(log2Ceil(FtqSize).W)))
412c5c5edaeSJenius    val other_rdatas = Output(Vec(numOtherReads, new Ftq_RF_Components))
413c5c5edaeSJenius
414c5c5edaeSJenius    val wen = Input(Bool())
415c5c5edaeSJenius    val waddr = Input(UInt(log2Ceil(FtqSize).W))
416c5c5edaeSJenius    val wdata = Input(new Ftq_RF_Components)
417c5c5edaeSJenius  })
418c5c5edaeSJenius
4196bf9b30dSLingrui98  val num_pc_read = numOtherReads + 5
420c5c5edaeSJenius  val mem = Module(new SyncDataModuleTemplate(new Ftq_RF_Components, FtqSize,
42128f2cf58SLingrui98    num_pc_read, 1, "FtqPC"))
422c5c5edaeSJenius  mem.io.wen(0)   := io.wen
423c5c5edaeSJenius  mem.io.waddr(0) := io.waddr
424c5c5edaeSJenius  mem.io.wdata(0) := io.wdata
425c5c5edaeSJenius
4266bf9b30dSLingrui98  // read one cycle ahead for ftq local reads
427c5c5edaeSJenius  val raddr_vec = VecInit(io.other_raddrs ++
42888bc4f90SLingrui98    Seq(io.ifuPtr_w.value, io.ifuPtrPlus1_w.value, io.ifuPtrPlus2_w.value, io.commPtrPlus1_w.value, io.commPtr_w.value))
429c5c5edaeSJenius
430c5c5edaeSJenius  mem.io.raddr := raddr_vec
431c5c5edaeSJenius
4326bf9b30dSLingrui98  io.other_rdatas       := mem.io.rdata.dropRight(5)
4336bf9b30dSLingrui98  io.ifuPtr_rdata       := mem.io.rdata.dropRight(4).last
4346bf9b30dSLingrui98  io.ifuPtrPlus1_rdata  := mem.io.rdata.dropRight(3).last
4356bf9b30dSLingrui98  io.ifuPtrPlus2_rdata  := mem.io.rdata.dropRight(2).last
4366bf9b30dSLingrui98  io.commPtrPlus1_rdata := mem.io.rdata.dropRight(1).last
437c5c5edaeSJenius  io.commPtr_rdata      := mem.io.rdata.last
438c5c5edaeSJenius}
439c5c5edaeSJenius
44009c6f1ddSLingrui98class Ftq(implicit p: Parameters) extends XSModule with HasCircularQueuePtrHelper
441e30430c2SJay  with HasBackendRedirectInfo with BPUUtils with HasBPUConst with HasPerfEvents
442e30430c2SJay  with HasICacheParameters{
44309c6f1ddSLingrui98  val io = IO(new Bundle {
44409c6f1ddSLingrui98    val fromBpu = Flipped(new BpuToFtqIO)
44509c6f1ddSLingrui98    val fromIfu = Flipped(new IfuToFtqIO)
44609c6f1ddSLingrui98    val fromBackend = Flipped(new CtrlToFtqIO)
44709c6f1ddSLingrui98
44809c6f1ddSLingrui98    val toBpu = new FtqToBpuIO
44909c6f1ddSLingrui98    val toIfu = new FtqToIfuIO
450c5c5edaeSJenius    val toICache = new FtqToICacheIO
45109c6f1ddSLingrui98    val toBackend = new FtqToCtrlIO
45209c6f1ddSLingrui98
4537052722fSJay    val toPrefetch = new FtqPrefechBundle
4547052722fSJay
45509c6f1ddSLingrui98    val bpuInfo = new Bundle {
45609c6f1ddSLingrui98      val bpRight = Output(UInt(XLEN.W))
45709c6f1ddSLingrui98      val bpWrong = Output(UInt(XLEN.W))
45809c6f1ddSLingrui98    }
4591d1e6d4dSJenius
4601d1e6d4dSJenius    val mmioCommitRead = Flipped(new mmioCommitRead)
46109c6f1ddSLingrui98  })
46209c6f1ddSLingrui98  io.bpuInfo := DontCare
46309c6f1ddSLingrui98
4642e1be6e1SSteve Gou  val backendRedirect = Wire(Valid(new Redirect))
4652e1be6e1SSteve Gou  val backendRedirectReg = RegNext(backendRedirect)
46609c6f1ddSLingrui98
467df5b4b8eSYinan Xu  val stage2Flush = backendRedirect.valid
46809c6f1ddSLingrui98  val backendFlush = stage2Flush || RegNext(stage2Flush)
46909c6f1ddSLingrui98  val ifuFlush = Wire(Bool())
47009c6f1ddSLingrui98
47109c6f1ddSLingrui98  val flush = stage2Flush || RegNext(stage2Flush)
47209c6f1ddSLingrui98
47309c6f1ddSLingrui98  val allowBpuIn, allowToIfu = WireInit(false.B)
47409c6f1ddSLingrui98  val flushToIfu = !allowToIfu
475df5b4b8eSYinan Xu  allowBpuIn := !ifuFlush && !backendRedirect.valid && !backendRedirectReg.valid
476df5b4b8eSYinan Xu  allowToIfu := !ifuFlush && !backendRedirect.valid && !backendRedirectReg.valid
47709c6f1ddSLingrui98
478f56177cbSJenius  def copyNum = 5
479e30430c2SJay  val bpuPtr, ifuPtr, ifuWbPtr, commPtr = RegInit(FtqPtr(false.B, 0.U))
480c9bc5480SLingrui98  val ifuPtrPlus1 = RegInit(FtqPtr(false.B, 1.U))
4816bf9b30dSLingrui98  val ifuPtrPlus2 = RegInit(FtqPtr(false.B, 2.U))
4826bf9b30dSLingrui98  val commPtrPlus1 = RegInit(FtqPtr(false.B, 1.U))
483f56177cbSJenius  val copied_ifu_ptr = Seq.fill(copyNum)(RegInit(FtqPtr(false.B, 0.U)))
484dc270d3bSJenius  val copied_bpu_ptr = Seq.fill(copyNum)(RegInit(FtqPtr(false.B, 0.U)))
4856bf9b30dSLingrui98  require(FtqSize >= 4)
486c5c5edaeSJenius  val ifuPtr_write       = WireInit(ifuPtr)
487c5c5edaeSJenius  val ifuPtrPlus1_write  = WireInit(ifuPtrPlus1)
4886bf9b30dSLingrui98  val ifuPtrPlus2_write  = WireInit(ifuPtrPlus2)
489c5c5edaeSJenius  val ifuWbPtr_write     = WireInit(ifuWbPtr)
490c5c5edaeSJenius  val commPtr_write      = WireInit(commPtr)
4916bf9b30dSLingrui98  val commPtrPlus1_write = WireInit(commPtrPlus1)
492c5c5edaeSJenius  ifuPtr       := ifuPtr_write
493c5c5edaeSJenius  ifuPtrPlus1  := ifuPtrPlus1_write
4946bf9b30dSLingrui98  ifuPtrPlus2  := ifuPtrPlus2_write
495c5c5edaeSJenius  ifuWbPtr     := ifuWbPtr_write
496c5c5edaeSJenius  commPtr      := commPtr_write
497f83ef67eSLingrui98  commPtrPlus1 := commPtrPlus1_write
498f56177cbSJenius  copied_ifu_ptr.map{ptr =>
499f56177cbSJenius    ptr := ifuPtr_write
500f56177cbSJenius    dontTouch(ptr)
501f56177cbSJenius  }
50209c6f1ddSLingrui98  val validEntries = distanceBetween(bpuPtr, commPtr)
50309c6f1ddSLingrui98
50409c6f1ddSLingrui98  // **********************************************************************
50509c6f1ddSLingrui98  // **************************** enq from bpu ****************************
50609c6f1ddSLingrui98  // **********************************************************************
50709c6f1ddSLingrui98  val new_entry_ready = validEntries < FtqSize.U
50809c6f1ddSLingrui98  io.fromBpu.resp.ready := new_entry_ready
50909c6f1ddSLingrui98
51009c6f1ddSLingrui98  val bpu_s2_resp = io.fromBpu.resp.bits.s2
511cb4f77ceSLingrui98  val bpu_s3_resp = io.fromBpu.resp.bits.s3
51209c6f1ddSLingrui98  val bpu_s2_redirect = bpu_s2_resp.valid && bpu_s2_resp.hasRedirect
513cb4f77ceSLingrui98  val bpu_s3_redirect = bpu_s3_resp.valid && bpu_s3_resp.hasRedirect
51409c6f1ddSLingrui98
51509c6f1ddSLingrui98  io.toBpu.enq_ptr := bpuPtr
51609c6f1ddSLingrui98  val enq_fire = io.fromBpu.resp.fire() && allowBpuIn // from bpu s1
517cb4f77ceSLingrui98  val bpu_in_fire = (io.fromBpu.resp.fire() || bpu_s2_redirect || bpu_s3_redirect) && allowBpuIn
51809c6f1ddSLingrui98
519b37e4b45SLingrui98  val bpu_in_resp = io.fromBpu.resp.bits.selectedResp
520b37e4b45SLingrui98  val bpu_in_stage = io.fromBpu.resp.bits.selectedRespIdx
52109c6f1ddSLingrui98  val bpu_in_resp_ptr = Mux(bpu_in_stage === BP_S1, bpuPtr, bpu_in_resp.ftq_idx)
52209c6f1ddSLingrui98  val bpu_in_resp_idx = bpu_in_resp_ptr.value
52309c6f1ddSLingrui98
524378f00d9SJenius  // read ports:      prefetchReq ++  ifuReq1 + ifuReq2 + ifuReq3 + commitUpdate2 + commitUpdate
525378f00d9SJenius  val ftq_pc_mem = Module(new FtqPcMemWrapper(1))
5266bf9b30dSLingrui98  // resp from uBTB
527c5c5edaeSJenius  ftq_pc_mem.io.wen := bpu_in_fire
528c5c5edaeSJenius  ftq_pc_mem.io.waddr := bpu_in_resp_idx
529c5c5edaeSJenius  ftq_pc_mem.io.wdata.fromBranchPrediction(bpu_in_resp)
53009c6f1ddSLingrui98
53109c6f1ddSLingrui98  //                                                            ifuRedirect + backendRedirect + commit
53209c6f1ddSLingrui98  val ftq_redirect_sram = Module(new FtqNRSRAM(new Ftq_Redirect_SRAMEntry, 1+1+1))
53309c6f1ddSLingrui98  // these info is intended to enq at the last stage of bpu
53409c6f1ddSLingrui98  ftq_redirect_sram.io.wen := io.fromBpu.resp.bits.lastStage.valid
53509c6f1ddSLingrui98  ftq_redirect_sram.io.waddr := io.fromBpu.resp.bits.lastStage.ftq_idx.value
536c2d1ec7dSLingrui98  ftq_redirect_sram.io.wdata := io.fromBpu.resp.bits.last_stage_spec_info
53749cbc998SLingrui98  println(f"ftq redirect SRAM: entry ${ftq_redirect_sram.io.wdata.getWidth} * ${FtqSize} * 3")
53849cbc998SLingrui98  println(f"ftq redirect SRAM: ahead fh ${ftq_redirect_sram.io.wdata.afhob.getWidth} * ${FtqSize} * 3")
53909c6f1ddSLingrui98
54009c6f1ddSLingrui98  val ftq_meta_1r_sram = Module(new FtqNRSRAM(new Ftq_1R_SRAMEntry, 1))
54109c6f1ddSLingrui98  // these info is intended to enq at the last stage of bpu
54209c6f1ddSLingrui98  ftq_meta_1r_sram.io.wen := io.fromBpu.resp.bits.lastStage.valid
54309c6f1ddSLingrui98  ftq_meta_1r_sram.io.waddr := io.fromBpu.resp.bits.lastStage.ftq_idx.value
544c2d1ec7dSLingrui98  ftq_meta_1r_sram.io.wdata.meta := io.fromBpu.resp.bits.last_stage_meta
54509c6f1ddSLingrui98  //                                                            ifuRedirect + backendRedirect + commit
54609c6f1ddSLingrui98  val ftb_entry_mem = Module(new SyncDataModuleTemplate(new FTBEntry, FtqSize, 1+1+1, 1))
54709c6f1ddSLingrui98  ftb_entry_mem.io.wen(0) := io.fromBpu.resp.bits.lastStage.valid
54809c6f1ddSLingrui98  ftb_entry_mem.io.waddr(0) := io.fromBpu.resp.bits.lastStage.ftq_idx.value
549c2d1ec7dSLingrui98  ftb_entry_mem.io.wdata(0) := io.fromBpu.resp.bits.last_stage_ftb_entry
55009c6f1ddSLingrui98
55109c6f1ddSLingrui98
55209c6f1ddSLingrui98  // multi-write
553b0ed7239SLingrui98  val update_target = Reg(Vec(FtqSize, UInt(VAddrBits.W))) // could be taken target or fallThrough //TODO: remove this
5546bf9b30dSLingrui98  val newest_entry_target = Reg(UInt(VAddrBits.W))
5556bf9b30dSLingrui98  val newest_entry_ptr = Reg(new FtqPtr)
55609c6f1ddSLingrui98  val cfiIndex_vec = Reg(Vec(FtqSize, ValidUndirectioned(UInt(log2Ceil(PredictWidth).W))))
55709c6f1ddSLingrui98  val mispredict_vec = Reg(Vec(FtqSize, Vec(PredictWidth, Bool())))
55809c6f1ddSLingrui98  val pred_stage = Reg(Vec(FtqSize, UInt(2.W)))
55909c6f1ddSLingrui98
560b5808fc2Ssfencevma  val c_invalid :: c_valid :: c_commited :: Nil = Enum(3)
56109c6f1ddSLingrui98  val commitStateQueue = RegInit(VecInit(Seq.fill(FtqSize) {
56209c6f1ddSLingrui98    VecInit(Seq.fill(PredictWidth)(c_invalid))
56309c6f1ddSLingrui98  }))
56409c6f1ddSLingrui98
56509c6f1ddSLingrui98  val f_to_send :: f_sent :: Nil = Enum(2)
56609c6f1ddSLingrui98  val entry_fetch_status = RegInit(VecInit(Seq.fill(FtqSize)(f_sent)))
56709c6f1ddSLingrui98
56809c6f1ddSLingrui98  val h_not_hit :: h_false_hit :: h_hit :: Nil = Enum(3)
56909c6f1ddSLingrui98  val entry_hit_status = RegInit(VecInit(Seq.fill(FtqSize)(h_not_hit)))
57009c6f1ddSLingrui98
571f63797a4SLingrui98  // modify registers one cycle later to cut critical path
572f63797a4SLingrui98  val last_cycle_bpu_in = RegNext(bpu_in_fire)
5736bf9b30dSLingrui98  val last_cycle_bpu_in_ptr = RegNext(bpu_in_resp_ptr)
5746bf9b30dSLingrui98  val last_cycle_bpu_in_idx = last_cycle_bpu_in_ptr.value
5756bf9b30dSLingrui98  val last_cycle_bpu_target = RegNext(bpu_in_resp.getTarget)
576f63797a4SLingrui98  val last_cycle_cfiIndex = RegNext(bpu_in_resp.cfiIndex)
577f63797a4SLingrui98  val last_cycle_bpu_in_stage = RegNext(bpu_in_stage)
578f56177cbSJenius
5797be982afSLingrui98  def extra_copyNum_for_commitStateQueue = 2
5807be982afSLingrui98  val copied_last_cycle_bpu_in = VecInit(Seq.fill(copyNum+extra_copyNum_for_commitStateQueue)(RegNext(bpu_in_fire)))
5817be982afSLingrui98  val copied_last_cycle_bpu_in_ptr_for_ftq = VecInit(Seq.fill(extra_copyNum_for_commitStateQueue)(RegNext(bpu_in_resp_ptr)))
582f56177cbSJenius
583f63797a4SLingrui98  when (last_cycle_bpu_in) {
584f63797a4SLingrui98    entry_fetch_status(last_cycle_bpu_in_idx) := f_to_send
585f63797a4SLingrui98    cfiIndex_vec(last_cycle_bpu_in_idx) := last_cycle_cfiIndex
586f63797a4SLingrui98    pred_stage(last_cycle_bpu_in_idx) := last_cycle_bpu_in_stage
5876bf9b30dSLingrui98
588b0ed7239SLingrui98    update_target(last_cycle_bpu_in_idx) := last_cycle_bpu_target // TODO: remove this
5896bf9b30dSLingrui98    newest_entry_target := last_cycle_bpu_target
5906bf9b30dSLingrui98    newest_entry_ptr := last_cycle_bpu_in_ptr
59109c6f1ddSLingrui98  }
59209c6f1ddSLingrui98
5937be982afSLingrui98  // reduce fanout by delay write for a cycle
5947be982afSLingrui98  when (RegNext(last_cycle_bpu_in)) {
5957be982afSLingrui98    mispredict_vec(RegNext(last_cycle_bpu_in_idx)) := WireInit(VecInit(Seq.fill(PredictWidth)(false.B)))
5967be982afSLingrui98  }
5977be982afSLingrui98
5987be982afSLingrui98  // reduce fanout using copied last_cycle_bpu_in and copied last_cycle_bpu_in_ptr
5997be982afSLingrui98  val copied_last_cycle_bpu_in_for_ftq = copied_last_cycle_bpu_in.takeRight(extra_copyNum_for_commitStateQueue)
6007be982afSLingrui98  copied_last_cycle_bpu_in_for_ftq.zip(copied_last_cycle_bpu_in_ptr_for_ftq).zipWithIndex.map {
6017be982afSLingrui98    case ((in, ptr), i) =>
6027be982afSLingrui98      when (in) {
6037be982afSLingrui98        val perSetEntries = FtqSize / extra_copyNum_for_commitStateQueue // 32
6047be982afSLingrui98        require(FtqSize % extra_copyNum_for_commitStateQueue == 0)
6057be982afSLingrui98        for (j <- 0 until perSetEntries) {
6069361b0c5SLingrui98          when (ptr.value === (i*perSetEntries+j).U) {
6077be982afSLingrui98            commitStateQueue(i*perSetEntries+j) := VecInit(Seq.fill(PredictWidth)(c_invalid))
6087be982afSLingrui98          }
6097be982afSLingrui98        }
6107be982afSLingrui98      }
6119361b0c5SLingrui98  }
6127be982afSLingrui98
613873dc383SLingrui98  // num cycle is fixed
614873dc383SLingrui98  io.toBackend.newest_entry_ptr := RegNext(newest_entry_ptr)
615873dc383SLingrui98  io.toBackend.newest_entry_target := RegNext(newest_entry_target)
616873dc383SLingrui98
617f63797a4SLingrui98
61809c6f1ddSLingrui98  bpuPtr := bpuPtr + enq_fire
619dc270d3bSJenius  copied_bpu_ptr.map(_ := bpuPtr + enq_fire)
620c9bc5480SLingrui98  when (io.toIfu.req.fire && allowToIfu) {
621c5c5edaeSJenius    ifuPtr_write := ifuPtrPlus1
6226bf9b30dSLingrui98    ifuPtrPlus1_write := ifuPtrPlus2
6236bf9b30dSLingrui98    ifuPtrPlus2_write := ifuPtrPlus2 + 1.U
624c9bc5480SLingrui98  }
62509c6f1ddSLingrui98
62609c6f1ddSLingrui98  // only use ftb result to assign hit status
62709c6f1ddSLingrui98  when (bpu_s2_resp.valid) {
628b37e4b45SLingrui98    entry_hit_status(bpu_s2_resp.ftq_idx.value) := Mux(bpu_s2_resp.full_pred.hit, h_hit, h_not_hit)
62909c6f1ddSLingrui98  }
63009c6f1ddSLingrui98
63109c6f1ddSLingrui98
6322f4a3aa4SLingrui98  io.toIfu.flushFromBpu.s2.valid := bpu_s2_redirect
63309c6f1ddSLingrui98  io.toIfu.flushFromBpu.s2.bits := bpu_s2_resp.ftq_idx
63409c6f1ddSLingrui98  when (bpu_s2_resp.valid && bpu_s2_resp.hasRedirect) {
63509c6f1ddSLingrui98    bpuPtr := bpu_s2_resp.ftq_idx + 1.U
636dc270d3bSJenius    copied_bpu_ptr.map(_ := bpu_s2_resp.ftq_idx + 1.U)
63709c6f1ddSLingrui98    // only when ifuPtr runs ahead of bpu s2 resp should we recover it
63809c6f1ddSLingrui98    when (!isBefore(ifuPtr, bpu_s2_resp.ftq_idx)) {
639c5c5edaeSJenius      ifuPtr_write := bpu_s2_resp.ftq_idx
640c5c5edaeSJenius      ifuPtrPlus1_write := bpu_s2_resp.ftq_idx + 1.U
6416bf9b30dSLingrui98      ifuPtrPlus2_write := bpu_s2_resp.ftq_idx + 2.U
64209c6f1ddSLingrui98    }
64309c6f1ddSLingrui98  }
64409c6f1ddSLingrui98
645cb4f77ceSLingrui98  io.toIfu.flushFromBpu.s3.valid := bpu_s3_redirect
646cb4f77ceSLingrui98  io.toIfu.flushFromBpu.s3.bits := bpu_s3_resp.ftq_idx
647cb4f77ceSLingrui98  when (bpu_s3_resp.valid && bpu_s3_resp.hasRedirect) {
648cb4f77ceSLingrui98    bpuPtr := bpu_s3_resp.ftq_idx + 1.U
649dc270d3bSJenius    copied_bpu_ptr.map(_ := bpu_s3_resp.ftq_idx + 1.U)
650cb4f77ceSLingrui98    // only when ifuPtr runs ahead of bpu s2 resp should we recover it
651cb4f77ceSLingrui98    when (!isBefore(ifuPtr, bpu_s3_resp.ftq_idx)) {
652c5c5edaeSJenius      ifuPtr_write := bpu_s3_resp.ftq_idx
653c5c5edaeSJenius      ifuPtrPlus1_write := bpu_s3_resp.ftq_idx + 1.U
6546bf9b30dSLingrui98      ifuPtrPlus2_write := bpu_s3_resp.ftq_idx + 2.U
655cb4f77ceSLingrui98    }
656cb4f77ceSLingrui98  }
657cb4f77ceSLingrui98
65809c6f1ddSLingrui98  XSError(isBefore(bpuPtr, ifuPtr) && !isFull(bpuPtr, ifuPtr), "\nifuPtr is before bpuPtr!\n")
6592448f137SGuokai Chen  XSError(isBefore(ifuWbPtr, commPtr) && !isFull(ifuWbPtr, commPtr), "\ncommPtr is before ifuWbPtr!\n")
66009c6f1ddSLingrui98
661dc270d3bSJenius  (0 until copyNum).map{i =>
662dc270d3bSJenius    XSError(copied_bpu_ptr(i) =/= bpuPtr, "\ncopiedBpuPtr is different from bpuPtr!\n")
663dc270d3bSJenius  }
664dc270d3bSJenius
66509c6f1ddSLingrui98  // ****************************************************************
66609c6f1ddSLingrui98  // **************************** to ifu ****************************
66709c6f1ddSLingrui98  // ****************************************************************
668f22cf846SJenius  // 0  for ifu, and 1-4 for ICache
669f56177cbSJenius  val bpu_in_bypass_buf = RegEnable(ftq_pc_mem.io.wdata, enable=bpu_in_fire)
670f56177cbSJenius  val copied_bpu_in_bypass_buf = VecInit(Seq.fill(copyNum)(RegEnable(ftq_pc_mem.io.wdata, enable=bpu_in_fire)))
671f56177cbSJenius  val bpu_in_bypass_buf_for_ifu = bpu_in_bypass_buf
67209c6f1ddSLingrui98  val bpu_in_bypass_ptr = RegNext(bpu_in_resp_ptr)
67309c6f1ddSLingrui98  val last_cycle_to_ifu_fire = RegNext(io.toIfu.req.fire)
67409c6f1ddSLingrui98
675f56177cbSJenius  val copied_bpu_in_bypass_ptr = VecInit(Seq.fill(copyNum)(RegNext(bpu_in_resp_ptr)))
676f56177cbSJenius  val copied_last_cycle_to_ifu_fire = VecInit(Seq.fill(copyNum)(RegNext(io.toIfu.req.fire)))
67788bc4f90SLingrui98
67809c6f1ddSLingrui98  // read pc and target
6796bf9b30dSLingrui98  ftq_pc_mem.io.ifuPtr_w       := ifuPtr_write
6806bf9b30dSLingrui98  ftq_pc_mem.io.ifuPtrPlus1_w  := ifuPtrPlus1_write
6816bf9b30dSLingrui98  ftq_pc_mem.io.ifuPtrPlus2_w  := ifuPtrPlus2_write
6826bf9b30dSLingrui98  ftq_pc_mem.io.commPtr_w      := commPtr_write
6836bf9b30dSLingrui98  ftq_pc_mem.io.commPtrPlus1_w := commPtrPlus1_write
684c5c5edaeSJenius
68509c6f1ddSLingrui98
6865ff19bd8SLingrui98  io.toIfu.req.bits.ftqIdx := ifuPtr
687f63797a4SLingrui98
688f56177cbSJenius  val toICachePcBundle = Wire(Vec(copyNum,new Ftq_RF_Components))
689dc270d3bSJenius  val toICacheEntryToSend = Wire(Vec(copyNum,Bool()))
690b37e4b45SLingrui98  val toIfuPcBundle = Wire(new Ftq_RF_Components)
691f63797a4SLingrui98  val entry_is_to_send = WireInit(entry_fetch_status(ifuPtr.value) === f_to_send)
692f63797a4SLingrui98  val entry_ftq_offset = WireInit(cfiIndex_vec(ifuPtr.value))
6936bf9b30dSLingrui98  val entry_next_addr  = Wire(UInt(VAddrBits.W))
694b004fa13SJenius
695f56177cbSJenius  val pc_mem_ifu_ptr_rdata   = VecInit(Seq.fill(copyNum)(RegNext(ftq_pc_mem.io.ifuPtr_rdata)))
696f56177cbSJenius  val pc_mem_ifu_plus1_rdata = VecInit(Seq.fill(copyNum)(RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata)))
697b0ed7239SLingrui98  val diff_entry_next_addr = WireInit(update_target(ifuPtr.value)) //TODO: remove this
698f63797a4SLingrui98
699dc270d3bSJenius  val copied_ifu_plus1_to_send = VecInit(Seq.fill(copyNum)(RegNext(entry_fetch_status(ifuPtrPlus1.value) === f_to_send) || RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1))))
700dc270d3bSJenius  val copied_ifu_ptr_to_send   = VecInit(Seq.fill(copyNum)(RegNext(entry_fetch_status(ifuPtr.value) === f_to_send) || RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr)))
701dc270d3bSJenius
702f56177cbSJenius  for(i <- 0 until copyNum){
703f56177cbSJenius    when(copied_last_cycle_bpu_in(i) && copied_bpu_in_bypass_ptr(i) === copied_ifu_ptr(i)){
704f56177cbSJenius      toICachePcBundle(i) := copied_bpu_in_bypass_buf(i)
705dc270d3bSJenius      toICacheEntryToSend(i)   := true.B
706f56177cbSJenius    }.elsewhen(copied_last_cycle_to_ifu_fire(i)){
707f56177cbSJenius      toICachePcBundle(i) := pc_mem_ifu_plus1_rdata(i)
708dc270d3bSJenius      toICacheEntryToSend(i)   := copied_ifu_plus1_to_send(i)
709f56177cbSJenius    }.otherwise{
710f56177cbSJenius      toICachePcBundle(i) := pc_mem_ifu_ptr_rdata(i)
711dc270d3bSJenius      toICacheEntryToSend(i)   := copied_ifu_ptr_to_send(i)
712f56177cbSJenius    }
713f56177cbSJenius  }
714f56177cbSJenius
715873dc383SLingrui98  // TODO: reconsider target address bypass logic
71609c6f1ddSLingrui98  when (last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr) {
71788bc4f90SLingrui98    toIfuPcBundle := bpu_in_bypass_buf_for_ifu
718f678dd91SSteve Gou    entry_is_to_send := true.B
7196bf9b30dSLingrui98    entry_next_addr := last_cycle_bpu_target
720f63797a4SLingrui98    entry_ftq_offset := last_cycle_cfiIndex
721b0ed7239SLingrui98    diff_entry_next_addr := last_cycle_bpu_target // TODO: remove this
72209c6f1ddSLingrui98  }.elsewhen (last_cycle_to_ifu_fire) {
723c5c5edaeSJenius    toIfuPcBundle := RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata)
724c5c5edaeSJenius    entry_is_to_send := RegNext(entry_fetch_status(ifuPtrPlus1.value) === f_to_send) ||
725c5c5edaeSJenius                        RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1)) // reduce potential bubbles
726ed434d67SLingrui98    entry_next_addr := Mux(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1),
72788bc4f90SLingrui98                          bpu_in_bypass_buf_for_ifu.startAddr,
728fef810c0SLingrui98                          Mux(ifuPtr === newest_entry_ptr,
7296bf9b30dSLingrui98                            newest_entry_target,
730f83ef67eSLingrui98                            RegNext(ftq_pc_mem.io.ifuPtrPlus2_rdata.startAddr))) // ifuPtr+2
731c5c5edaeSJenius  }.otherwise {
732c5c5edaeSJenius    toIfuPcBundle := RegNext(ftq_pc_mem.io.ifuPtr_rdata)
73328f2cf58SLingrui98    entry_is_to_send := RegNext(entry_fetch_status(ifuPtr.value) === f_to_send) ||
73428f2cf58SLingrui98                        RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr) // reduce potential bubbles
7356bf9b30dSLingrui98    entry_next_addr := Mux(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1),
73688bc4f90SLingrui98                          bpu_in_bypass_buf_for_ifu.startAddr,
737fef810c0SLingrui98                          Mux(ifuPtr === newest_entry_ptr,
7386bf9b30dSLingrui98                            newest_entry_target,
739f83ef67eSLingrui98                            RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata.startAddr))) // ifuPtr+1
74009c6f1ddSLingrui98  }
74109c6f1ddSLingrui98
742f678dd91SSteve Gou  io.toIfu.req.valid := entry_is_to_send && ifuPtr =/= bpuPtr
743f63797a4SLingrui98  io.toIfu.req.bits.nextStartAddr := entry_next_addr
744f63797a4SLingrui98  io.toIfu.req.bits.ftqOffset := entry_ftq_offset
745b37e4b45SLingrui98  io.toIfu.req.bits.fromFtqPcBundle(toIfuPcBundle)
746c5c5edaeSJenius
747c5c5edaeSJenius  io.toICache.req.valid := entry_is_to_send && ifuPtr =/= bpuPtr
748dc270d3bSJenius  io.toICache.req.bits.readValid.zipWithIndex.map{case(copy, i) => copy := toICacheEntryToSend(i) && copied_ifu_ptr(i) =/= copied_bpu_ptr(i)}
749b004fa13SJenius  io.toICache.req.bits.pcMemRead.zipWithIndex.map{case(copy,i) => copy.fromFtqPcBundle(toICachePcBundle(i))}
750b004fa13SJenius  // io.toICache.req.bits.bypassSelect := last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr
751b004fa13SJenius  // io.toICache.req.bits.bpuBypassWrite.zipWithIndex.map{case(bypassWrtie, i) =>
752b004fa13SJenius  //   bypassWrtie.startAddr := bpu_in_bypass_buf.tail(i).startAddr
753b004fa13SJenius  //   bypassWrtie.nextlineStart := bpu_in_bypass_buf.tail(i).nextLineAddr
754b004fa13SJenius  // }
755f22cf846SJenius
756b0ed7239SLingrui98  // TODO: remove this
757b0ed7239SLingrui98  XSError(io.toIfu.req.valid && diff_entry_next_addr =/= entry_next_addr,
7585a674179SLingrui98          p"\nifu_req_target wrong! ifuPtr: ${ifuPtr}, entry_next_addr: ${Hexadecimal(entry_next_addr)} diff_entry_next_addr: ${Hexadecimal(diff_entry_next_addr)}\n")
759b0ed7239SLingrui98
76009c6f1ddSLingrui98  // when fall through is smaller in value than start address, there must be a false hit
761b37e4b45SLingrui98  when (toIfuPcBundle.fallThruError && entry_hit_status(ifuPtr.value) === h_hit) {
76209c6f1ddSLingrui98    when (io.toIfu.req.fire &&
763cb4f77ceSLingrui98      !(bpu_s2_redirect && bpu_s2_resp.ftq_idx === ifuPtr) &&
764cb4f77ceSLingrui98      !(bpu_s3_redirect && bpu_s3_resp.ftq_idx === ifuPtr)
76509c6f1ddSLingrui98    ) {
76609c6f1ddSLingrui98      entry_hit_status(ifuPtr.value) := h_false_hit
767352db50aSLingrui98      // XSError(true.B, "FTB false hit by fallThroughError, startAddr: %x, fallTHru: %x\n", io.toIfu.req.bits.startAddr, io.toIfu.req.bits.nextStartAddr)
76809c6f1ddSLingrui98    }
769b37e4b45SLingrui98    XSDebug(true.B, "fallThruError! start:%x, fallThru:%x\n", io.toIfu.req.bits.startAddr, io.toIfu.req.bits.nextStartAddr)
77009c6f1ddSLingrui98  }
77109c6f1ddSLingrui98
772a60a2901SLingrui98  XSPerfAccumulate(f"fall_through_error_to_ifu", toIfuPcBundle.fallThruError && entry_hit_status(ifuPtr.value) === h_hit &&
773a60a2901SLingrui98    io.toIfu.req.fire && !(bpu_s2_redirect && bpu_s2_resp.ftq_idx === ifuPtr) && !(bpu_s3_redirect && bpu_s3_resp.ftq_idx === ifuPtr))
774a60a2901SLingrui98
77509c6f1ddSLingrui98  val ifu_req_should_be_flushed =
776cb4f77ceSLingrui98    io.toIfu.flushFromBpu.shouldFlushByStage2(io.toIfu.req.bits.ftqIdx) ||
777cb4f77ceSLingrui98    io.toIfu.flushFromBpu.shouldFlushByStage3(io.toIfu.req.bits.ftqIdx)
77809c6f1ddSLingrui98
77909c6f1ddSLingrui98    when (io.toIfu.req.fire && !ifu_req_should_be_flushed) {
78009c6f1ddSLingrui98      entry_fetch_status(ifuPtr.value) := f_sent
78109c6f1ddSLingrui98    }
78209c6f1ddSLingrui98
78309c6f1ddSLingrui98  // *********************************************************************
78409c6f1ddSLingrui98  // **************************** wb from ifu ****************************
78509c6f1ddSLingrui98  // *********************************************************************
78609c6f1ddSLingrui98  val pdWb = io.fromIfu.pdWb
78709c6f1ddSLingrui98  val pds = pdWb.bits.pd
78809c6f1ddSLingrui98  val ifu_wb_valid = pdWb.valid
78909c6f1ddSLingrui98  val ifu_wb_idx = pdWb.bits.ftqIdx.value
79009c6f1ddSLingrui98  // read ports:                                                         commit update
79109c6f1ddSLingrui98  val ftq_pd_mem = Module(new SyncDataModuleTemplate(new Ftq_pd_Entry, FtqSize, 1, 1))
79209c6f1ddSLingrui98  ftq_pd_mem.io.wen(0) := ifu_wb_valid
79309c6f1ddSLingrui98  ftq_pd_mem.io.waddr(0) := pdWb.bits.ftqIdx.value
79409c6f1ddSLingrui98  ftq_pd_mem.io.wdata(0).fromPdWb(pdWb.bits)
79509c6f1ddSLingrui98
79609c6f1ddSLingrui98  val hit_pd_valid = entry_hit_status(ifu_wb_idx) === h_hit && ifu_wb_valid
79709c6f1ddSLingrui98  val hit_pd_mispred = hit_pd_valid && pdWb.bits.misOffset.valid
79809c6f1ddSLingrui98  val hit_pd_mispred_reg = RegNext(hit_pd_mispred, init=false.B)
799005e809bSJiuyang Liu  val pd_reg       = RegEnable(pds,             pdWb.valid)
800005e809bSJiuyang Liu  val start_pc_reg = RegEnable(pdWb.bits.pc(0), pdWb.valid)
801005e809bSJiuyang Liu  val wb_idx_reg   = RegEnable(ifu_wb_idx,      pdWb.valid)
80209c6f1ddSLingrui98
80309c6f1ddSLingrui98  when (ifu_wb_valid) {
80409c6f1ddSLingrui98    val comm_stq_wen = VecInit(pds.map(_.valid).zip(pdWb.bits.instrRange).map{
80509c6f1ddSLingrui98      case (v, inRange) => v && inRange
80609c6f1ddSLingrui98    })
80709c6f1ddSLingrui98    (commitStateQueue(ifu_wb_idx) zip comm_stq_wen).map{
80809c6f1ddSLingrui98      case (qe, v) => when (v) { qe := c_valid }
80909c6f1ddSLingrui98    }
81009c6f1ddSLingrui98  }
81109c6f1ddSLingrui98
812c5c5edaeSJenius  when (ifu_wb_valid) {
813c5c5edaeSJenius    ifuWbPtr_write := ifuWbPtr + 1.U
814c5c5edaeSJenius  }
81509c6f1ddSLingrui98
81609c6f1ddSLingrui98  ftb_entry_mem.io.raddr.head := ifu_wb_idx
81709c6f1ddSLingrui98  val has_false_hit = WireInit(false.B)
81809c6f1ddSLingrui98  when (RegNext(hit_pd_valid)) {
81909c6f1ddSLingrui98    // check for false hit
82009c6f1ddSLingrui98    val pred_ftb_entry = ftb_entry_mem.io.rdata.head
821eeb5ff92SLingrui98    val brSlots = pred_ftb_entry.brSlots
822eeb5ff92SLingrui98    val tailSlot = pred_ftb_entry.tailSlot
82309c6f1ddSLingrui98    // we check cfis that bpu predicted
82409c6f1ddSLingrui98
825eeb5ff92SLingrui98    // bpu predicted branches but denied by predecode
826eeb5ff92SLingrui98    val br_false_hit =
827eeb5ff92SLingrui98      brSlots.map{
828eeb5ff92SLingrui98        s => s.valid && !(pd_reg(s.offset).valid && pd_reg(s.offset).isBr)
829eeb5ff92SLingrui98      }.reduce(_||_) ||
830b37e4b45SLingrui98      (tailSlot.valid && pred_ftb_entry.tailSlot.sharing &&
831eeb5ff92SLingrui98        !(pd_reg(tailSlot.offset).valid && pd_reg(tailSlot.offset).isBr))
832eeb5ff92SLingrui98
833eeb5ff92SLingrui98    val jmpOffset = tailSlot.offset
83409c6f1ddSLingrui98    val jmp_pd = pd_reg(jmpOffset)
83509c6f1ddSLingrui98    val jal_false_hit = pred_ftb_entry.jmpValid &&
83609c6f1ddSLingrui98      ((pred_ftb_entry.isJal  && !(jmp_pd.valid && jmp_pd.isJal)) ||
83709c6f1ddSLingrui98       (pred_ftb_entry.isJalr && !(jmp_pd.valid && jmp_pd.isJalr)) ||
83809c6f1ddSLingrui98       (pred_ftb_entry.isCall && !(jmp_pd.valid && jmp_pd.isCall)) ||
83909c6f1ddSLingrui98       (pred_ftb_entry.isRet  && !(jmp_pd.valid && jmp_pd.isRet))
84009c6f1ddSLingrui98      )
84109c6f1ddSLingrui98
84209c6f1ddSLingrui98    has_false_hit := br_false_hit || jal_false_hit || hit_pd_mispred_reg
84365fddcf0Szoujr    XSDebug(has_false_hit, "FTB false hit by br or jal or hit_pd, startAddr: %x\n", pdWb.bits.pc(0))
84465fddcf0Szoujr
845352db50aSLingrui98    // assert(!has_false_hit)
84609c6f1ddSLingrui98  }
84709c6f1ddSLingrui98
84809c6f1ddSLingrui98  when (has_false_hit) {
84909c6f1ddSLingrui98    entry_hit_status(wb_idx_reg) := h_false_hit
85009c6f1ddSLingrui98  }
85109c6f1ddSLingrui98
85209c6f1ddSLingrui98
85309c6f1ddSLingrui98  // **********************************************************************
854b56f947eSYinan Xu  // ***************************** to backend *****************************
85509c6f1ddSLingrui98  // **********************************************************************
856b56f947eSYinan Xu  // to backend pc mem / target
857b56f947eSYinan Xu  io.toBackend.pc_mem_wen   := RegNext(last_cycle_bpu_in)
858b56f947eSYinan Xu  io.toBackend.pc_mem_waddr := RegNext(last_cycle_bpu_in_idx)
85988bc4f90SLingrui98  io.toBackend.pc_mem_wdata := RegNext(bpu_in_bypass_buf_for_ifu)
86009c6f1ddSLingrui98
86109c6f1ddSLingrui98  // *******************************************************************************
86209c6f1ddSLingrui98  // **************************** redirect from backend ****************************
86309c6f1ddSLingrui98  // *******************************************************************************
86409c6f1ddSLingrui98
86509c6f1ddSLingrui98  // redirect read cfiInfo, couples to redirectGen s2
8662e1be6e1SSteve Gou  ftq_redirect_sram.io.ren.init.last := backendRedirect.valid
8672e1be6e1SSteve Gou  ftq_redirect_sram.io.raddr.init.last := backendRedirect.bits.ftqIdx.value
86809c6f1ddSLingrui98
8692e1be6e1SSteve Gou  ftb_entry_mem.io.raddr.init.last := backendRedirect.bits.ftqIdx.value
87009c6f1ddSLingrui98
87109c6f1ddSLingrui98  val stage3CfiInfo = ftq_redirect_sram.io.rdata.init.last
872df5b4b8eSYinan Xu  val fromBackendRedirect = WireInit(backendRedirectReg)
87309c6f1ddSLingrui98  val backendRedirectCfi = fromBackendRedirect.bits.cfiUpdate
87409c6f1ddSLingrui98  backendRedirectCfi.fromFtqRedirectSram(stage3CfiInfo)
87509c6f1ddSLingrui98
87609c6f1ddSLingrui98  val r_ftb_entry = ftb_entry_mem.io.rdata.init.last
87709c6f1ddSLingrui98  val r_ftqOffset = fromBackendRedirect.bits.ftqOffset
87809c6f1ddSLingrui98
87909c6f1ddSLingrui98  when (entry_hit_status(fromBackendRedirect.bits.ftqIdx.value) === h_hit) {
88009c6f1ddSLingrui98    backendRedirectCfi.shift := PopCount(r_ftb_entry.getBrMaskByOffset(r_ftqOffset)) +&
88109c6f1ddSLingrui98      (backendRedirectCfi.pd.isBr && !r_ftb_entry.brIsSaved(r_ftqOffset) &&
882eeb5ff92SLingrui98      !r_ftb_entry.newBrCanNotInsert(r_ftqOffset))
88309c6f1ddSLingrui98
88409c6f1ddSLingrui98    backendRedirectCfi.addIntoHist := backendRedirectCfi.pd.isBr && (r_ftb_entry.brIsSaved(r_ftqOffset) ||
885eeb5ff92SLingrui98        !r_ftb_entry.newBrCanNotInsert(r_ftqOffset))
88609c6f1ddSLingrui98  }.otherwise {
88709c6f1ddSLingrui98    backendRedirectCfi.shift := (backendRedirectCfi.pd.isBr && backendRedirectCfi.taken).asUInt
88809c6f1ddSLingrui98    backendRedirectCfi.addIntoHist := backendRedirectCfi.pd.isBr.asUInt
88909c6f1ddSLingrui98  }
89009c6f1ddSLingrui98
89109c6f1ddSLingrui98
89209c6f1ddSLingrui98  // ***************************************************************************
89309c6f1ddSLingrui98  // **************************** redirect from ifu ****************************
89409c6f1ddSLingrui98  // ***************************************************************************
89509c6f1ddSLingrui98  val fromIfuRedirect = WireInit(0.U.asTypeOf(Valid(new Redirect)))
89609c6f1ddSLingrui98  fromIfuRedirect.valid := pdWb.valid && pdWb.bits.misOffset.valid && !backendFlush
89709c6f1ddSLingrui98  fromIfuRedirect.bits.ftqIdx := pdWb.bits.ftqIdx
89809c6f1ddSLingrui98  fromIfuRedirect.bits.ftqOffset := pdWb.bits.misOffset.bits
89909c6f1ddSLingrui98  fromIfuRedirect.bits.level := RedirectLevel.flushAfter
90009c6f1ddSLingrui98
90109c6f1ddSLingrui98  val ifuRedirectCfiUpdate = fromIfuRedirect.bits.cfiUpdate
90209c6f1ddSLingrui98  ifuRedirectCfiUpdate.pc := pdWb.bits.pc(pdWb.bits.misOffset.bits)
90309c6f1ddSLingrui98  ifuRedirectCfiUpdate.pd := pdWb.bits.pd(pdWb.bits.misOffset.bits)
90409c6f1ddSLingrui98  ifuRedirectCfiUpdate.predTaken := cfiIndex_vec(pdWb.bits.ftqIdx.value).valid
90509c6f1ddSLingrui98  ifuRedirectCfiUpdate.target := pdWb.bits.target
90609c6f1ddSLingrui98  ifuRedirectCfiUpdate.taken := pdWb.bits.cfiOffset.valid
90709c6f1ddSLingrui98  ifuRedirectCfiUpdate.isMisPred := pdWb.bits.misOffset.valid
90809c6f1ddSLingrui98
90909c6f1ddSLingrui98  val ifuRedirectReg = RegNext(fromIfuRedirect, init=0.U.asTypeOf(Valid(new Redirect)))
91009c6f1ddSLingrui98  val ifuRedirectToBpu = WireInit(ifuRedirectReg)
91109c6f1ddSLingrui98  ifuFlush := fromIfuRedirect.valid || ifuRedirectToBpu.valid
91209c6f1ddSLingrui98
91309c6f1ddSLingrui98  ftq_redirect_sram.io.ren.head := fromIfuRedirect.valid
91409c6f1ddSLingrui98  ftq_redirect_sram.io.raddr.head := fromIfuRedirect.bits.ftqIdx.value
91509c6f1ddSLingrui98
91609c6f1ddSLingrui98  ftb_entry_mem.io.raddr.head := fromIfuRedirect.bits.ftqIdx.value
91709c6f1ddSLingrui98
91809c6f1ddSLingrui98  val toBpuCfi = ifuRedirectToBpu.bits.cfiUpdate
91909c6f1ddSLingrui98  toBpuCfi.fromFtqRedirectSram(ftq_redirect_sram.io.rdata.head)
92009c6f1ddSLingrui98  when (ifuRedirectReg.bits.cfiUpdate.pd.isRet) {
92109c6f1ddSLingrui98    toBpuCfi.target := toBpuCfi.rasEntry.retAddr
92209c6f1ddSLingrui98  }
92309c6f1ddSLingrui98
92409c6f1ddSLingrui98  // *********************************************************************
92509c6f1ddSLingrui98  // **************************** wb from exu ****************************
92609c6f1ddSLingrui98  // *********************************************************************
92709c6f1ddSLingrui98
928b56f947eSYinan Xu  backendRedirect := io.fromBackend.redirect
9292e1be6e1SSteve Gou
93009c6f1ddSLingrui98  def extractRedirectInfo(wb: Valid[Redirect]) = {
9316bf9b30dSLingrui98    val ftqPtr = wb.bits.ftqIdx
93209c6f1ddSLingrui98    val ftqOffset = wb.bits.ftqOffset
93309c6f1ddSLingrui98    val taken = wb.bits.cfiUpdate.taken
93409c6f1ddSLingrui98    val mispred = wb.bits.cfiUpdate.isMisPred
9356bf9b30dSLingrui98    (wb.valid, ftqPtr, ftqOffset, taken, mispred)
93609c6f1ddSLingrui98  }
93709c6f1ddSLingrui98
93809c6f1ddSLingrui98  // fix mispredict entry
93909c6f1ddSLingrui98  val lastIsMispredict = RegNext(
940df5b4b8eSYinan Xu    backendRedirect.valid && backendRedirect.bits.level === RedirectLevel.flushAfter, init = false.B
94109c6f1ddSLingrui98  )
94209c6f1ddSLingrui98
94309c6f1ddSLingrui98  def updateCfiInfo(redirect: Valid[Redirect], isBackend: Boolean = true) = {
9446bf9b30dSLingrui98    val (r_valid, r_ptr, r_offset, r_taken, r_mispred) = extractRedirectInfo(redirect)
9456bf9b30dSLingrui98    val r_idx = r_ptr.value
94609c6f1ddSLingrui98    val cfiIndex_bits_wen = r_valid && r_taken && r_offset < cfiIndex_vec(r_idx).bits
94709c6f1ddSLingrui98    val cfiIndex_valid_wen = r_valid && r_offset === cfiIndex_vec(r_idx).bits
94809c6f1ddSLingrui98    when (cfiIndex_bits_wen || cfiIndex_valid_wen) {
94909c6f1ddSLingrui98      cfiIndex_vec(r_idx).valid := cfiIndex_bits_wen || cfiIndex_valid_wen && r_taken
9503f88c020SGuokai Chen    } .elsewhen (r_valid && !r_taken && r_offset =/= cfiIndex_vec(r_idx).bits) {
9513f88c020SGuokai Chen      cfiIndex_vec(r_idx).valid :=false.B
95209c6f1ddSLingrui98    }
95309c6f1ddSLingrui98    when (cfiIndex_bits_wen) {
95409c6f1ddSLingrui98      cfiIndex_vec(r_idx).bits := r_offset
95509c6f1ddSLingrui98    }
9566bf9b30dSLingrui98    newest_entry_target := redirect.bits.cfiUpdate.target
957873dc383SLingrui98    newest_entry_ptr := r_ptr
958b0ed7239SLingrui98    update_target(r_idx) := redirect.bits.cfiUpdate.target // TODO: remove this
95909c6f1ddSLingrui98    if (isBackend) {
96009c6f1ddSLingrui98      mispredict_vec(r_idx)(r_offset) := r_mispred
96109c6f1ddSLingrui98    }
96209c6f1ddSLingrui98  }
96309c6f1ddSLingrui98
96481e362d8SLingrui98  when(backendRedirectReg.valid) {
965df5b4b8eSYinan Xu    updateCfiInfo(backendRedirectReg)
96609c6f1ddSLingrui98  }.elsewhen (ifuRedirectToBpu.valid) {
96709c6f1ddSLingrui98    updateCfiInfo(ifuRedirectToBpu, isBackend=false)
96809c6f1ddSLingrui98  }
96909c6f1ddSLingrui98
97009c6f1ddSLingrui98  // ***********************************************************************************
97109c6f1ddSLingrui98  // **************************** flush ptr and state queue ****************************
97209c6f1ddSLingrui98  // ***********************************************************************************
97309c6f1ddSLingrui98
974df5b4b8eSYinan Xu  val redirectVec = VecInit(backendRedirect, fromIfuRedirect)
97509c6f1ddSLingrui98
97609c6f1ddSLingrui98  // when redirect, we should reset ptrs and status queues
97709c6f1ddSLingrui98  when(redirectVec.map(r => r.valid).reduce(_||_)){
9782f4a3aa4SLingrui98    val r = PriorityMux(redirectVec.map(r => (r.valid -> r.bits)))
97909c6f1ddSLingrui98    val notIfu = redirectVec.dropRight(1).map(r => r.valid).reduce(_||_)
9802f4a3aa4SLingrui98    val (idx, offset, flushItSelf) = (r.ftqIdx, r.ftqOffset, RedirectLevel.flushItself(r.level))
98109c6f1ddSLingrui98    val next = idx + 1.U
98209c6f1ddSLingrui98    bpuPtr := next
983dc270d3bSJenius    copied_bpu_ptr.map(_ := next)
984c5c5edaeSJenius    ifuPtr_write := next
985c5c5edaeSJenius    ifuWbPtr_write := next
986c5c5edaeSJenius    ifuPtrPlus1_write := idx + 2.U
9876bf9b30dSLingrui98    ifuPtrPlus2_write := idx + 3.U
9883f88c020SGuokai Chen
9893f88c020SGuokai Chen  }
9903f88c020SGuokai Chen  when(RegNext(redirectVec.map(r => r.valid).reduce(_||_))){
9913f88c020SGuokai Chen    val r = PriorityMux(redirectVec.map(r => (r.valid -> r.bits)))
9923f88c020SGuokai Chen    val notIfu = redirectVec.dropRight(1).map(r => r.valid).reduce(_||_)
9933f88c020SGuokai Chen    val (idx, offset, flushItSelf) = (r.ftqIdx, r.ftqOffset, RedirectLevel.flushItself(r.level))
9943f88c020SGuokai Chen    when (RegNext(notIfu)) {
9953f88c020SGuokai Chen      commitStateQueue(RegNext(idx.value)).zipWithIndex.foreach({ case (s, i) =>
9963f88c020SGuokai Chen        when(i.U > RegNext(offset) || i.U === RegNext(offset) && RegNext(flushItSelf)){
997b5808fc2Ssfencevma          s := c_invalid
99809c6f1ddSLingrui98        }
99909c6f1ddSLingrui98      })
100009c6f1ddSLingrui98    }
100109c6f1ddSLingrui98  }
100209c6f1ddSLingrui98
10033f88c020SGuokai Chen
100409c6f1ddSLingrui98  // only the valid bit is actually needed
1005df5b4b8eSYinan Xu  io.toIfu.redirect.bits    := backendRedirect.bits
100609c6f1ddSLingrui98  io.toIfu.redirect.valid   := stage2Flush
100709c6f1ddSLingrui98
100809c6f1ddSLingrui98  // commit
10099aca92b9SYinan Xu  for (c <- io.fromBackend.rob_commits) {
101009c6f1ddSLingrui98    when(c.valid) {
101109c6f1ddSLingrui98      commitStateQueue(c.bits.ftqIdx.value)(c.bits.ftqOffset) := c_commited
101288825c5cSYinan Xu      // TODO: remove this
101388825c5cSYinan Xu      // For instruction fusions, we also update the next instruction
1014c3abb8b6SYinan Xu      when (c.bits.commitType === 4.U) {
101588825c5cSYinan Xu        commitStateQueue(c.bits.ftqIdx.value)(c.bits.ftqOffset + 1.U) := c_commited
1016c3abb8b6SYinan Xu      }.elsewhen(c.bits.commitType === 5.U) {
101788825c5cSYinan Xu        commitStateQueue(c.bits.ftqIdx.value)(c.bits.ftqOffset + 2.U) := c_commited
1018c3abb8b6SYinan Xu      }.elsewhen(c.bits.commitType === 6.U) {
101988825c5cSYinan Xu        val index = (c.bits.ftqIdx + 1.U).value
102088825c5cSYinan Xu        commitStateQueue(index)(0) := c_commited
1021c3abb8b6SYinan Xu      }.elsewhen(c.bits.commitType === 7.U) {
102288825c5cSYinan Xu        val index = (c.bits.ftqIdx + 1.U).value
102388825c5cSYinan Xu        commitStateQueue(index)(1) := c_commited
102488825c5cSYinan Xu      }
102509c6f1ddSLingrui98    }
102609c6f1ddSLingrui98  }
102709c6f1ddSLingrui98
102809c6f1ddSLingrui98  // ****************************************************************
102909c6f1ddSLingrui98  // **************************** to bpu ****************************
103009c6f1ddSLingrui98  // ****************************************************************
103109c6f1ddSLingrui98
103251981c77SbugGenerator  io.toBpu.redirect := Mux(fromBackendRedirect.valid, fromBackendRedirect, ifuRedirectToBpu)
103309c6f1ddSLingrui98
103402f21c16SLingrui98  val may_have_stall_from_bpu = Wire(Bool())
103502f21c16SLingrui98  val bpu_ftb_update_stall = RegInit(0.U(2.W)) // 2-cycle stall, so we need 3 states
103602f21c16SLingrui98  may_have_stall_from_bpu := bpu_ftb_update_stall =/= 0.U
1037b5808fc2Ssfencevma  val canCommit = commPtr =/= ifuWbPtr && !may_have_stall_from_bpu &&
103809c6f1ddSLingrui98    Cat(commitStateQueue(commPtr.value).map(s => {
1039b5808fc2Ssfencevma      s === c_invalid || s === c_commited
1040b5808fc2Ssfencevma    })).andR()
104109c6f1ddSLingrui98
10421d1e6d4dSJenius  val mmioReadPtr = io.mmioCommitRead.mmioFtqPtr
10431d1e6d4dSJenius  val mmioLastCommit = isBefore(commPtr, mmioReadPtr) && (isAfter(ifuPtr,mmioReadPtr)  ||  mmioReadPtr ===   ifuPtr) &&
1044b5808fc2Ssfencevma                       Cat(commitStateQueue(mmioReadPtr.value).map(s => { s === c_invalid || s === c_commited})).andR()
10451d1e6d4dSJenius  io.mmioCommitRead.mmioLastCommit := RegNext(mmioLastCommit)
10461d1e6d4dSJenius
104709c6f1ddSLingrui98  // commit reads
1048c5c5edaeSJenius  val commit_pc_bundle = RegNext(ftq_pc_mem.io.commPtr_rdata)
104981101dc4SLingrui98  val commit_target =
105034cf890eSLingrui98    Mux(RegNext(commPtr === newest_entry_ptr),
105134cf890eSLingrui98      RegNext(newest_entry_target),
105281101dc4SLingrui98      RegNext(ftq_pc_mem.io.commPtrPlus1_rdata.startAddr))
105309c6f1ddSLingrui98  ftq_pd_mem.io.raddr.last := commPtr.value
105409c6f1ddSLingrui98  val commit_pd = ftq_pd_mem.io.rdata.last
105509c6f1ddSLingrui98  ftq_redirect_sram.io.ren.last := canCommit
105609c6f1ddSLingrui98  ftq_redirect_sram.io.raddr.last := commPtr.value
105709c6f1ddSLingrui98  val commit_spec_meta = ftq_redirect_sram.io.rdata.last
105809c6f1ddSLingrui98  ftq_meta_1r_sram.io.ren(0) := canCommit
105909c6f1ddSLingrui98  ftq_meta_1r_sram.io.raddr(0) := commPtr.value
106009c6f1ddSLingrui98  val commit_meta = ftq_meta_1r_sram.io.rdata(0)
106109c6f1ddSLingrui98  ftb_entry_mem.io.raddr.last := commPtr.value
106209c6f1ddSLingrui98  val commit_ftb_entry = ftb_entry_mem.io.rdata.last
106309c6f1ddSLingrui98
106409c6f1ddSLingrui98  // need one cycle to read mem and srams
106509c6f1ddSLingrui98  val do_commit_ptr = RegNext(commPtr)
10665371700eSzoujr  val do_commit = RegNext(canCommit, init=false.B)
10676bf9b30dSLingrui98  when (canCommit) {
10686bf9b30dSLingrui98    commPtr_write := commPtrPlus1
10696bf9b30dSLingrui98    commPtrPlus1_write := commPtrPlus1 + 1.U
10706bf9b30dSLingrui98  }
107109c6f1ddSLingrui98  val commit_state = RegNext(commitStateQueue(commPtr.value))
10725371700eSzoujr  val can_commit_cfi = WireInit(cfiIndex_vec(commPtr.value))
10733f88c020SGuokai Chen  //
10743f88c020SGuokai Chen  //when (commitStateQueue(commPtr.value)(can_commit_cfi.bits) =/= c_commited) {
10753f88c020SGuokai Chen  //  can_commit_cfi.valid := false.B
10763f88c020SGuokai Chen  //}
10775371700eSzoujr  val commit_cfi = RegNext(can_commit_cfi)
10783f88c020SGuokai Chen  val debug_cfi = RegNext(commitStateQueue(commPtr.value)(can_commit_cfi.bits) =/= c_commited && can_commit_cfi.valid)
107909c6f1ddSLingrui98
108009c6f1ddSLingrui98  val commit_mispredict = VecInit((RegNext(mispredict_vec(commPtr.value)) zip commit_state).map {
108109c6f1ddSLingrui98    case (mis, state) => mis && state === c_commited
108209c6f1ddSLingrui98  })
10835371700eSzoujr  val can_commit_hit = entry_hit_status(commPtr.value)
10845371700eSzoujr  val commit_hit = RegNext(can_commit_hit)
10855fa3df0dSLingrui98  val diff_commit_target = RegNext(update_target(commPtr.value)) // TODO: remove this
1086edc18578SLingrui98  val commit_stage = RegNext(pred_stage(commPtr.value))
108709c6f1ddSLingrui98  val commit_valid = commit_hit === h_hit || commit_cfi.valid // hit or taken
108809c6f1ddSLingrui98
10895371700eSzoujr  val to_bpu_hit = can_commit_hit === h_hit || can_commit_hit === h_false_hit
109002f21c16SLingrui98  switch (bpu_ftb_update_stall) {
109102f21c16SLingrui98    is (0.U) {
109202f21c16SLingrui98      when (can_commit_cfi.valid && !to_bpu_hit && canCommit) {
109302f21c16SLingrui98        bpu_ftb_update_stall := 2.U // 2-cycle stall
109402f21c16SLingrui98      }
109502f21c16SLingrui98    }
109602f21c16SLingrui98    is (2.U) {
109702f21c16SLingrui98      bpu_ftb_update_stall := 1.U
109802f21c16SLingrui98    }
109902f21c16SLingrui98    is (1.U) {
110002f21c16SLingrui98      bpu_ftb_update_stall := 0.U
110102f21c16SLingrui98    }
110202f21c16SLingrui98    is (3.U) {
110302f21c16SLingrui98      XSError(true.B, "bpu_ftb_update_stall should be 0, 1 or 2")
110402f21c16SLingrui98    }
110502f21c16SLingrui98  }
110609c6f1ddSLingrui98
1107b0ed7239SLingrui98  // TODO: remove this
1108b0ed7239SLingrui98  XSError(do_commit && diff_commit_target =/= commit_target, "\ncommit target should be the same as update target\n")
1109b0ed7239SLingrui98
111009c6f1ddSLingrui98  io.toBpu.update := DontCare
111109c6f1ddSLingrui98  io.toBpu.update.valid := commit_valid && do_commit
111209c6f1ddSLingrui98  val update = io.toBpu.update.bits
111309c6f1ddSLingrui98  update.false_hit   := commit_hit === h_false_hit
111409c6f1ddSLingrui98  update.pc          := commit_pc_bundle.startAddr
111509c6f1ddSLingrui98  update.meta        := commit_meta.meta
1116803124a6SLingrui98  update.cfi_idx     := commit_cfi
11178ffcd86aSLingrui98  update.full_target := commit_target
1118edc18578SLingrui98  update.from_stage  := commit_stage
1119c2d1ec7dSLingrui98  update.spec_info   := commit_spec_meta
11203f88c020SGuokai Chen  XSError(commit_valid && do_commit && debug_cfi, "\ncommit cfi can be non c_commited\n")
112109c6f1ddSLingrui98
112209c6f1ddSLingrui98  val commit_real_hit = commit_hit === h_hit
112309c6f1ddSLingrui98  val update_ftb_entry = update.ftb_entry
112409c6f1ddSLingrui98
112509c6f1ddSLingrui98  val ftbEntryGen = Module(new FTBEntryGen).io
112609c6f1ddSLingrui98  ftbEntryGen.start_addr     := commit_pc_bundle.startAddr
112709c6f1ddSLingrui98  ftbEntryGen.old_entry      := commit_ftb_entry
112809c6f1ddSLingrui98  ftbEntryGen.pd             := commit_pd
112909c6f1ddSLingrui98  ftbEntryGen.cfiIndex       := commit_cfi
113009c6f1ddSLingrui98  ftbEntryGen.target         := commit_target
113109c6f1ddSLingrui98  ftbEntryGen.hit            := commit_real_hit
113209c6f1ddSLingrui98  ftbEntryGen.mispredict_vec := commit_mispredict
113309c6f1ddSLingrui98
113409c6f1ddSLingrui98  update_ftb_entry         := ftbEntryGen.new_entry
113509c6f1ddSLingrui98  update.new_br_insert_pos := ftbEntryGen.new_br_insert_pos
113609c6f1ddSLingrui98  update.mispred_mask      := ftbEntryGen.mispred_mask
113709c6f1ddSLingrui98  update.old_entry         := ftbEntryGen.is_old_entry
1138edc18578SLingrui98  update.pred_hit          := commit_hit === h_hit || commit_hit === h_false_hit
1139803124a6SLingrui98  update.br_taken_mask     := ftbEntryGen.taken_mask
1140803124a6SLingrui98  update.jmp_taken         := ftbEntryGen.jmp_taken
1141b37e4b45SLingrui98
1142803124a6SLingrui98  // update.full_pred.fromFtbEntry(ftbEntryGen.new_entry, update.pc)
1143803124a6SLingrui98  // update.full_pred.jalr_target := commit_target
1144803124a6SLingrui98  // update.full_pred.hit := true.B
1145803124a6SLingrui98  // when (update.full_pred.is_jalr) {
1146803124a6SLingrui98  //   update.full_pred.targets.last := commit_target
1147803124a6SLingrui98  // }
114809c6f1ddSLingrui98
1149e30430c2SJay  // ****************************************************************
1150e30430c2SJay  // *********************** to prefetch ****************************
1151e30430c2SJay  // ****************************************************************
1152e30430c2SJay
11539c8f16f2SJenius  ftq_pc_mem.io.other_raddrs(0) := DontCare
1154e30430c2SJay  if(cacheParams.hasPrefetch){
1155e30430c2SJay    val prefetchPtr = RegInit(FtqPtr(false.B, 0.U))
1156378f00d9SJenius    val diff_prefetch_addr = WireInit(update_target(prefetchPtr.value)) //TODO: remove this
1157378f00d9SJenius
1158e30430c2SJay    prefetchPtr := prefetchPtr + io.toPrefetch.req.fire()
1159e30430c2SJay
1160378f00d9SJenius    ftq_pc_mem.io.other_raddrs(0) := prefetchPtr.value
1161378f00d9SJenius
1162e30430c2SJay    when (bpu_s2_resp.valid && bpu_s2_resp.hasRedirect && !isBefore(prefetchPtr, bpu_s2_resp.ftq_idx)) {
1163e30430c2SJay      prefetchPtr := bpu_s2_resp.ftq_idx
1164e30430c2SJay    }
1165e30430c2SJay
1166cb4f77ceSLingrui98    when (bpu_s3_resp.valid && bpu_s3_resp.hasRedirect && !isBefore(prefetchPtr, bpu_s3_resp.ftq_idx)) {
1167cb4f77ceSLingrui98      prefetchPtr := bpu_s3_resp.ftq_idx
1168a3c55791SJinYue      // XSError(true.B, "\ns3_redirect mechanism not implemented!\n")
1169cb4f77ceSLingrui98    }
1170de7689fcSJay
1171f63797a4SLingrui98
1172f63797a4SLingrui98    val prefetch_is_to_send = WireInit(entry_fetch_status(prefetchPtr.value) === f_to_send)
1173f56177cbSJenius    val prefetch_addr = Wire(UInt(VAddrBits.W))
1174f63797a4SLingrui98
1175f63797a4SLingrui98    when (last_cycle_bpu_in && bpu_in_bypass_ptr === prefetchPtr) {
1176f63797a4SLingrui98      prefetch_is_to_send := true.B
11776bf9b30dSLingrui98      prefetch_addr := last_cycle_bpu_target
1178378f00d9SJenius      diff_prefetch_addr := last_cycle_bpu_target // TODO: remove this
1179f56177cbSJenius    }.otherwise{
1180f56177cbSJenius      prefetch_addr := RegNext( ftq_pc_mem.io.other_rdatas(0).startAddr)
1181f63797a4SLingrui98    }
1182f63797a4SLingrui98    io.toPrefetch.req.valid := prefetchPtr =/= bpuPtr && prefetch_is_to_send
1183f63797a4SLingrui98    io.toPrefetch.req.bits.target := prefetch_addr
1184de7689fcSJay
1185de7689fcSJay    when(redirectVec.map(r => r.valid).reduce(_||_)){
1186de7689fcSJay      val r = PriorityMux(redirectVec.map(r => (r.valid -> r.bits)))
1187de7689fcSJay      val next = r.ftqIdx + 1.U
1188de7689fcSJay      prefetchPtr := next
1189de7689fcSJay    }
1190de7689fcSJay
1191378f00d9SJenius    // TODO: remove this
119210f8eea3SLingrui98    // XSError(io.toPrefetch.req.valid && diff_prefetch_addr =/= prefetch_addr,
119310f8eea3SLingrui98    //         f"\nprefetch_req_target wrong! prefetchPtr: ${prefetchPtr}, prefetch_addr: ${Hexadecimal(prefetch_addr)} diff_prefetch_addr: ${Hexadecimal(diff_prefetch_addr)}\n")
1194378f00d9SJenius
1195378f00d9SJenius
1196de7689fcSJay    XSError(isBefore(bpuPtr, prefetchPtr) && !isFull(bpuPtr, prefetchPtr), "\nprefetchPtr is before bpuPtr!\n")
1197e8747464SJenius    XSError(isBefore(prefetchPtr, ifuPtr) && !isFull(ifuPtr, prefetchPtr), "\nifuPtr is before prefetchPtr!\n")
1198de7689fcSJay  }
1199de7689fcSJay  else {
1200de7689fcSJay    io.toPrefetch.req <> DontCare
1201de7689fcSJay  }
1202de7689fcSJay
120309c6f1ddSLingrui98  // ******************************************************************************
120409c6f1ddSLingrui98  // **************************** commit perf counters ****************************
120509c6f1ddSLingrui98  // ******************************************************************************
120609c6f1ddSLingrui98
120709c6f1ddSLingrui98  val commit_inst_mask    = VecInit(commit_state.map(c => c === c_commited && do_commit)).asUInt
120809c6f1ddSLingrui98  val commit_mispred_mask = commit_mispredict.asUInt
120909c6f1ddSLingrui98  val commit_not_mispred_mask = ~commit_mispred_mask
121009c6f1ddSLingrui98
121109c6f1ddSLingrui98  val commit_br_mask = commit_pd.brMask.asUInt
121209c6f1ddSLingrui98  val commit_jmp_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.jmpInfo.valid.asTypeOf(UInt(1.W)))
121309c6f1ddSLingrui98  val commit_cfi_mask = (commit_br_mask | commit_jmp_mask)
121409c6f1ddSLingrui98
121509c6f1ddSLingrui98  val mbpInstrs = commit_inst_mask & commit_cfi_mask
121609c6f1ddSLingrui98
121709c6f1ddSLingrui98  val mbpRights = mbpInstrs & commit_not_mispred_mask
121809c6f1ddSLingrui98  val mbpWrongs = mbpInstrs & commit_mispred_mask
121909c6f1ddSLingrui98
122009c6f1ddSLingrui98  io.bpuInfo.bpRight := PopCount(mbpRights)
122109c6f1ddSLingrui98  io.bpuInfo.bpWrong := PopCount(mbpWrongs)
122209c6f1ddSLingrui98
1223*da3bf434SMaxpicca-Li  val isWriteFTQTable = WireInit(Constantin.createRecord("isWriteFTQTable" + p(XSCoreParamsKey).HartId.toString))
122451532d8bSGuokai Chen  val ftqBranchTraceDB = ChiselDB.createTable("FTQTable" + p(XSCoreParamsKey).HartId.toString, new FtqDebugBundle)
122509c6f1ddSLingrui98  // Cfi Info
122609c6f1ddSLingrui98  for (i <- 0 until PredictWidth) {
122709c6f1ddSLingrui98    val pc = commit_pc_bundle.startAddr + (i * instBytes).U
122809c6f1ddSLingrui98    val v = commit_state(i) === c_commited
122909c6f1ddSLingrui98    val isBr = commit_pd.brMask(i)
123009c6f1ddSLingrui98    val isJmp = commit_pd.jmpInfo.valid && commit_pd.jmpOffset === i.U
123109c6f1ddSLingrui98    val isCfi = isBr || isJmp
123209c6f1ddSLingrui98    val isTaken = commit_cfi.valid && commit_cfi.bits === i.U
123309c6f1ddSLingrui98    val misPred = commit_mispredict(i)
1234c2ad24ebSLingrui98    // val ghist = commit_spec_meta.ghist.predHist
1235c2ad24ebSLingrui98    val histPtr = commit_spec_meta.histPtr
123609c6f1ddSLingrui98    val predCycle = commit_meta.meta(63, 0)
123709c6f1ddSLingrui98    val target = commit_target
123809c6f1ddSLingrui98
123909c6f1ddSLingrui98    val brIdx = OHToUInt(Reverse(Cat(update_ftb_entry.brValids.zip(update_ftb_entry.brOffset).map{case(v, offset) => v && offset === i.U})))
124009c6f1ddSLingrui98    val inFtbEntry = update_ftb_entry.brValids.zip(update_ftb_entry.brOffset).map{case(v, offset) => v && offset === i.U}.reduce(_||_)
124109c6f1ddSLingrui98    val addIntoHist = ((commit_hit === h_hit) && inFtbEntry) || ((!(commit_hit === h_hit) && i.U === commit_cfi.bits && isBr && commit_cfi.valid))
124209c6f1ddSLingrui98    XSDebug(v && do_commit && isCfi, p"cfi_update: isBr(${isBr}) pc(${Hexadecimal(pc)}) " +
1243c2ad24ebSLingrui98    p"taken(${isTaken}) mispred(${misPred}) cycle($predCycle) hist(${histPtr.value}) " +
124409c6f1ddSLingrui98    p"startAddr(${Hexadecimal(commit_pc_bundle.startAddr)}) AddIntoHist(${addIntoHist}) " +
124509c6f1ddSLingrui98    p"brInEntry(${inFtbEntry}) brIdx(${brIdx}) target(${Hexadecimal(target)})\n")
124651532d8bSGuokai Chen
124751532d8bSGuokai Chen    val logbundle = Wire(new FtqDebugBundle)
124851532d8bSGuokai Chen    logbundle.pc := pc
124951532d8bSGuokai Chen    logbundle.target := target
125051532d8bSGuokai Chen    logbundle.isBr := isBr
125151532d8bSGuokai Chen    logbundle.isJmp := isJmp
125251532d8bSGuokai Chen    logbundle.isCall := isJmp && commit_pd.hasCall
125351532d8bSGuokai Chen    logbundle.isRet := isJmp && commit_pd.hasRet
125451532d8bSGuokai Chen    logbundle.misPred := misPred
125551532d8bSGuokai Chen    logbundle.isTaken := isTaken
125651532d8bSGuokai Chen    logbundle.predStage := commit_stage
125751532d8bSGuokai Chen
125851532d8bSGuokai Chen    ftqBranchTraceDB.log(
125951532d8bSGuokai Chen      data = logbundle /* hardware of type T */,
1260*da3bf434SMaxpicca-Li      en = isWriteFTQTable.orR && v && do_commit && isCfi,
126151532d8bSGuokai Chen      site = "FTQ" + p(XSCoreParamsKey).HartId.toString,
126251532d8bSGuokai Chen      clock = clock,
126351532d8bSGuokai Chen      reset = reset
126451532d8bSGuokai Chen    )
126509c6f1ddSLingrui98  }
126609c6f1ddSLingrui98
126709c6f1ddSLingrui98  val enq = io.fromBpu.resp
12682e1be6e1SSteve Gou  val perf_redirect = backendRedirect
126909c6f1ddSLingrui98
127009c6f1ddSLingrui98  XSPerfAccumulate("entry", validEntries)
127109c6f1ddSLingrui98  XSPerfAccumulate("bpu_to_ftq_stall", enq.valid && !enq.ready)
127209c6f1ddSLingrui98  XSPerfAccumulate("mispredictRedirect", perf_redirect.valid && RedirectLevel.flushAfter === perf_redirect.bits.level)
127309c6f1ddSLingrui98  XSPerfAccumulate("replayRedirect", perf_redirect.valid && RedirectLevel.flushItself(perf_redirect.bits.level))
127409c6f1ddSLingrui98  XSPerfAccumulate("predecodeRedirect", fromIfuRedirect.valid)
127509c6f1ddSLingrui98
127609c6f1ddSLingrui98  XSPerfAccumulate("to_ifu_bubble", io.toIfu.req.ready && !io.toIfu.req.valid)
127709c6f1ddSLingrui98
127809c6f1ddSLingrui98  XSPerfAccumulate("to_ifu_stall", io.toIfu.req.valid && !io.toIfu.req.ready)
127909c6f1ddSLingrui98  XSPerfAccumulate("from_bpu_real_bubble", !enq.valid && enq.ready && allowBpuIn)
128012cedb6fSLingrui98  XSPerfAccumulate("bpu_to_ifu_bubble", bpuPtr === ifuPtr)
128109c6f1ddSLingrui98
128209c6f1ddSLingrui98  val from_bpu = io.fromBpu.resp.bits
1283c2d1ec7dSLingrui98  def in_entry_len_map_gen(resp: BpuToFtqBundle)(stage: String) = {
1284c2d1ec7dSLingrui98    val entry_len = (resp.last_stage_ftb_entry.getFallThrough(resp.s3.pc) - resp.s3.pc) >> instOffsetBits
128509c6f1ddSLingrui98    val entry_len_recording_vec = (1 to PredictWidth+1).map(i => entry_len === i.U)
128609c6f1ddSLingrui98    val entry_len_map = (1 to PredictWidth+1).map(i =>
1287c2d1ec7dSLingrui98      f"${stage}_ftb_entry_len_$i" -> (entry_len_recording_vec(i-1) && resp.s3.valid)
128809c6f1ddSLingrui98    ).foldLeft(Map[String, UInt]())(_+_)
128909c6f1ddSLingrui98    entry_len_map
129009c6f1ddSLingrui98  }
1291c2d1ec7dSLingrui98  val s3_entry_len_map = in_entry_len_map_gen(from_bpu)("s3")
129209c6f1ddSLingrui98
129309c6f1ddSLingrui98  val to_ifu = io.toIfu.req.bits
129409c6f1ddSLingrui98
129509c6f1ddSLingrui98
129609c6f1ddSLingrui98
129709c6f1ddSLingrui98  val commit_num_inst_recording_vec = (1 to PredictWidth).map(i => PopCount(commit_inst_mask) === i.U)
129809c6f1ddSLingrui98  val commit_num_inst_map = (1 to PredictWidth).map(i =>
129909c6f1ddSLingrui98    f"commit_num_inst_$i" -> (commit_num_inst_recording_vec(i-1) && do_commit)
130009c6f1ddSLingrui98  ).foldLeft(Map[String, UInt]())(_+_)
130109c6f1ddSLingrui98
130209c6f1ddSLingrui98
130309c6f1ddSLingrui98
130409c6f1ddSLingrui98  val commit_jal_mask  = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasJal.asTypeOf(UInt(1.W)))
130509c6f1ddSLingrui98  val commit_jalr_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasJalr.asTypeOf(UInt(1.W)))
130609c6f1ddSLingrui98  val commit_call_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasCall.asTypeOf(UInt(1.W)))
130709c6f1ddSLingrui98  val commit_ret_mask  = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasRet.asTypeOf(UInt(1.W)))
130809c6f1ddSLingrui98
130909c6f1ddSLingrui98
131009c6f1ddSLingrui98  val mbpBRights = mbpRights & commit_br_mask
131109c6f1ddSLingrui98  val mbpJRights = mbpRights & commit_jal_mask
131209c6f1ddSLingrui98  val mbpIRights = mbpRights & commit_jalr_mask
131309c6f1ddSLingrui98  val mbpCRights = mbpRights & commit_call_mask
131409c6f1ddSLingrui98  val mbpRRights = mbpRights & commit_ret_mask
131509c6f1ddSLingrui98
131609c6f1ddSLingrui98  val mbpBWrongs = mbpWrongs & commit_br_mask
131709c6f1ddSLingrui98  val mbpJWrongs = mbpWrongs & commit_jal_mask
131809c6f1ddSLingrui98  val mbpIWrongs = mbpWrongs & commit_jalr_mask
131909c6f1ddSLingrui98  val mbpCWrongs = mbpWrongs & commit_call_mask
132009c6f1ddSLingrui98  val mbpRWrongs = mbpWrongs & commit_ret_mask
132109c6f1ddSLingrui98
13221d7e5011SLingrui98  val commit_pred_stage = RegNext(pred_stage(commPtr.value))
13231d7e5011SLingrui98
13241d7e5011SLingrui98  def pred_stage_map(src: UInt, name: String) = {
13251d7e5011SLingrui98    (0 until numBpStages).map(i =>
13261d7e5011SLingrui98      f"${name}_stage_${i+1}" -> PopCount(src.asBools.map(_ && commit_pred_stage === BP_STAGES(i)))
13271d7e5011SLingrui98    ).foldLeft(Map[String, UInt]())(_+_)
13281d7e5011SLingrui98  }
13291d7e5011SLingrui98
13301d7e5011SLingrui98  val mispred_stage_map      = pred_stage_map(mbpWrongs,  "mispredict")
13311d7e5011SLingrui98  val br_mispred_stage_map   = pred_stage_map(mbpBWrongs, "br_mispredict")
13321d7e5011SLingrui98  val jalr_mispred_stage_map = pred_stage_map(mbpIWrongs, "jalr_mispredict")
13331d7e5011SLingrui98  val correct_stage_map      = pred_stage_map(mbpRights,  "correct")
13341d7e5011SLingrui98  val br_correct_stage_map   = pred_stage_map(mbpBRights, "br_correct")
13351d7e5011SLingrui98  val jalr_correct_stage_map = pred_stage_map(mbpIRights, "jalr_correct")
13361d7e5011SLingrui98
133709c6f1ddSLingrui98  val update_valid = io.toBpu.update.valid
133809c6f1ddSLingrui98  def u(cond: Bool) = update_valid && cond
133909c6f1ddSLingrui98  val ftb_false_hit = u(update.false_hit)
134065fddcf0Szoujr  // assert(!ftb_false_hit)
134109c6f1ddSLingrui98  val ftb_hit = u(commit_hit === h_hit)
134209c6f1ddSLingrui98
134309c6f1ddSLingrui98  val ftb_new_entry = u(ftbEntryGen.is_init_entry)
1344b37e4b45SLingrui98  val ftb_new_entry_only_br = ftb_new_entry && !update_ftb_entry.jmpValid
1345b37e4b45SLingrui98  val ftb_new_entry_only_jmp = ftb_new_entry && !update_ftb_entry.brValids(0)
1346b37e4b45SLingrui98  val ftb_new_entry_has_br_and_jmp = ftb_new_entry && update_ftb_entry.brValids(0) && update_ftb_entry.jmpValid
134709c6f1ddSLingrui98
134809c6f1ddSLingrui98  val ftb_old_entry = u(ftbEntryGen.is_old_entry)
134909c6f1ddSLingrui98
135009c6f1ddSLingrui98  val ftb_modified_entry = u(ftbEntryGen.is_new_br || ftbEntryGen.is_jalr_target_modified || ftbEntryGen.is_always_taken_modified)
135109c6f1ddSLingrui98  val ftb_modified_entry_new_br = u(ftbEntryGen.is_new_br)
135209c6f1ddSLingrui98  val ftb_modified_entry_jalr_target_modified = u(ftbEntryGen.is_jalr_target_modified)
135309c6f1ddSLingrui98  val ftb_modified_entry_br_full = ftb_modified_entry && ftbEntryGen.is_br_full
135409c6f1ddSLingrui98  val ftb_modified_entry_always_taken = ftb_modified_entry && ftbEntryGen.is_always_taken_modified
135509c6f1ddSLingrui98
135609c6f1ddSLingrui98  val ftb_entry_len = (ftbEntryGen.new_entry.getFallThrough(update.pc) - update.pc) >> instOffsetBits
135709c6f1ddSLingrui98  val ftb_entry_len_recording_vec = (1 to PredictWidth+1).map(i => ftb_entry_len === i.U)
135809c6f1ddSLingrui98  val ftb_init_entry_len_map = (1 to PredictWidth+1).map(i =>
135909c6f1ddSLingrui98    f"ftb_init_entry_len_$i" -> (ftb_entry_len_recording_vec(i-1) && ftb_new_entry)
136009c6f1ddSLingrui98  ).foldLeft(Map[String, UInt]())(_+_)
136109c6f1ddSLingrui98  val ftb_modified_entry_len_map = (1 to PredictWidth+1).map(i =>
136209c6f1ddSLingrui98    f"ftb_modified_entry_len_$i" -> (ftb_entry_len_recording_vec(i-1) && ftb_modified_entry)
136309c6f1ddSLingrui98  ).foldLeft(Map[String, UInt]())(_+_)
136409c6f1ddSLingrui98
136509c6f1ddSLingrui98  val ftq_occupancy_map = (0 to FtqSize).map(i =>
136609c6f1ddSLingrui98    f"ftq_has_entry_$i" ->( validEntries === i.U)
136709c6f1ddSLingrui98  ).foldLeft(Map[String, UInt]())(_+_)
136809c6f1ddSLingrui98
136909c6f1ddSLingrui98  val perfCountsMap = Map(
137009c6f1ddSLingrui98    "BpInstr" -> PopCount(mbpInstrs),
137109c6f1ddSLingrui98    "BpBInstr" -> PopCount(mbpBRights | mbpBWrongs),
137209c6f1ddSLingrui98    "BpRight"  -> PopCount(mbpRights),
137309c6f1ddSLingrui98    "BpWrong"  -> PopCount(mbpWrongs),
137409c6f1ddSLingrui98    "BpBRight" -> PopCount(mbpBRights),
137509c6f1ddSLingrui98    "BpBWrong" -> PopCount(mbpBWrongs),
137609c6f1ddSLingrui98    "BpJRight" -> PopCount(mbpJRights),
137709c6f1ddSLingrui98    "BpJWrong" -> PopCount(mbpJWrongs),
137809c6f1ddSLingrui98    "BpIRight" -> PopCount(mbpIRights),
137909c6f1ddSLingrui98    "BpIWrong" -> PopCount(mbpIWrongs),
138009c6f1ddSLingrui98    "BpCRight" -> PopCount(mbpCRights),
138109c6f1ddSLingrui98    "BpCWrong" -> PopCount(mbpCWrongs),
138209c6f1ddSLingrui98    "BpRRight" -> PopCount(mbpRRights),
138309c6f1ddSLingrui98    "BpRWrong" -> PopCount(mbpRWrongs),
138409c6f1ddSLingrui98
138509c6f1ddSLingrui98    "ftb_false_hit"                -> PopCount(ftb_false_hit),
138609c6f1ddSLingrui98    "ftb_hit"                      -> PopCount(ftb_hit),
138709c6f1ddSLingrui98    "ftb_new_entry"                -> PopCount(ftb_new_entry),
138809c6f1ddSLingrui98    "ftb_new_entry_only_br"        -> PopCount(ftb_new_entry_only_br),
138909c6f1ddSLingrui98    "ftb_new_entry_only_jmp"       -> PopCount(ftb_new_entry_only_jmp),
139009c6f1ddSLingrui98    "ftb_new_entry_has_br_and_jmp" -> PopCount(ftb_new_entry_has_br_and_jmp),
139109c6f1ddSLingrui98    "ftb_old_entry"                -> PopCount(ftb_old_entry),
139209c6f1ddSLingrui98    "ftb_modified_entry"           -> PopCount(ftb_modified_entry),
139309c6f1ddSLingrui98    "ftb_modified_entry_new_br"    -> PopCount(ftb_modified_entry_new_br),
139409c6f1ddSLingrui98    "ftb_jalr_target_modified"     -> PopCount(ftb_modified_entry_jalr_target_modified),
139509c6f1ddSLingrui98    "ftb_modified_entry_br_full"   -> PopCount(ftb_modified_entry_br_full),
139609c6f1ddSLingrui98    "ftb_modified_entry_always_taken" -> PopCount(ftb_modified_entry_always_taken)
1397c2d1ec7dSLingrui98  ) ++ ftb_init_entry_len_map ++ ftb_modified_entry_len_map ++
1398cb4f77ceSLingrui98  s3_entry_len_map ++ commit_num_inst_map ++ ftq_occupancy_map ++
13991d7e5011SLingrui98  mispred_stage_map ++ br_mispred_stage_map ++ jalr_mispred_stage_map ++
14001d7e5011SLingrui98  correct_stage_map ++ br_correct_stage_map ++ jalr_correct_stage_map
140109c6f1ddSLingrui98
140209c6f1ddSLingrui98  for((key, value) <- perfCountsMap) {
140309c6f1ddSLingrui98    XSPerfAccumulate(key, value)
140409c6f1ddSLingrui98  }
140509c6f1ddSLingrui98
140609c6f1ddSLingrui98  // --------------------------- Debug --------------------------------
140709c6f1ddSLingrui98  // XSDebug(enq_fire, p"enq! " + io.fromBpu.resp.bits.toPrintable)
140809c6f1ddSLingrui98  XSDebug(io.toIfu.req.fire, p"fire to ifu " + io.toIfu.req.bits.toPrintable)
140909c6f1ddSLingrui98  XSDebug(do_commit, p"deq! [ptr] $do_commit_ptr\n")
141009c6f1ddSLingrui98  XSDebug(true.B, p"[bpuPtr] $bpuPtr, [ifuPtr] $ifuPtr, [ifuWbPtr] $ifuWbPtr [commPtr] $commPtr\n")
141109c6f1ddSLingrui98  XSDebug(true.B, p"[in] v:${io.fromBpu.resp.valid} r:${io.fromBpu.resp.ready} " +
141209c6f1ddSLingrui98    p"[out] v:${io.toIfu.req.valid} r:${io.toIfu.req.ready}\n")
141309c6f1ddSLingrui98  XSDebug(do_commit, p"[deq info] cfiIndex: $commit_cfi, $commit_pc_bundle, target: ${Hexadecimal(commit_target)}\n")
141409c6f1ddSLingrui98
141509c6f1ddSLingrui98  //   def ubtbCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
141609c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
141709c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
141809c6f1ddSLingrui98  //       Mux(valid && pd.isBr,
141909c6f1ddSLingrui98  //         isWrong ^ Mux(ans.hit.asBool,
142009c6f1ddSLingrui98  //           Mux(ans.taken.asBool, taken && ans.target === commitEntry.target,
142109c6f1ddSLingrui98  //           !taken),
142209c6f1ddSLingrui98  //         !taken),
142309c6f1ddSLingrui98  //       false.B)
142409c6f1ddSLingrui98  //     }
142509c6f1ddSLingrui98  //   }
142609c6f1ddSLingrui98
142709c6f1ddSLingrui98  //   def btbCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
142809c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
142909c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
143009c6f1ddSLingrui98  //       Mux(valid && pd.isBr,
143109c6f1ddSLingrui98  //         isWrong ^ Mux(ans.hit.asBool,
143209c6f1ddSLingrui98  //           Mux(ans.taken.asBool, taken && ans.target === commitEntry.target,
143309c6f1ddSLingrui98  //           !taken),
143409c6f1ddSLingrui98  //         !taken),
143509c6f1ddSLingrui98  //       false.B)
143609c6f1ddSLingrui98  //     }
143709c6f1ddSLingrui98  //   }
143809c6f1ddSLingrui98
143909c6f1ddSLingrui98  //   def tageCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
144009c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
144109c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
144209c6f1ddSLingrui98  //       Mux(valid && pd.isBr,
144309c6f1ddSLingrui98  //         isWrong ^ (ans.taken.asBool === taken),
144409c6f1ddSLingrui98  //       false.B)
144509c6f1ddSLingrui98  //     }
144609c6f1ddSLingrui98  //   }
144709c6f1ddSLingrui98
144809c6f1ddSLingrui98  //   def loopCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
144909c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
145009c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
145109c6f1ddSLingrui98  //       Mux(valid && (pd.isBr) && ans.hit.asBool,
145209c6f1ddSLingrui98  //         isWrong ^ (!taken),
145309c6f1ddSLingrui98  //           false.B)
145409c6f1ddSLingrui98  //     }
145509c6f1ddSLingrui98  //   }
145609c6f1ddSLingrui98
145709c6f1ddSLingrui98  //   def rasCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
145809c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
145909c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
146009c6f1ddSLingrui98  //       Mux(valid && pd.isRet.asBool /*&& taken*/ && ans.hit.asBool,
146109c6f1ddSLingrui98  //         isWrong ^ (ans.target === commitEntry.target),
146209c6f1ddSLingrui98  //           false.B)
146309c6f1ddSLingrui98  //     }
146409c6f1ddSLingrui98  //   }
146509c6f1ddSLingrui98
146609c6f1ddSLingrui98  //   val ubtbRights = ubtbCheck(commitEntry, commitEntry.metas.map(_.ubtbAns), false.B)
146709c6f1ddSLingrui98  //   val ubtbWrongs = ubtbCheck(commitEntry, commitEntry.metas.map(_.ubtbAns), true.B)
146809c6f1ddSLingrui98  //   // btb and ubtb pred jal and jalr as well
146909c6f1ddSLingrui98  //   val btbRights = btbCheck(commitEntry, commitEntry.metas.map(_.btbAns), false.B)
147009c6f1ddSLingrui98  //   val btbWrongs = btbCheck(commitEntry, commitEntry.metas.map(_.btbAns), true.B)
147109c6f1ddSLingrui98  //   val tageRights = tageCheck(commitEntry, commitEntry.metas.map(_.tageAns), false.B)
147209c6f1ddSLingrui98  //   val tageWrongs = tageCheck(commitEntry, commitEntry.metas.map(_.tageAns), true.B)
147309c6f1ddSLingrui98
147409c6f1ddSLingrui98  //   val loopRights = loopCheck(commitEntry, commitEntry.metas.map(_.loopAns), false.B)
147509c6f1ddSLingrui98  //   val loopWrongs = loopCheck(commitEntry, commitEntry.metas.map(_.loopAns), true.B)
147609c6f1ddSLingrui98
147709c6f1ddSLingrui98  //   val rasRights = rasCheck(commitEntry, commitEntry.metas.map(_.rasAns), false.B)
147809c6f1ddSLingrui98  //   val rasWrongs = rasCheck(commitEntry, commitEntry.metas.map(_.rasAns), true.B)
14791ca0e4f3SYinan Xu
1480cd365d4cSrvcoresjw  val perfEvents = Seq(
1481cd365d4cSrvcoresjw    ("bpu_s2_redirect        ", bpu_s2_redirect                                                             ),
1482cb4f77ceSLingrui98    ("bpu_s3_redirect        ", bpu_s3_redirect                                                             ),
1483cd365d4cSrvcoresjw    ("bpu_to_ftq_stall       ", enq.valid && ~enq.ready                                                     ),
1484cd365d4cSrvcoresjw    ("mispredictRedirect     ", perf_redirect.valid && RedirectLevel.flushAfter === perf_redirect.bits.level),
1485cd365d4cSrvcoresjw    ("replayRedirect         ", perf_redirect.valid && RedirectLevel.flushItself(perf_redirect.bits.level)  ),
1486cd365d4cSrvcoresjw    ("predecodeRedirect      ", fromIfuRedirect.valid                                                       ),
1487cd365d4cSrvcoresjw    ("to_ifu_bubble          ", io.toIfu.req.ready && !io.toIfu.req.valid                                   ),
1488cd365d4cSrvcoresjw    ("from_bpu_real_bubble   ", !enq.valid && enq.ready && allowBpuIn                                       ),
1489cd365d4cSrvcoresjw    ("BpInstr                ", PopCount(mbpInstrs)                                                         ),
1490cd365d4cSrvcoresjw    ("BpBInstr               ", PopCount(mbpBRights | mbpBWrongs)                                           ),
1491cd365d4cSrvcoresjw    ("BpRight                ", PopCount(mbpRights)                                                         ),
1492cd365d4cSrvcoresjw    ("BpWrong                ", PopCount(mbpWrongs)                                                         ),
1493cd365d4cSrvcoresjw    ("BpBRight               ", PopCount(mbpBRights)                                                        ),
1494cd365d4cSrvcoresjw    ("BpBWrong               ", PopCount(mbpBWrongs)                                                        ),
1495cd365d4cSrvcoresjw    ("BpJRight               ", PopCount(mbpJRights)                                                        ),
1496cd365d4cSrvcoresjw    ("BpJWrong               ", PopCount(mbpJWrongs)                                                        ),
1497cd365d4cSrvcoresjw    ("BpIRight               ", PopCount(mbpIRights)                                                        ),
1498cd365d4cSrvcoresjw    ("BpIWrong               ", PopCount(mbpIWrongs)                                                        ),
1499cd365d4cSrvcoresjw    ("BpCRight               ", PopCount(mbpCRights)                                                        ),
1500cd365d4cSrvcoresjw    ("BpCWrong               ", PopCount(mbpCWrongs)                                                        ),
1501cd365d4cSrvcoresjw    ("BpRRight               ", PopCount(mbpRRights)                                                        ),
1502cd365d4cSrvcoresjw    ("BpRWrong               ", PopCount(mbpRWrongs)                                                        ),
1503cd365d4cSrvcoresjw    ("ftb_false_hit          ", PopCount(ftb_false_hit)                                                     ),
1504cd365d4cSrvcoresjw    ("ftb_hit                ", PopCount(ftb_hit)                                                           ),
1505cd365d4cSrvcoresjw  )
15061ca0e4f3SYinan Xu  generatePerfEvent()
150709c6f1ddSLingrui98}