xref: /XiangShan/src/main/scala/xiangshan/frontend/NewFtq.scala (revision c2d1ec7d8734e9b271854cd55dc29c8b1826b3cf)
109c6f1ddSLingrui98/***************************************************************************************
209c6f1ddSLingrui98* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
309c6f1ddSLingrui98* Copyright (c) 2020-2021 Peng Cheng Laboratory
409c6f1ddSLingrui98*
509c6f1ddSLingrui98* XiangShan is licensed under Mulan PSL v2.
609c6f1ddSLingrui98* You can use this software according to the terms and conditions of the Mulan PSL v2.
709c6f1ddSLingrui98* You may obtain a copy of Mulan PSL v2 at:
809c6f1ddSLingrui98*          http://license.coscl.org.cn/MulanPSL2
909c6f1ddSLingrui98*
1009c6f1ddSLingrui98* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
1109c6f1ddSLingrui98* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
1209c6f1ddSLingrui98* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
1309c6f1ddSLingrui98*
1409c6f1ddSLingrui98* See the Mulan PSL v2 for more details.
1509c6f1ddSLingrui98***************************************************************************************/
1609c6f1ddSLingrui98
1709c6f1ddSLingrui98package xiangshan.frontend
1809c6f1ddSLingrui98
1909c6f1ddSLingrui98import chipsalliance.rocketchip.config.Parameters
2009c6f1ddSLingrui98import chisel3._
2109c6f1ddSLingrui98import chisel3.util._
221ca0e4f3SYinan Xuimport utils._
2309c6f1ddSLingrui98import xiangshan._
24e30430c2SJayimport xiangshan.frontend.icache._
251ca0e4f3SYinan Xuimport xiangshan.backend.CtrlToFtqIO
262e1be6e1SSteve Gouimport xiangshan.backend.decode.ImmUnion
2709c6f1ddSLingrui98
2809c6f1ddSLingrui98class FtqPtr(implicit p: Parameters) extends CircularQueuePtr[FtqPtr](
2909c6f1ddSLingrui98  p => p(XSCoreParamsKey).FtqSize
3009c6f1ddSLingrui98){
3109c6f1ddSLingrui98}
3209c6f1ddSLingrui98
3309c6f1ddSLingrui98object FtqPtr {
3409c6f1ddSLingrui98  def apply(f: Bool, v: UInt)(implicit p: Parameters): FtqPtr = {
3509c6f1ddSLingrui98    val ptr = Wire(new FtqPtr)
3609c6f1ddSLingrui98    ptr.flag := f
3709c6f1ddSLingrui98    ptr.value := v
3809c6f1ddSLingrui98    ptr
3909c6f1ddSLingrui98  }
4009c6f1ddSLingrui98  def inverse(ptr: FtqPtr)(implicit p: Parameters): FtqPtr = {
4109c6f1ddSLingrui98    apply(!ptr.flag, ptr.value)
4209c6f1ddSLingrui98  }
4309c6f1ddSLingrui98}
4409c6f1ddSLingrui98
4509c6f1ddSLingrui98class FtqNRSRAM[T <: Data](gen: T, numRead: Int)(implicit p: Parameters) extends XSModule {
4609c6f1ddSLingrui98
4709c6f1ddSLingrui98  val io = IO(new Bundle() {
4809c6f1ddSLingrui98    val raddr = Input(Vec(numRead, UInt(log2Up(FtqSize).W)))
4909c6f1ddSLingrui98    val ren = Input(Vec(numRead, Bool()))
5009c6f1ddSLingrui98    val rdata = Output(Vec(numRead, gen))
5109c6f1ddSLingrui98    val waddr = Input(UInt(log2Up(FtqSize).W))
5209c6f1ddSLingrui98    val wen = Input(Bool())
5309c6f1ddSLingrui98    val wdata = Input(gen)
5409c6f1ddSLingrui98  })
5509c6f1ddSLingrui98
5609c6f1ddSLingrui98  for(i <- 0 until numRead){
5709c6f1ddSLingrui98    val sram = Module(new SRAMTemplate(gen, FtqSize))
5809c6f1ddSLingrui98    sram.io.r.req.valid := io.ren(i)
5909c6f1ddSLingrui98    sram.io.r.req.bits.setIdx := io.raddr(i)
6009c6f1ddSLingrui98    io.rdata(i) := sram.io.r.resp.data(0)
6109c6f1ddSLingrui98    sram.io.w.req.valid := io.wen
6209c6f1ddSLingrui98    sram.io.w.req.bits.setIdx := io.waddr
6309c6f1ddSLingrui98    sram.io.w.req.bits.data := VecInit(io.wdata)
6409c6f1ddSLingrui98  }
6509c6f1ddSLingrui98
6609c6f1ddSLingrui98}
6709c6f1ddSLingrui98
6809c6f1ddSLingrui98class Ftq_RF_Components(implicit p: Parameters) extends XSBundle with BPUUtils {
6909c6f1ddSLingrui98  val startAddr = UInt(VAddrBits.W)
70b37e4b45SLingrui98  val nextLineAddr = UInt(VAddrBits.W)
7109c6f1ddSLingrui98  val isNextMask = Vec(PredictWidth, Bool())
72b37e4b45SLingrui98  val fallThruError = Bool()
73b37e4b45SLingrui98  // val carry = Bool()
7409c6f1ddSLingrui98  def getPc(offset: UInt) = {
7585215037SLingrui98    def getHigher(pc: UInt) = pc(VAddrBits-1, log2Ceil(PredictWidth)+instOffsetBits+1)
7685215037SLingrui98    def getOffset(pc: UInt) = pc(log2Ceil(PredictWidth)+instOffsetBits, instOffsetBits)
77b37e4b45SLingrui98    Cat(getHigher(Mux(isNextMask(offset) && startAddr(log2Ceil(PredictWidth)+instOffsetBits), nextLineAddr, startAddr)),
7809c6f1ddSLingrui98        getOffset(startAddr)+offset, 0.U(instOffsetBits.W))
7909c6f1ddSLingrui98  }
8009c6f1ddSLingrui98  def fromBranchPrediction(resp: BranchPredictionBundle) = {
81a229ab6cSLingrui98    def carryPos(addr: UInt) = addr(instOffsetBits+log2Ceil(PredictWidth)+1)
8209c6f1ddSLingrui98    this.startAddr := resp.pc
83a60a2901SLingrui98    this.nextLineAddr := resp.pc + (FetchWidth * 4 * 2).U // may be broken on other configs
8409c6f1ddSLingrui98    this.isNextMask := VecInit((0 until PredictWidth).map(i =>
8509c6f1ddSLingrui98      (resp.pc(log2Ceil(PredictWidth), 1) +& i.U)(log2Ceil(PredictWidth)).asBool()
8609c6f1ddSLingrui98    ))
87b37e4b45SLingrui98    this.fallThruError := resp.fallThruError
8809c6f1ddSLingrui98    this
8909c6f1ddSLingrui98  }
9009c6f1ddSLingrui98  override def toPrintable: Printable = {
91b37e4b45SLingrui98    p"startAddr:${Hexadecimal(startAddr)}"
9209c6f1ddSLingrui98  }
9309c6f1ddSLingrui98}
9409c6f1ddSLingrui98
9509c6f1ddSLingrui98class Ftq_pd_Entry(implicit p: Parameters) extends XSBundle {
9609c6f1ddSLingrui98  val brMask = Vec(PredictWidth, Bool())
9709c6f1ddSLingrui98  val jmpInfo = ValidUndirectioned(Vec(3, Bool()))
9809c6f1ddSLingrui98  val jmpOffset = UInt(log2Ceil(PredictWidth).W)
9909c6f1ddSLingrui98  val jalTarget = UInt(VAddrBits.W)
10009c6f1ddSLingrui98  val rvcMask = Vec(PredictWidth, Bool())
10109c6f1ddSLingrui98  def hasJal  = jmpInfo.valid && !jmpInfo.bits(0)
10209c6f1ddSLingrui98  def hasJalr = jmpInfo.valid && jmpInfo.bits(0)
10309c6f1ddSLingrui98  def hasCall = jmpInfo.valid && jmpInfo.bits(1)
10409c6f1ddSLingrui98  def hasRet  = jmpInfo.valid && jmpInfo.bits(2)
10509c6f1ddSLingrui98
10609c6f1ddSLingrui98  def fromPdWb(pdWb: PredecodeWritebackBundle) = {
10709c6f1ddSLingrui98    val pds = pdWb.pd
10809c6f1ddSLingrui98    this.brMask := VecInit(pds.map(pd => pd.isBr && pd.valid))
10909c6f1ddSLingrui98    this.jmpInfo.valid := VecInit(pds.map(pd => (pd.isJal || pd.isJalr) && pd.valid)).asUInt.orR
11009c6f1ddSLingrui98    this.jmpInfo.bits := ParallelPriorityMux(pds.map(pd => (pd.isJal || pd.isJalr) && pd.valid),
11109c6f1ddSLingrui98                                             pds.map(pd => VecInit(pd.isJalr, pd.isCall, pd.isRet)))
11209c6f1ddSLingrui98    this.jmpOffset := ParallelPriorityEncoder(pds.map(pd => (pd.isJal || pd.isJalr) && pd.valid))
11309c6f1ddSLingrui98    this.rvcMask := VecInit(pds.map(pd => pd.isRVC))
11409c6f1ddSLingrui98    this.jalTarget := pdWb.jalTarget
11509c6f1ddSLingrui98  }
11609c6f1ddSLingrui98
11709c6f1ddSLingrui98  def toPd(offset: UInt) = {
11809c6f1ddSLingrui98    require(offset.getWidth == log2Ceil(PredictWidth))
11909c6f1ddSLingrui98    val pd = Wire(new PreDecodeInfo)
12009c6f1ddSLingrui98    pd.valid := true.B
12109c6f1ddSLingrui98    pd.isRVC := rvcMask(offset)
12209c6f1ddSLingrui98    val isBr = brMask(offset)
12309c6f1ddSLingrui98    val isJalr = offset === jmpOffset && jmpInfo.valid && jmpInfo.bits(0)
12409c6f1ddSLingrui98    pd.brType := Cat(offset === jmpOffset && jmpInfo.valid, isJalr || isBr)
12509c6f1ddSLingrui98    pd.isCall := offset === jmpOffset && jmpInfo.valid && jmpInfo.bits(1)
12609c6f1ddSLingrui98    pd.isRet  := offset === jmpOffset && jmpInfo.valid && jmpInfo.bits(2)
12709c6f1ddSLingrui98    pd
12809c6f1ddSLingrui98  }
12909c6f1ddSLingrui98}
13009c6f1ddSLingrui98
13109c6f1ddSLingrui98
13209c6f1ddSLingrui98
133*c2d1ec7dSLingrui98class Ftq_Redirect_SRAMEntry(implicit p: Parameters) extends SpeculativeInfo {}
13409c6f1ddSLingrui98
13509c6f1ddSLingrui98class Ftq_1R_SRAMEntry(implicit p: Parameters) extends XSBundle with HasBPUConst {
13609c6f1ddSLingrui98  val meta = UInt(MaxMetaLength.W)
13709c6f1ddSLingrui98}
13809c6f1ddSLingrui98
13909c6f1ddSLingrui98class Ftq_Pred_Info(implicit p: Parameters) extends XSBundle {
14009c6f1ddSLingrui98  val target = UInt(VAddrBits.W)
14109c6f1ddSLingrui98  val cfiIndex = ValidUndirectioned(UInt(log2Ceil(PredictWidth).W))
14209c6f1ddSLingrui98}
14309c6f1ddSLingrui98
14409c6f1ddSLingrui98
14509c6f1ddSLingrui98class FtqRead[T <: Data](private val gen: T)(implicit p: Parameters) extends XSBundle {
14609c6f1ddSLingrui98  val ptr = Output(new FtqPtr)
14709c6f1ddSLingrui98  val offset = Output(UInt(log2Ceil(PredictWidth).W))
14809c6f1ddSLingrui98  val data = Input(gen)
14909c6f1ddSLingrui98  def apply(ptr: FtqPtr, offset: UInt) = {
15009c6f1ddSLingrui98    this.ptr := ptr
15109c6f1ddSLingrui98    this.offset := offset
15209c6f1ddSLingrui98    this.data
15309c6f1ddSLingrui98  }
15409c6f1ddSLingrui98}
15509c6f1ddSLingrui98
15609c6f1ddSLingrui98
15709c6f1ddSLingrui98class FtqToBpuIO(implicit p: Parameters) extends XSBundle {
15809c6f1ddSLingrui98  val redirect = Valid(new BranchPredictionRedirect)
15909c6f1ddSLingrui98  val update = Valid(new BranchPredictionUpdate)
16009c6f1ddSLingrui98  val enq_ptr = Output(new FtqPtr)
16109c6f1ddSLingrui98}
16209c6f1ddSLingrui98
16309c6f1ddSLingrui98class FtqToIfuIO(implicit p: Parameters) extends XSBundle with HasCircularQueuePtrHelper {
16409c6f1ddSLingrui98  val req = Decoupled(new FetchRequestBundle)
16509c6f1ddSLingrui98  val redirect = Valid(new Redirect)
16609c6f1ddSLingrui98  val flushFromBpu = new Bundle {
16709c6f1ddSLingrui98    // when ifu pipeline is not stalled,
16809c6f1ddSLingrui98    // a packet from bpu s3 can reach f1 at most
16909c6f1ddSLingrui98    val s2 = Valid(new FtqPtr)
170cb4f77ceSLingrui98    val s3 = Valid(new FtqPtr)
17109c6f1ddSLingrui98    def shouldFlushBy(src: Valid[FtqPtr], idx_to_flush: FtqPtr) = {
17209c6f1ddSLingrui98      src.valid && !isAfter(src.bits, idx_to_flush)
17309c6f1ddSLingrui98    }
17409c6f1ddSLingrui98    def shouldFlushByStage2(idx: FtqPtr) = shouldFlushBy(s2, idx)
175cb4f77ceSLingrui98    def shouldFlushByStage3(idx: FtqPtr) = shouldFlushBy(s3, idx)
17609c6f1ddSLingrui98  }
17709c6f1ddSLingrui98}
17809c6f1ddSLingrui98
179c5c5edaeSJeniusclass FtqToICacheIO(implicit p: Parameters) extends XSBundle with HasCircularQueuePtrHelper {
180c5c5edaeSJenius  //NOTE: req.bits must be prepare in T cycle
181c5c5edaeSJenius  // while req.valid is set true in T + 1 cycle
182c5c5edaeSJenius  val req = Decoupled(new FtqToICacheRequestBundle)
183c5c5edaeSJenius}
184c5c5edaeSJenius
18509c6f1ddSLingrui98trait HasBackendRedirectInfo extends HasXSParameter {
1862e1be6e1SSteve Gou  def numRedirectPcRead = exuParameters.JmpCnt + exuParameters.AluCnt + 1
18709c6f1ddSLingrui98  def isLoadReplay(r: Valid[Redirect]) = r.bits.flushItself()
18809c6f1ddSLingrui98}
18909c6f1ddSLingrui98
19009c6f1ddSLingrui98class FtqToCtrlIO(implicit p: Parameters) extends XSBundle with HasBackendRedirectInfo {
191b56f947eSYinan Xu  // write to backend pc mem
192b56f947eSYinan Xu  val pc_mem_wen = Output(Bool())
193b56f947eSYinan Xu  val pc_mem_waddr = Output(UInt(log2Ceil(FtqSize).W))
194b56f947eSYinan Xu  val pc_mem_wdata = Output(new Ftq_RF_Components)
195873dc383SLingrui98  // newest target
196873dc383SLingrui98  val newest_entry_target = Output(UInt(VAddrBits.W))
197873dc383SLingrui98  val newest_entry_ptr = Output(new FtqPtr)
19809c6f1ddSLingrui98}
19909c6f1ddSLingrui98
20009c6f1ddSLingrui98
20109c6f1ddSLingrui98class FTBEntryGen(implicit p: Parameters) extends XSModule with HasBackendRedirectInfo with HasBPUParameter {
20209c6f1ddSLingrui98  val io = IO(new Bundle {
20309c6f1ddSLingrui98    val start_addr = Input(UInt(VAddrBits.W))
20409c6f1ddSLingrui98    val old_entry = Input(new FTBEntry)
20509c6f1ddSLingrui98    val pd = Input(new Ftq_pd_Entry)
20609c6f1ddSLingrui98    val cfiIndex = Flipped(Valid(UInt(log2Ceil(PredictWidth).W)))
20709c6f1ddSLingrui98    val target = Input(UInt(VAddrBits.W))
20809c6f1ddSLingrui98    val hit = Input(Bool())
20909c6f1ddSLingrui98    val mispredict_vec = Input(Vec(PredictWidth, Bool()))
21009c6f1ddSLingrui98
21109c6f1ddSLingrui98    val new_entry = Output(new FTBEntry)
21209c6f1ddSLingrui98    val new_br_insert_pos = Output(Vec(numBr, Bool()))
21309c6f1ddSLingrui98    val taken_mask = Output(Vec(numBr, Bool()))
214803124a6SLingrui98    val jmp_taken = Output(Bool())
21509c6f1ddSLingrui98    val mispred_mask = Output(Vec(numBr+1, Bool()))
21609c6f1ddSLingrui98
21709c6f1ddSLingrui98    // for perf counters
21809c6f1ddSLingrui98    val is_init_entry = Output(Bool())
21909c6f1ddSLingrui98    val is_old_entry = Output(Bool())
22009c6f1ddSLingrui98    val is_new_br = Output(Bool())
22109c6f1ddSLingrui98    val is_jalr_target_modified = Output(Bool())
22209c6f1ddSLingrui98    val is_always_taken_modified = Output(Bool())
22309c6f1ddSLingrui98    val is_br_full = Output(Bool())
22409c6f1ddSLingrui98  })
22509c6f1ddSLingrui98
22609c6f1ddSLingrui98  // no mispredictions detected at predecode
22709c6f1ddSLingrui98  val hit = io.hit
22809c6f1ddSLingrui98  val pd = io.pd
22909c6f1ddSLingrui98
23009c6f1ddSLingrui98  val init_entry = WireInit(0.U.asTypeOf(new FTBEntry))
23109c6f1ddSLingrui98
23209c6f1ddSLingrui98
23309c6f1ddSLingrui98  val cfi_is_br = pd.brMask(io.cfiIndex.bits) && io.cfiIndex.valid
23409c6f1ddSLingrui98  val entry_has_jmp = pd.jmpInfo.valid
23509c6f1ddSLingrui98  val new_jmp_is_jal  = entry_has_jmp && !pd.jmpInfo.bits(0) && io.cfiIndex.valid
23609c6f1ddSLingrui98  val new_jmp_is_jalr = entry_has_jmp &&  pd.jmpInfo.bits(0) && io.cfiIndex.valid
23709c6f1ddSLingrui98  val new_jmp_is_call = entry_has_jmp &&  pd.jmpInfo.bits(1) && io.cfiIndex.valid
23809c6f1ddSLingrui98  val new_jmp_is_ret  = entry_has_jmp &&  pd.jmpInfo.bits(2) && io.cfiIndex.valid
23909c6f1ddSLingrui98  val last_jmp_rvi = entry_has_jmp && pd.jmpOffset === (PredictWidth-1).U && !pd.rvcMask.last
240a60a2901SLingrui98  // val last_br_rvi = cfi_is_br && io.cfiIndex.bits === (PredictWidth-1).U && !pd.rvcMask.last
24109c6f1ddSLingrui98
24209c6f1ddSLingrui98  val cfi_is_jal = io.cfiIndex.bits === pd.jmpOffset && new_jmp_is_jal
24309c6f1ddSLingrui98  val cfi_is_jalr = io.cfiIndex.bits === pd.jmpOffset && new_jmp_is_jalr
24409c6f1ddSLingrui98
245a60a2901SLingrui98  def carryPos = log2Ceil(PredictWidth)+instOffsetBits
24609c6f1ddSLingrui98  def getLower(pc: UInt) = pc(carryPos-1, instOffsetBits)
24709c6f1ddSLingrui98  // if not hit, establish a new entry
24809c6f1ddSLingrui98  init_entry.valid := true.B
24909c6f1ddSLingrui98  // tag is left for ftb to assign
250eeb5ff92SLingrui98
251eeb5ff92SLingrui98  // case br
252eeb5ff92SLingrui98  val init_br_slot = init_entry.getSlotForBr(0)
253eeb5ff92SLingrui98  when (cfi_is_br) {
254eeb5ff92SLingrui98    init_br_slot.valid := true.B
255eeb5ff92SLingrui98    init_br_slot.offset := io.cfiIndex.bits
256b37e4b45SLingrui98    init_br_slot.setLowerStatByTarget(io.start_addr, io.target, numBr == 1)
257eeb5ff92SLingrui98    init_entry.always_taken(0) := true.B // set to always taken on init
258eeb5ff92SLingrui98  }
259eeb5ff92SLingrui98
260eeb5ff92SLingrui98  // case jmp
261eeb5ff92SLingrui98  when (entry_has_jmp) {
262eeb5ff92SLingrui98    init_entry.tailSlot.offset := pd.jmpOffset
263eeb5ff92SLingrui98    init_entry.tailSlot.valid := new_jmp_is_jal || new_jmp_is_jalr
264eeb5ff92SLingrui98    init_entry.tailSlot.setLowerStatByTarget(io.start_addr, Mux(cfi_is_jalr, io.target, pd.jalTarget), isShare=false)
265eeb5ff92SLingrui98  }
266eeb5ff92SLingrui98
26709c6f1ddSLingrui98  val jmpPft = getLower(io.start_addr) +& pd.jmpOffset +& Mux(pd.rvcMask(pd.jmpOffset), 1.U, 2.U)
268a60a2901SLingrui98  init_entry.pftAddr := Mux(entry_has_jmp && !last_jmp_rvi, jmpPft, getLower(io.start_addr))
269a60a2901SLingrui98  init_entry.carry   := Mux(entry_has_jmp && !last_jmp_rvi, jmpPft(carryPos-instOffsetBits), true.B)
27009c6f1ddSLingrui98  init_entry.isJalr := new_jmp_is_jalr
27109c6f1ddSLingrui98  init_entry.isCall := new_jmp_is_call
27209c6f1ddSLingrui98  init_entry.isRet  := new_jmp_is_ret
273f4ebc4b2SLingrui98  // that means fall thru points to the middle of an inst
274ae409b75SSteve Gou  init_entry.last_may_be_rvi_call := pd.jmpOffset === (PredictWidth-1).U && !pd.rvcMask(pd.jmpOffset)
27509c6f1ddSLingrui98
27609c6f1ddSLingrui98  // if hit, check whether a new cfi(only br is possible) is detected
27709c6f1ddSLingrui98  val oe = io.old_entry
278eeb5ff92SLingrui98  val br_recorded_vec = oe.getBrRecordedVec(io.cfiIndex.bits)
27909c6f1ddSLingrui98  val br_recorded = br_recorded_vec.asUInt.orR
28009c6f1ddSLingrui98  val is_new_br = cfi_is_br && !br_recorded
28109c6f1ddSLingrui98  val new_br_offset = io.cfiIndex.bits
28209c6f1ddSLingrui98  // vec(i) means new br will be inserted BEFORE old br(i)
283eeb5ff92SLingrui98  val allBrSlotsVec = oe.allSlotsForBr
28409c6f1ddSLingrui98  val new_br_insert_onehot = VecInit((0 until numBr).map{
28509c6f1ddSLingrui98    i => i match {
286eeb5ff92SLingrui98      case 0 =>
287eeb5ff92SLingrui98        !allBrSlotsVec(0).valid || new_br_offset < allBrSlotsVec(0).offset
288eeb5ff92SLingrui98      case idx =>
289eeb5ff92SLingrui98        allBrSlotsVec(idx-1).valid && new_br_offset > allBrSlotsVec(idx-1).offset &&
290eeb5ff92SLingrui98        (!allBrSlotsVec(idx).valid || new_br_offset < allBrSlotsVec(idx).offset)
29109c6f1ddSLingrui98    }
29209c6f1ddSLingrui98  })
29309c6f1ddSLingrui98
29409c6f1ddSLingrui98  val old_entry_modified = WireInit(io.old_entry)
29509c6f1ddSLingrui98  for (i <- 0 until numBr) {
296eeb5ff92SLingrui98    val slot = old_entry_modified.allSlotsForBr(i)
297eeb5ff92SLingrui98    when (new_br_insert_onehot(i)) {
298eeb5ff92SLingrui98      slot.valid := true.B
299eeb5ff92SLingrui98      slot.offset := new_br_offset
300b37e4b45SLingrui98      slot.setLowerStatByTarget(io.start_addr, io.target, i == numBr-1)
301eeb5ff92SLingrui98      old_entry_modified.always_taken(i) := true.B
302eeb5ff92SLingrui98    }.elsewhen (new_br_offset > oe.allSlotsForBr(i).offset) {
303eeb5ff92SLingrui98      old_entry_modified.always_taken(i) := false.B
304eeb5ff92SLingrui98      // all other fields remain unchanged
305eeb5ff92SLingrui98    }.otherwise {
306eeb5ff92SLingrui98      // case i == 0, remain unchanged
307eeb5ff92SLingrui98      if (i != 0) {
308b37e4b45SLingrui98        val noNeedToMoveFromFormerSlot = (i == numBr-1).B && !oe.brSlots.last.valid
309eeb5ff92SLingrui98        when (!noNeedToMoveFromFormerSlot) {
310eeb5ff92SLingrui98          slot.fromAnotherSlot(oe.allSlotsForBr(i-1))
311eeb5ff92SLingrui98          old_entry_modified.always_taken(i) := oe.always_taken(i)
31209c6f1ddSLingrui98        }
313eeb5ff92SLingrui98      }
314eeb5ff92SLingrui98    }
315eeb5ff92SLingrui98  }
31609c6f1ddSLingrui98
317eeb5ff92SLingrui98  // two circumstances:
318eeb5ff92SLingrui98  // 1. oe: | br | j  |, new br should be in front of j, thus addr of j should be new pft
319eeb5ff92SLingrui98  // 2. oe: | br | br |, new br could be anywhere between, thus new pft is the addr of either
320eeb5ff92SLingrui98  //        the previous last br or the new br
321eeb5ff92SLingrui98  val may_have_to_replace = oe.noEmptySlotForNewBr
322eeb5ff92SLingrui98  val pft_need_to_change = is_new_br && may_have_to_replace
32309c6f1ddSLingrui98  // it should either be the given last br or the new br
32409c6f1ddSLingrui98  when (pft_need_to_change) {
325eeb5ff92SLingrui98    val new_pft_offset =
326710a8720SLingrui98      Mux(!new_br_insert_onehot.asUInt.orR,
327710a8720SLingrui98        new_br_offset, oe.allSlotsForBr.last.offset)
328eeb5ff92SLingrui98
329710a8720SLingrui98    // set jmp to invalid
33009c6f1ddSLingrui98    old_entry_modified.pftAddr := getLower(io.start_addr) + new_pft_offset
33109c6f1ddSLingrui98    old_entry_modified.carry := (getLower(io.start_addr) +& new_pft_offset).head(1).asBool
332f4ebc4b2SLingrui98    old_entry_modified.last_may_be_rvi_call := false.B
33309c6f1ddSLingrui98    old_entry_modified.isCall := false.B
33409c6f1ddSLingrui98    old_entry_modified.isRet := false.B
335eeb5ff92SLingrui98    old_entry_modified.isJalr := false.B
33609c6f1ddSLingrui98  }
33709c6f1ddSLingrui98
33809c6f1ddSLingrui98  val old_entry_jmp_target_modified = WireInit(oe)
339710a8720SLingrui98  val old_target = oe.tailSlot.getTarget(io.start_addr) // may be wrong because we store only 20 lowest bits
340b37e4b45SLingrui98  val old_tail_is_jmp = !oe.tailSlot.sharing
341eeb5ff92SLingrui98  val jalr_target_modified = cfi_is_jalr && (old_target =/= io.target) && old_tail_is_jmp // TODO: pass full jalr target
3423bcae573SLingrui98  when (jalr_target_modified) {
34309c6f1ddSLingrui98    old_entry_jmp_target_modified.setByJmpTarget(io.start_addr, io.target)
34409c6f1ddSLingrui98    old_entry_jmp_target_modified.always_taken := 0.U.asTypeOf(Vec(numBr, Bool()))
34509c6f1ddSLingrui98  }
34609c6f1ddSLingrui98
34709c6f1ddSLingrui98  val old_entry_always_taken = WireInit(oe)
34809c6f1ddSLingrui98  val always_taken_modified_vec = Wire(Vec(numBr, Bool())) // whether modified or not
34909c6f1ddSLingrui98  for (i <- 0 until numBr) {
35009c6f1ddSLingrui98    old_entry_always_taken.always_taken(i) :=
35109c6f1ddSLingrui98      oe.always_taken(i) && io.cfiIndex.valid && oe.brValids(i) && io.cfiIndex.bits === oe.brOffset(i)
352710a8720SLingrui98    always_taken_modified_vec(i) := oe.always_taken(i) && !old_entry_always_taken.always_taken(i)
35309c6f1ddSLingrui98  }
35409c6f1ddSLingrui98  val always_taken_modified = always_taken_modified_vec.reduce(_||_)
35509c6f1ddSLingrui98
35609c6f1ddSLingrui98
35709c6f1ddSLingrui98
35809c6f1ddSLingrui98  val derived_from_old_entry =
35909c6f1ddSLingrui98    Mux(is_new_br, old_entry_modified,
3603bcae573SLingrui98      Mux(jalr_target_modified, old_entry_jmp_target_modified, old_entry_always_taken))
36109c6f1ddSLingrui98
36209c6f1ddSLingrui98
36309c6f1ddSLingrui98  io.new_entry := Mux(!hit, init_entry, derived_from_old_entry)
36409c6f1ddSLingrui98
36509c6f1ddSLingrui98  io.new_br_insert_pos := new_br_insert_onehot
36609c6f1ddSLingrui98  io.taken_mask := VecInit((io.new_entry.brOffset zip io.new_entry.brValids).map{
36709c6f1ddSLingrui98    case (off, v) => io.cfiIndex.bits === off && io.cfiIndex.valid && v
36809c6f1ddSLingrui98  })
369803124a6SLingrui98  io.jmp_taken := io.new_entry.jmpValid && io.new_entry.tailSlot.offset === io.cfiIndex.bits
37009c6f1ddSLingrui98  for (i <- 0 until numBr) {
37109c6f1ddSLingrui98    io.mispred_mask(i) := io.new_entry.brValids(i) && io.mispredict_vec(io.new_entry.brOffset(i))
37209c6f1ddSLingrui98  }
37309c6f1ddSLingrui98  io.mispred_mask.last := io.new_entry.jmpValid && io.mispredict_vec(pd.jmpOffset)
37409c6f1ddSLingrui98
37509c6f1ddSLingrui98  // for perf counters
37609c6f1ddSLingrui98  io.is_init_entry := !hit
3773bcae573SLingrui98  io.is_old_entry := hit && !is_new_br && !jalr_target_modified && !always_taken_modified
37809c6f1ddSLingrui98  io.is_new_br := hit && is_new_br
3793bcae573SLingrui98  io.is_jalr_target_modified := hit && jalr_target_modified
38009c6f1ddSLingrui98  io.is_always_taken_modified := hit && always_taken_modified
381eeb5ff92SLingrui98  io.is_br_full := hit && is_new_br && may_have_to_replace
38209c6f1ddSLingrui98}
38309c6f1ddSLingrui98
384c5c5edaeSJeniusclass FtqPcMemWrapper(numOtherReads: Int)(implicit p: Parameters) extends XSModule with HasBackendRedirectInfo {
385c5c5edaeSJenius  val io = IO(new Bundle {
386c5c5edaeSJenius    val ifuPtr_w       = Input(new FtqPtr)
387c5c5edaeSJenius    val ifuPtrPlus1_w  = Input(new FtqPtr)
3886bf9b30dSLingrui98    val ifuPtrPlus2_w  = Input(new FtqPtr)
389c5c5edaeSJenius    val commPtr_w      = Input(new FtqPtr)
3906bf9b30dSLingrui98    val commPtrPlus1_w = Input(new FtqPtr)
391c5c5edaeSJenius    val ifuPtr_rdata       = Output(new Ftq_RF_Components)
392c5c5edaeSJenius    val ifuPtrPlus1_rdata  = Output(new Ftq_RF_Components)
3936bf9b30dSLingrui98    val ifuPtrPlus2_rdata  = Output(new Ftq_RF_Components)
394c5c5edaeSJenius    val commPtr_rdata      = Output(new Ftq_RF_Components)
3956bf9b30dSLingrui98    val commPtrPlus1_rdata = Output(new Ftq_RF_Components)
396c5c5edaeSJenius
397c5c5edaeSJenius    val other_raddrs = Input(Vec(numOtherReads, UInt(log2Ceil(FtqSize).W)))
398c5c5edaeSJenius    val other_rdatas = Output(Vec(numOtherReads, new Ftq_RF_Components))
399c5c5edaeSJenius
400c5c5edaeSJenius    val wen = Input(Bool())
401c5c5edaeSJenius    val waddr = Input(UInt(log2Ceil(FtqSize).W))
402c5c5edaeSJenius    val wdata = Input(new Ftq_RF_Components)
403c5c5edaeSJenius  })
404c5c5edaeSJenius
4056bf9b30dSLingrui98  val num_pc_read = numOtherReads + 5
406c5c5edaeSJenius  val mem = Module(new SyncDataModuleTemplate(new Ftq_RF_Components, FtqSize,
40728f2cf58SLingrui98    num_pc_read, 1, "FtqPC"))
408c5c5edaeSJenius  mem.io.wen(0)   := io.wen
409c5c5edaeSJenius  mem.io.waddr(0) := io.waddr
410c5c5edaeSJenius  mem.io.wdata(0) := io.wdata
411c5c5edaeSJenius
4126bf9b30dSLingrui98  // read one cycle ahead for ftq local reads
413c5c5edaeSJenius  val raddr_vec = VecInit(io.other_raddrs ++
41488bc4f90SLingrui98    Seq(io.ifuPtr_w.value, io.ifuPtrPlus1_w.value, io.ifuPtrPlus2_w.value, io.commPtrPlus1_w.value, io.commPtr_w.value))
415c5c5edaeSJenius
416c5c5edaeSJenius  mem.io.raddr := raddr_vec
417c5c5edaeSJenius
4186bf9b30dSLingrui98  io.other_rdatas       := mem.io.rdata.dropRight(5)
4196bf9b30dSLingrui98  io.ifuPtr_rdata       := mem.io.rdata.dropRight(4).last
4206bf9b30dSLingrui98  io.ifuPtrPlus1_rdata  := mem.io.rdata.dropRight(3).last
4216bf9b30dSLingrui98  io.ifuPtrPlus2_rdata  := mem.io.rdata.dropRight(2).last
4226bf9b30dSLingrui98  io.commPtrPlus1_rdata := mem.io.rdata.dropRight(1).last
423c5c5edaeSJenius  io.commPtr_rdata      := mem.io.rdata.last
424c5c5edaeSJenius}
425c5c5edaeSJenius
42609c6f1ddSLingrui98class Ftq(implicit p: Parameters) extends XSModule with HasCircularQueuePtrHelper
427e30430c2SJay  with HasBackendRedirectInfo with BPUUtils with HasBPUConst with HasPerfEvents
428e30430c2SJay  with HasICacheParameters{
42909c6f1ddSLingrui98  val io = IO(new Bundle {
43009c6f1ddSLingrui98    val fromBpu = Flipped(new BpuToFtqIO)
43109c6f1ddSLingrui98    val fromIfu = Flipped(new IfuToFtqIO)
43209c6f1ddSLingrui98    val fromBackend = Flipped(new CtrlToFtqIO)
43309c6f1ddSLingrui98
43409c6f1ddSLingrui98    val toBpu = new FtqToBpuIO
43509c6f1ddSLingrui98    val toIfu = new FtqToIfuIO
436c5c5edaeSJenius    val toICache = new FtqToICacheIO
43709c6f1ddSLingrui98    val toBackend = new FtqToCtrlIO
43809c6f1ddSLingrui98
4397052722fSJay    val toPrefetch = new FtqPrefechBundle
4407052722fSJay
44109c6f1ddSLingrui98    val bpuInfo = new Bundle {
44209c6f1ddSLingrui98      val bpRight = Output(UInt(XLEN.W))
44309c6f1ddSLingrui98      val bpWrong = Output(UInt(XLEN.W))
44409c6f1ddSLingrui98    }
44509c6f1ddSLingrui98  })
44609c6f1ddSLingrui98  io.bpuInfo := DontCare
44709c6f1ddSLingrui98
4482e1be6e1SSteve Gou  val backendRedirect = Wire(Valid(new Redirect))
4492e1be6e1SSteve Gou  val backendRedirectReg = RegNext(backendRedirect)
45009c6f1ddSLingrui98
451df5b4b8eSYinan Xu  val stage2Flush = backendRedirect.valid
45209c6f1ddSLingrui98  val backendFlush = stage2Flush || RegNext(stage2Flush)
45309c6f1ddSLingrui98  val ifuFlush = Wire(Bool())
45409c6f1ddSLingrui98
45509c6f1ddSLingrui98  val flush = stage2Flush || RegNext(stage2Flush)
45609c6f1ddSLingrui98
45709c6f1ddSLingrui98  val allowBpuIn, allowToIfu = WireInit(false.B)
45809c6f1ddSLingrui98  val flushToIfu = !allowToIfu
459df5b4b8eSYinan Xu  allowBpuIn := !ifuFlush && !backendRedirect.valid && !backendRedirectReg.valid
460df5b4b8eSYinan Xu  allowToIfu := !ifuFlush && !backendRedirect.valid && !backendRedirectReg.valid
46109c6f1ddSLingrui98
462f56177cbSJenius  def copyNum = 5
463e30430c2SJay  val bpuPtr, ifuPtr, ifuWbPtr, commPtr = RegInit(FtqPtr(false.B, 0.U))
464c9bc5480SLingrui98  val ifuPtrPlus1 = RegInit(FtqPtr(false.B, 1.U))
4656bf9b30dSLingrui98  val ifuPtrPlus2 = RegInit(FtqPtr(false.B, 2.U))
4666bf9b30dSLingrui98  val commPtrPlus1 = RegInit(FtqPtr(false.B, 1.U))
467f56177cbSJenius  val copied_ifu_ptr = Seq.fill(copyNum)(RegInit(FtqPtr(false.B, 0.U)))
468dc270d3bSJenius  val copied_bpu_ptr = Seq.fill(copyNum)(RegInit(FtqPtr(false.B, 0.U)))
4696bf9b30dSLingrui98  require(FtqSize >= 4)
470c5c5edaeSJenius  val ifuPtr_write       = WireInit(ifuPtr)
471c5c5edaeSJenius  val ifuPtrPlus1_write  = WireInit(ifuPtrPlus1)
4726bf9b30dSLingrui98  val ifuPtrPlus2_write  = WireInit(ifuPtrPlus2)
473c5c5edaeSJenius  val ifuWbPtr_write     = WireInit(ifuWbPtr)
474c5c5edaeSJenius  val commPtr_write      = WireInit(commPtr)
4756bf9b30dSLingrui98  val commPtrPlus1_write = WireInit(commPtrPlus1)
476c5c5edaeSJenius  ifuPtr       := ifuPtr_write
477c5c5edaeSJenius  ifuPtrPlus1  := ifuPtrPlus1_write
4786bf9b30dSLingrui98  ifuPtrPlus2  := ifuPtrPlus2_write
479c5c5edaeSJenius  ifuWbPtr     := ifuWbPtr_write
480c5c5edaeSJenius  commPtr      := commPtr_write
481f83ef67eSLingrui98  commPtrPlus1 := commPtrPlus1_write
482f56177cbSJenius  copied_ifu_ptr.map{ptr =>
483f56177cbSJenius    ptr := ifuPtr_write
484f56177cbSJenius    dontTouch(ptr)
485f56177cbSJenius  }
48609c6f1ddSLingrui98  val validEntries = distanceBetween(bpuPtr, commPtr)
48709c6f1ddSLingrui98
48809c6f1ddSLingrui98  // **********************************************************************
48909c6f1ddSLingrui98  // **************************** enq from bpu ****************************
49009c6f1ddSLingrui98  // **********************************************************************
49109c6f1ddSLingrui98  val new_entry_ready = validEntries < FtqSize.U
49209c6f1ddSLingrui98  io.fromBpu.resp.ready := new_entry_ready
49309c6f1ddSLingrui98
49409c6f1ddSLingrui98  val bpu_s2_resp = io.fromBpu.resp.bits.s2
495cb4f77ceSLingrui98  val bpu_s3_resp = io.fromBpu.resp.bits.s3
49609c6f1ddSLingrui98  val bpu_s2_redirect = bpu_s2_resp.valid && bpu_s2_resp.hasRedirect
497cb4f77ceSLingrui98  val bpu_s3_redirect = bpu_s3_resp.valid && bpu_s3_resp.hasRedirect
49809c6f1ddSLingrui98
49909c6f1ddSLingrui98  io.toBpu.enq_ptr := bpuPtr
50009c6f1ddSLingrui98  val enq_fire = io.fromBpu.resp.fire() && allowBpuIn // from bpu s1
501cb4f77ceSLingrui98  val bpu_in_fire = (io.fromBpu.resp.fire() || bpu_s2_redirect || bpu_s3_redirect) && allowBpuIn
50209c6f1ddSLingrui98
503b37e4b45SLingrui98  val bpu_in_resp = io.fromBpu.resp.bits.selectedResp
504b37e4b45SLingrui98  val bpu_in_stage = io.fromBpu.resp.bits.selectedRespIdx
50509c6f1ddSLingrui98  val bpu_in_resp_ptr = Mux(bpu_in_stage === BP_S1, bpuPtr, bpu_in_resp.ftq_idx)
50609c6f1ddSLingrui98  val bpu_in_resp_idx = bpu_in_resp_ptr.value
50709c6f1ddSLingrui98
508378f00d9SJenius  // read ports:      prefetchReq ++  ifuReq1 + ifuReq2 + ifuReq3 + commitUpdate2 + commitUpdate
509378f00d9SJenius  val ftq_pc_mem = Module(new FtqPcMemWrapper(1))
5106bf9b30dSLingrui98  // resp from uBTB
511c5c5edaeSJenius  ftq_pc_mem.io.wen := bpu_in_fire
512c5c5edaeSJenius  ftq_pc_mem.io.waddr := bpu_in_resp_idx
513c5c5edaeSJenius  ftq_pc_mem.io.wdata.fromBranchPrediction(bpu_in_resp)
51409c6f1ddSLingrui98
51509c6f1ddSLingrui98  //                                                            ifuRedirect + backendRedirect + commit
51609c6f1ddSLingrui98  val ftq_redirect_sram = Module(new FtqNRSRAM(new Ftq_Redirect_SRAMEntry, 1+1+1))
51709c6f1ddSLingrui98  // these info is intended to enq at the last stage of bpu
51809c6f1ddSLingrui98  ftq_redirect_sram.io.wen := io.fromBpu.resp.bits.lastStage.valid
51909c6f1ddSLingrui98  ftq_redirect_sram.io.waddr := io.fromBpu.resp.bits.lastStage.ftq_idx.value
520*c2d1ec7dSLingrui98  ftq_redirect_sram.io.wdata := io.fromBpu.resp.bits.last_stage_spec_info
52149cbc998SLingrui98  println(f"ftq redirect SRAM: entry ${ftq_redirect_sram.io.wdata.getWidth} * ${FtqSize} * 3")
52249cbc998SLingrui98  println(f"ftq redirect SRAM: ahead fh ${ftq_redirect_sram.io.wdata.afhob.getWidth} * ${FtqSize} * 3")
52309c6f1ddSLingrui98
52409c6f1ddSLingrui98  val ftq_meta_1r_sram = Module(new FtqNRSRAM(new Ftq_1R_SRAMEntry, 1))
52509c6f1ddSLingrui98  // these info is intended to enq at the last stage of bpu
52609c6f1ddSLingrui98  ftq_meta_1r_sram.io.wen := io.fromBpu.resp.bits.lastStage.valid
52709c6f1ddSLingrui98  ftq_meta_1r_sram.io.waddr := io.fromBpu.resp.bits.lastStage.ftq_idx.value
528*c2d1ec7dSLingrui98  ftq_meta_1r_sram.io.wdata.meta := io.fromBpu.resp.bits.last_stage_meta
52909c6f1ddSLingrui98  //                                                            ifuRedirect + backendRedirect + commit
53009c6f1ddSLingrui98  val ftb_entry_mem = Module(new SyncDataModuleTemplate(new FTBEntry, FtqSize, 1+1+1, 1))
53109c6f1ddSLingrui98  ftb_entry_mem.io.wen(0) := io.fromBpu.resp.bits.lastStage.valid
53209c6f1ddSLingrui98  ftb_entry_mem.io.waddr(0) := io.fromBpu.resp.bits.lastStage.ftq_idx.value
533*c2d1ec7dSLingrui98  ftb_entry_mem.io.wdata(0) := io.fromBpu.resp.bits.last_stage_ftb_entry
53409c6f1ddSLingrui98
53509c6f1ddSLingrui98
53609c6f1ddSLingrui98  // multi-write
537b0ed7239SLingrui98  val update_target = Reg(Vec(FtqSize, UInt(VAddrBits.W))) // could be taken target or fallThrough //TODO: remove this
5386bf9b30dSLingrui98  val newest_entry_target = Reg(UInt(VAddrBits.W))
5396bf9b30dSLingrui98  val newest_entry_ptr = Reg(new FtqPtr)
54009c6f1ddSLingrui98  val cfiIndex_vec = Reg(Vec(FtqSize, ValidUndirectioned(UInt(log2Ceil(PredictWidth).W))))
54109c6f1ddSLingrui98  val mispredict_vec = Reg(Vec(FtqSize, Vec(PredictWidth, Bool())))
54209c6f1ddSLingrui98  val pred_stage = Reg(Vec(FtqSize, UInt(2.W)))
54309c6f1ddSLingrui98
54409c6f1ddSLingrui98  val c_invalid :: c_valid :: c_commited :: Nil = Enum(3)
54509c6f1ddSLingrui98  val commitStateQueue = RegInit(VecInit(Seq.fill(FtqSize) {
54609c6f1ddSLingrui98    VecInit(Seq.fill(PredictWidth)(c_invalid))
54709c6f1ddSLingrui98  }))
54809c6f1ddSLingrui98
54909c6f1ddSLingrui98  val f_to_send :: f_sent :: Nil = Enum(2)
55009c6f1ddSLingrui98  val entry_fetch_status = RegInit(VecInit(Seq.fill(FtqSize)(f_sent)))
55109c6f1ddSLingrui98
55209c6f1ddSLingrui98  val h_not_hit :: h_false_hit :: h_hit :: Nil = Enum(3)
55309c6f1ddSLingrui98  val entry_hit_status = RegInit(VecInit(Seq.fill(FtqSize)(h_not_hit)))
55409c6f1ddSLingrui98
555f63797a4SLingrui98  // modify registers one cycle later to cut critical path
556f63797a4SLingrui98  val last_cycle_bpu_in = RegNext(bpu_in_fire)
5576bf9b30dSLingrui98  val last_cycle_bpu_in_ptr = RegNext(bpu_in_resp_ptr)
5586bf9b30dSLingrui98  val last_cycle_bpu_in_idx = last_cycle_bpu_in_ptr.value
5596bf9b30dSLingrui98  val last_cycle_bpu_target = RegNext(bpu_in_resp.getTarget)
560f63797a4SLingrui98  val last_cycle_cfiIndex = RegNext(bpu_in_resp.cfiIndex)
561f63797a4SLingrui98  val last_cycle_bpu_in_stage = RegNext(bpu_in_stage)
562f56177cbSJenius
5637be982afSLingrui98  def extra_copyNum_for_commitStateQueue = 2
5647be982afSLingrui98  val copied_last_cycle_bpu_in = VecInit(Seq.fill(copyNum+extra_copyNum_for_commitStateQueue)(RegNext(bpu_in_fire)))
5657be982afSLingrui98  val copied_last_cycle_bpu_in_ptr_for_ftq = VecInit(Seq.fill(extra_copyNum_for_commitStateQueue)(RegNext(bpu_in_resp_ptr)))
566f56177cbSJenius
567f63797a4SLingrui98  when (last_cycle_bpu_in) {
568f63797a4SLingrui98    entry_fetch_status(last_cycle_bpu_in_idx) := f_to_send
569f63797a4SLingrui98    cfiIndex_vec(last_cycle_bpu_in_idx) := last_cycle_cfiIndex
570f63797a4SLingrui98    pred_stage(last_cycle_bpu_in_idx) := last_cycle_bpu_in_stage
5716bf9b30dSLingrui98
572b0ed7239SLingrui98    update_target(last_cycle_bpu_in_idx) := last_cycle_bpu_target // TODO: remove this
5736bf9b30dSLingrui98    newest_entry_target := last_cycle_bpu_target
5746bf9b30dSLingrui98    newest_entry_ptr := last_cycle_bpu_in_ptr
57509c6f1ddSLingrui98  }
57609c6f1ddSLingrui98
5777be982afSLingrui98  // reduce fanout by delay write for a cycle
5787be982afSLingrui98  when (RegNext(last_cycle_bpu_in)) {
5797be982afSLingrui98    mispredict_vec(RegNext(last_cycle_bpu_in_idx)) := WireInit(VecInit(Seq.fill(PredictWidth)(false.B)))
5807be982afSLingrui98  }
5817be982afSLingrui98
5827be982afSLingrui98  // reduce fanout using copied last_cycle_bpu_in and copied last_cycle_bpu_in_ptr
5837be982afSLingrui98  val copied_last_cycle_bpu_in_for_ftq = copied_last_cycle_bpu_in.takeRight(extra_copyNum_for_commitStateQueue)
5847be982afSLingrui98  copied_last_cycle_bpu_in_for_ftq.zip(copied_last_cycle_bpu_in_ptr_for_ftq).zipWithIndex.map {
5857be982afSLingrui98    case ((in, ptr), i) =>
5867be982afSLingrui98      when (in) {
5877be982afSLingrui98        val perSetEntries = FtqSize / extra_copyNum_for_commitStateQueue // 32
5887be982afSLingrui98        require(FtqSize % extra_copyNum_for_commitStateQueue == 0)
5897be982afSLingrui98        for (j <- 0 until perSetEntries) {
5909361b0c5SLingrui98          when (ptr.value === (i*perSetEntries+j).U) {
5917be982afSLingrui98            commitStateQueue(i*perSetEntries+j) := VecInit(Seq.fill(PredictWidth)(c_invalid))
5927be982afSLingrui98          }
5937be982afSLingrui98        }
5947be982afSLingrui98      }
5959361b0c5SLingrui98  }
5967be982afSLingrui98
597873dc383SLingrui98  // num cycle is fixed
598873dc383SLingrui98  io.toBackend.newest_entry_ptr := RegNext(newest_entry_ptr)
599873dc383SLingrui98  io.toBackend.newest_entry_target := RegNext(newest_entry_target)
600873dc383SLingrui98
601f63797a4SLingrui98
60209c6f1ddSLingrui98  bpuPtr := bpuPtr + enq_fire
603dc270d3bSJenius  copied_bpu_ptr.map(_ := bpuPtr + enq_fire)
604c9bc5480SLingrui98  when (io.toIfu.req.fire && allowToIfu) {
605c5c5edaeSJenius    ifuPtr_write := ifuPtrPlus1
6066bf9b30dSLingrui98    ifuPtrPlus1_write := ifuPtrPlus2
6076bf9b30dSLingrui98    ifuPtrPlus2_write := ifuPtrPlus2 + 1.U
608c9bc5480SLingrui98  }
60909c6f1ddSLingrui98
61009c6f1ddSLingrui98  // only use ftb result to assign hit status
61109c6f1ddSLingrui98  when (bpu_s2_resp.valid) {
612b37e4b45SLingrui98    entry_hit_status(bpu_s2_resp.ftq_idx.value) := Mux(bpu_s2_resp.full_pred.hit, h_hit, h_not_hit)
61309c6f1ddSLingrui98  }
61409c6f1ddSLingrui98
61509c6f1ddSLingrui98
6162f4a3aa4SLingrui98  io.toIfu.flushFromBpu.s2.valid := bpu_s2_redirect
61709c6f1ddSLingrui98  io.toIfu.flushFromBpu.s2.bits := bpu_s2_resp.ftq_idx
61809c6f1ddSLingrui98  when (bpu_s2_resp.valid && bpu_s2_resp.hasRedirect) {
61909c6f1ddSLingrui98    bpuPtr := bpu_s2_resp.ftq_idx + 1.U
620dc270d3bSJenius    copied_bpu_ptr.map(_ := bpu_s2_resp.ftq_idx + 1.U)
62109c6f1ddSLingrui98    // only when ifuPtr runs ahead of bpu s2 resp should we recover it
62209c6f1ddSLingrui98    when (!isBefore(ifuPtr, bpu_s2_resp.ftq_idx)) {
623c5c5edaeSJenius      ifuPtr_write := bpu_s2_resp.ftq_idx
624c5c5edaeSJenius      ifuPtrPlus1_write := bpu_s2_resp.ftq_idx + 1.U
6256bf9b30dSLingrui98      ifuPtrPlus2_write := bpu_s2_resp.ftq_idx + 2.U
62609c6f1ddSLingrui98    }
62709c6f1ddSLingrui98  }
62809c6f1ddSLingrui98
629cb4f77ceSLingrui98  io.toIfu.flushFromBpu.s3.valid := bpu_s3_redirect
630cb4f77ceSLingrui98  io.toIfu.flushFromBpu.s3.bits := bpu_s3_resp.ftq_idx
631cb4f77ceSLingrui98  when (bpu_s3_resp.valid && bpu_s3_resp.hasRedirect) {
632cb4f77ceSLingrui98    bpuPtr := bpu_s3_resp.ftq_idx + 1.U
633dc270d3bSJenius    copied_bpu_ptr.map(_ := bpu_s3_resp.ftq_idx + 1.U)
634cb4f77ceSLingrui98    // only when ifuPtr runs ahead of bpu s2 resp should we recover it
635cb4f77ceSLingrui98    when (!isBefore(ifuPtr, bpu_s3_resp.ftq_idx)) {
636c5c5edaeSJenius      ifuPtr_write := bpu_s3_resp.ftq_idx
637c5c5edaeSJenius      ifuPtrPlus1_write := bpu_s3_resp.ftq_idx + 1.U
6386bf9b30dSLingrui98      ifuPtrPlus2_write := bpu_s3_resp.ftq_idx + 2.U
639cb4f77ceSLingrui98    }
640cb4f77ceSLingrui98  }
641cb4f77ceSLingrui98
64209c6f1ddSLingrui98  XSError(isBefore(bpuPtr, ifuPtr) && !isFull(bpuPtr, ifuPtr), "\nifuPtr is before bpuPtr!\n")
64309c6f1ddSLingrui98
644dc270d3bSJenius  (0 until copyNum).map{i =>
645dc270d3bSJenius    XSError(copied_bpu_ptr(i) =/= bpuPtr, "\ncopiedBpuPtr is different from bpuPtr!\n")
646dc270d3bSJenius  }
647dc270d3bSJenius
64809c6f1ddSLingrui98  // ****************************************************************
64909c6f1ddSLingrui98  // **************************** to ifu ****************************
65009c6f1ddSLingrui98  // ****************************************************************
651f22cf846SJenius  // 0  for ifu, and 1-4 for ICache
652f56177cbSJenius  val bpu_in_bypass_buf = RegEnable(ftq_pc_mem.io.wdata, enable=bpu_in_fire)
653f56177cbSJenius  val copied_bpu_in_bypass_buf = VecInit(Seq.fill(copyNum)(RegEnable(ftq_pc_mem.io.wdata, enable=bpu_in_fire)))
654f56177cbSJenius  val bpu_in_bypass_buf_for_ifu = bpu_in_bypass_buf
65509c6f1ddSLingrui98  val bpu_in_bypass_ptr = RegNext(bpu_in_resp_ptr)
65609c6f1ddSLingrui98  val last_cycle_to_ifu_fire = RegNext(io.toIfu.req.fire)
65709c6f1ddSLingrui98
658f56177cbSJenius  val copied_bpu_in_bypass_ptr = VecInit(Seq.fill(copyNum)(RegNext(bpu_in_resp_ptr)))
659f56177cbSJenius  val copied_last_cycle_to_ifu_fire = VecInit(Seq.fill(copyNum)(RegNext(io.toIfu.req.fire)))
66088bc4f90SLingrui98
66109c6f1ddSLingrui98  // read pc and target
6626bf9b30dSLingrui98  ftq_pc_mem.io.ifuPtr_w       := ifuPtr_write
6636bf9b30dSLingrui98  ftq_pc_mem.io.ifuPtrPlus1_w  := ifuPtrPlus1_write
6646bf9b30dSLingrui98  ftq_pc_mem.io.ifuPtrPlus2_w  := ifuPtrPlus2_write
6656bf9b30dSLingrui98  ftq_pc_mem.io.commPtr_w      := commPtr_write
6666bf9b30dSLingrui98  ftq_pc_mem.io.commPtrPlus1_w := commPtrPlus1_write
667c5c5edaeSJenius
66809c6f1ddSLingrui98
6695ff19bd8SLingrui98  io.toIfu.req.bits.ftqIdx := ifuPtr
670f63797a4SLingrui98
671f56177cbSJenius  val toICachePcBundle = Wire(Vec(copyNum,new Ftq_RF_Components))
672dc270d3bSJenius  val toICacheEntryToSend = Wire(Vec(copyNum,Bool()))
673b37e4b45SLingrui98  val toIfuPcBundle = Wire(new Ftq_RF_Components)
674f63797a4SLingrui98  val entry_is_to_send = WireInit(entry_fetch_status(ifuPtr.value) === f_to_send)
675f63797a4SLingrui98  val entry_ftq_offset = WireInit(cfiIndex_vec(ifuPtr.value))
6766bf9b30dSLingrui98  val entry_next_addr  = Wire(UInt(VAddrBits.W))
677b004fa13SJenius
678f56177cbSJenius  val pc_mem_ifu_ptr_rdata   = VecInit(Seq.fill(copyNum)(RegNext(ftq_pc_mem.io.ifuPtr_rdata)))
679f56177cbSJenius  val pc_mem_ifu_plus1_rdata = VecInit(Seq.fill(copyNum)(RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata)))
680b0ed7239SLingrui98  val diff_entry_next_addr = WireInit(update_target(ifuPtr.value)) //TODO: remove this
681f63797a4SLingrui98
682dc270d3bSJenius  val copied_ifu_plus1_to_send = VecInit(Seq.fill(copyNum)(RegNext(entry_fetch_status(ifuPtrPlus1.value) === f_to_send) || RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1))))
683dc270d3bSJenius  val copied_ifu_ptr_to_send   = VecInit(Seq.fill(copyNum)(RegNext(entry_fetch_status(ifuPtr.value) === f_to_send) || RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr)))
684dc270d3bSJenius
685f56177cbSJenius  for(i <- 0 until copyNum){
686f56177cbSJenius    when(copied_last_cycle_bpu_in(i) && copied_bpu_in_bypass_ptr(i) === copied_ifu_ptr(i)){
687f56177cbSJenius      toICachePcBundle(i) := copied_bpu_in_bypass_buf(i)
688dc270d3bSJenius      toICacheEntryToSend(i)   := true.B
689f56177cbSJenius    }.elsewhen(copied_last_cycle_to_ifu_fire(i)){
690f56177cbSJenius      toICachePcBundle(i) := pc_mem_ifu_plus1_rdata(i)
691dc270d3bSJenius      toICacheEntryToSend(i)   := copied_ifu_plus1_to_send(i)
692f56177cbSJenius    }.otherwise{
693f56177cbSJenius      toICachePcBundle(i) := pc_mem_ifu_ptr_rdata(i)
694dc270d3bSJenius      toICacheEntryToSend(i)   := copied_ifu_ptr_to_send(i)
695f56177cbSJenius    }
696f56177cbSJenius  }
697f56177cbSJenius
698873dc383SLingrui98  // TODO: reconsider target address bypass logic
69909c6f1ddSLingrui98  when (last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr) {
70088bc4f90SLingrui98    toIfuPcBundle := bpu_in_bypass_buf_for_ifu
701f678dd91SSteve Gou    entry_is_to_send := true.B
7026bf9b30dSLingrui98    entry_next_addr := last_cycle_bpu_target
703f63797a4SLingrui98    entry_ftq_offset := last_cycle_cfiIndex
704b0ed7239SLingrui98    diff_entry_next_addr := last_cycle_bpu_target // TODO: remove this
70509c6f1ddSLingrui98  }.elsewhen (last_cycle_to_ifu_fire) {
706c5c5edaeSJenius    toIfuPcBundle := RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata)
707c5c5edaeSJenius    entry_is_to_send := RegNext(entry_fetch_status(ifuPtrPlus1.value) === f_to_send) ||
708c5c5edaeSJenius                        RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1)) // reduce potential bubbles
709ed434d67SLingrui98    entry_next_addr := Mux(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1),
71088bc4f90SLingrui98                          bpu_in_bypass_buf_for_ifu.startAddr,
711fef810c0SLingrui98                          Mux(ifuPtr === newest_entry_ptr,
7126bf9b30dSLingrui98                            newest_entry_target,
713f83ef67eSLingrui98                            RegNext(ftq_pc_mem.io.ifuPtrPlus2_rdata.startAddr))) // ifuPtr+2
714c5c5edaeSJenius  }.otherwise {
715c5c5edaeSJenius    toIfuPcBundle := RegNext(ftq_pc_mem.io.ifuPtr_rdata)
71628f2cf58SLingrui98    entry_is_to_send := RegNext(entry_fetch_status(ifuPtr.value) === f_to_send) ||
71728f2cf58SLingrui98                        RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr) // reduce potential bubbles
7186bf9b30dSLingrui98    entry_next_addr := Mux(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1),
71988bc4f90SLingrui98                          bpu_in_bypass_buf_for_ifu.startAddr,
720fef810c0SLingrui98                          Mux(ifuPtr === newest_entry_ptr,
7216bf9b30dSLingrui98                            newest_entry_target,
722f83ef67eSLingrui98                            RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata.startAddr))) // ifuPtr+1
72309c6f1ddSLingrui98  }
72409c6f1ddSLingrui98
725f678dd91SSteve Gou  io.toIfu.req.valid := entry_is_to_send && ifuPtr =/= bpuPtr
726f63797a4SLingrui98  io.toIfu.req.bits.nextStartAddr := entry_next_addr
727f63797a4SLingrui98  io.toIfu.req.bits.ftqOffset := entry_ftq_offset
728b37e4b45SLingrui98  io.toIfu.req.bits.fromFtqPcBundle(toIfuPcBundle)
729c5c5edaeSJenius
730c5c5edaeSJenius  io.toICache.req.valid := entry_is_to_send && ifuPtr =/= bpuPtr
731dc270d3bSJenius  io.toICache.req.bits.readValid.zipWithIndex.map{case(copy, i) => copy := toICacheEntryToSend(i) && copied_ifu_ptr(i) =/= copied_bpu_ptr(i)}
732b004fa13SJenius  io.toICache.req.bits.pcMemRead.zipWithIndex.map{case(copy,i) => copy.fromFtqPcBundle(toICachePcBundle(i))}
733b004fa13SJenius  // io.toICache.req.bits.bypassSelect := last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr
734b004fa13SJenius  // io.toICache.req.bits.bpuBypassWrite.zipWithIndex.map{case(bypassWrtie, i) =>
735b004fa13SJenius  //   bypassWrtie.startAddr := bpu_in_bypass_buf.tail(i).startAddr
736b004fa13SJenius  //   bypassWrtie.nextlineStart := bpu_in_bypass_buf.tail(i).nextLineAddr
737b004fa13SJenius  // }
738f22cf846SJenius
739b0ed7239SLingrui98  // TODO: remove this
740b0ed7239SLingrui98  XSError(io.toIfu.req.valid && diff_entry_next_addr =/= entry_next_addr,
7415a674179SLingrui98          p"\nifu_req_target wrong! ifuPtr: ${ifuPtr}, entry_next_addr: ${Hexadecimal(entry_next_addr)} diff_entry_next_addr: ${Hexadecimal(diff_entry_next_addr)}\n")
742b0ed7239SLingrui98
74309c6f1ddSLingrui98  // when fall through is smaller in value than start address, there must be a false hit
744b37e4b45SLingrui98  when (toIfuPcBundle.fallThruError && entry_hit_status(ifuPtr.value) === h_hit) {
74509c6f1ddSLingrui98    when (io.toIfu.req.fire &&
746cb4f77ceSLingrui98      !(bpu_s2_redirect && bpu_s2_resp.ftq_idx === ifuPtr) &&
747cb4f77ceSLingrui98      !(bpu_s3_redirect && bpu_s3_resp.ftq_idx === ifuPtr)
74809c6f1ddSLingrui98    ) {
74909c6f1ddSLingrui98      entry_hit_status(ifuPtr.value) := h_false_hit
750352db50aSLingrui98      // XSError(true.B, "FTB false hit by fallThroughError, startAddr: %x, fallTHru: %x\n", io.toIfu.req.bits.startAddr, io.toIfu.req.bits.nextStartAddr)
75109c6f1ddSLingrui98    }
752b37e4b45SLingrui98    XSDebug(true.B, "fallThruError! start:%x, fallThru:%x\n", io.toIfu.req.bits.startAddr, io.toIfu.req.bits.nextStartAddr)
75309c6f1ddSLingrui98  }
75409c6f1ddSLingrui98
755a60a2901SLingrui98  XSPerfAccumulate(f"fall_through_error_to_ifu", toIfuPcBundle.fallThruError && entry_hit_status(ifuPtr.value) === h_hit &&
756a60a2901SLingrui98    io.toIfu.req.fire && !(bpu_s2_redirect && bpu_s2_resp.ftq_idx === ifuPtr) && !(bpu_s3_redirect && bpu_s3_resp.ftq_idx === ifuPtr))
757a60a2901SLingrui98
75809c6f1ddSLingrui98  val ifu_req_should_be_flushed =
759cb4f77ceSLingrui98    io.toIfu.flushFromBpu.shouldFlushByStage2(io.toIfu.req.bits.ftqIdx) ||
760cb4f77ceSLingrui98    io.toIfu.flushFromBpu.shouldFlushByStage3(io.toIfu.req.bits.ftqIdx)
76109c6f1ddSLingrui98
76209c6f1ddSLingrui98    when (io.toIfu.req.fire && !ifu_req_should_be_flushed) {
76309c6f1ddSLingrui98      entry_fetch_status(ifuPtr.value) := f_sent
76409c6f1ddSLingrui98    }
76509c6f1ddSLingrui98
76609c6f1ddSLingrui98  // *********************************************************************
76709c6f1ddSLingrui98  // **************************** wb from ifu ****************************
76809c6f1ddSLingrui98  // *********************************************************************
76909c6f1ddSLingrui98  val pdWb = io.fromIfu.pdWb
77009c6f1ddSLingrui98  val pds = pdWb.bits.pd
77109c6f1ddSLingrui98  val ifu_wb_valid = pdWb.valid
77209c6f1ddSLingrui98  val ifu_wb_idx = pdWb.bits.ftqIdx.value
77309c6f1ddSLingrui98  // read ports:                                                         commit update
77409c6f1ddSLingrui98  val ftq_pd_mem = Module(new SyncDataModuleTemplate(new Ftq_pd_Entry, FtqSize, 1, 1))
77509c6f1ddSLingrui98  ftq_pd_mem.io.wen(0) := ifu_wb_valid
77609c6f1ddSLingrui98  ftq_pd_mem.io.waddr(0) := pdWb.bits.ftqIdx.value
77709c6f1ddSLingrui98  ftq_pd_mem.io.wdata(0).fromPdWb(pdWb.bits)
77809c6f1ddSLingrui98
77909c6f1ddSLingrui98  val hit_pd_valid = entry_hit_status(ifu_wb_idx) === h_hit && ifu_wb_valid
78009c6f1ddSLingrui98  val hit_pd_mispred = hit_pd_valid && pdWb.bits.misOffset.valid
78109c6f1ddSLingrui98  val hit_pd_mispred_reg = RegNext(hit_pd_mispred, init=false.B)
782005e809bSJiuyang Liu  val pd_reg       = RegEnable(pds,             pdWb.valid)
783005e809bSJiuyang Liu  val start_pc_reg = RegEnable(pdWb.bits.pc(0), pdWb.valid)
784005e809bSJiuyang Liu  val wb_idx_reg   = RegEnable(ifu_wb_idx,      pdWb.valid)
78509c6f1ddSLingrui98
78609c6f1ddSLingrui98  when (ifu_wb_valid) {
78709c6f1ddSLingrui98    val comm_stq_wen = VecInit(pds.map(_.valid).zip(pdWb.bits.instrRange).map{
78809c6f1ddSLingrui98      case (v, inRange) => v && inRange
78909c6f1ddSLingrui98    })
79009c6f1ddSLingrui98    (commitStateQueue(ifu_wb_idx) zip comm_stq_wen).map{
79109c6f1ddSLingrui98      case (qe, v) => when (v) { qe := c_valid }
79209c6f1ddSLingrui98    }
79309c6f1ddSLingrui98  }
79409c6f1ddSLingrui98
795c5c5edaeSJenius  when (ifu_wb_valid) {
796c5c5edaeSJenius    ifuWbPtr_write := ifuWbPtr + 1.U
797c5c5edaeSJenius  }
79809c6f1ddSLingrui98
79909c6f1ddSLingrui98  ftb_entry_mem.io.raddr.head := ifu_wb_idx
80009c6f1ddSLingrui98  val has_false_hit = WireInit(false.B)
80109c6f1ddSLingrui98  when (RegNext(hit_pd_valid)) {
80209c6f1ddSLingrui98    // check for false hit
80309c6f1ddSLingrui98    val pred_ftb_entry = ftb_entry_mem.io.rdata.head
804eeb5ff92SLingrui98    val brSlots = pred_ftb_entry.brSlots
805eeb5ff92SLingrui98    val tailSlot = pred_ftb_entry.tailSlot
80609c6f1ddSLingrui98    // we check cfis that bpu predicted
80709c6f1ddSLingrui98
808eeb5ff92SLingrui98    // bpu predicted branches but denied by predecode
809eeb5ff92SLingrui98    val br_false_hit =
810eeb5ff92SLingrui98      brSlots.map{
811eeb5ff92SLingrui98        s => s.valid && !(pd_reg(s.offset).valid && pd_reg(s.offset).isBr)
812eeb5ff92SLingrui98      }.reduce(_||_) ||
813b37e4b45SLingrui98      (tailSlot.valid && pred_ftb_entry.tailSlot.sharing &&
814eeb5ff92SLingrui98        !(pd_reg(tailSlot.offset).valid && pd_reg(tailSlot.offset).isBr))
815eeb5ff92SLingrui98
816eeb5ff92SLingrui98    val jmpOffset = tailSlot.offset
81709c6f1ddSLingrui98    val jmp_pd = pd_reg(jmpOffset)
81809c6f1ddSLingrui98    val jal_false_hit = pred_ftb_entry.jmpValid &&
81909c6f1ddSLingrui98      ((pred_ftb_entry.isJal  && !(jmp_pd.valid && jmp_pd.isJal)) ||
82009c6f1ddSLingrui98       (pred_ftb_entry.isJalr && !(jmp_pd.valid && jmp_pd.isJalr)) ||
82109c6f1ddSLingrui98       (pred_ftb_entry.isCall && !(jmp_pd.valid && jmp_pd.isCall)) ||
82209c6f1ddSLingrui98       (pred_ftb_entry.isRet  && !(jmp_pd.valid && jmp_pd.isRet))
82309c6f1ddSLingrui98      )
82409c6f1ddSLingrui98
82509c6f1ddSLingrui98    has_false_hit := br_false_hit || jal_false_hit || hit_pd_mispred_reg
82665fddcf0Szoujr    XSDebug(has_false_hit, "FTB false hit by br or jal or hit_pd, startAddr: %x\n", pdWb.bits.pc(0))
82765fddcf0Szoujr
828352db50aSLingrui98    // assert(!has_false_hit)
82909c6f1ddSLingrui98  }
83009c6f1ddSLingrui98
83109c6f1ddSLingrui98  when (has_false_hit) {
83209c6f1ddSLingrui98    entry_hit_status(wb_idx_reg) := h_false_hit
83309c6f1ddSLingrui98  }
83409c6f1ddSLingrui98
83509c6f1ddSLingrui98
83609c6f1ddSLingrui98  // **********************************************************************
837b56f947eSYinan Xu  // ***************************** to backend *****************************
83809c6f1ddSLingrui98  // **********************************************************************
839b56f947eSYinan Xu  // to backend pc mem / target
840b56f947eSYinan Xu  io.toBackend.pc_mem_wen   := RegNext(last_cycle_bpu_in)
841b56f947eSYinan Xu  io.toBackend.pc_mem_waddr := RegNext(last_cycle_bpu_in_idx)
84288bc4f90SLingrui98  io.toBackend.pc_mem_wdata := RegNext(bpu_in_bypass_buf_for_ifu)
84309c6f1ddSLingrui98
84409c6f1ddSLingrui98  // *******************************************************************************
84509c6f1ddSLingrui98  // **************************** redirect from backend ****************************
84609c6f1ddSLingrui98  // *******************************************************************************
84709c6f1ddSLingrui98
84809c6f1ddSLingrui98  // redirect read cfiInfo, couples to redirectGen s2
8492e1be6e1SSteve Gou  ftq_redirect_sram.io.ren.init.last := backendRedirect.valid
8502e1be6e1SSteve Gou  ftq_redirect_sram.io.raddr.init.last := backendRedirect.bits.ftqIdx.value
85109c6f1ddSLingrui98
8522e1be6e1SSteve Gou  ftb_entry_mem.io.raddr.init.last := backendRedirect.bits.ftqIdx.value
85309c6f1ddSLingrui98
85409c6f1ddSLingrui98  val stage3CfiInfo = ftq_redirect_sram.io.rdata.init.last
855df5b4b8eSYinan Xu  val fromBackendRedirect = WireInit(backendRedirectReg)
85609c6f1ddSLingrui98  val backendRedirectCfi = fromBackendRedirect.bits.cfiUpdate
85709c6f1ddSLingrui98  backendRedirectCfi.fromFtqRedirectSram(stage3CfiInfo)
85809c6f1ddSLingrui98
85909c6f1ddSLingrui98  val r_ftb_entry = ftb_entry_mem.io.rdata.init.last
86009c6f1ddSLingrui98  val r_ftqOffset = fromBackendRedirect.bits.ftqOffset
86109c6f1ddSLingrui98
86209c6f1ddSLingrui98  when (entry_hit_status(fromBackendRedirect.bits.ftqIdx.value) === h_hit) {
86309c6f1ddSLingrui98    backendRedirectCfi.shift := PopCount(r_ftb_entry.getBrMaskByOffset(r_ftqOffset)) +&
86409c6f1ddSLingrui98      (backendRedirectCfi.pd.isBr && !r_ftb_entry.brIsSaved(r_ftqOffset) &&
865eeb5ff92SLingrui98      !r_ftb_entry.newBrCanNotInsert(r_ftqOffset))
86609c6f1ddSLingrui98
86709c6f1ddSLingrui98    backendRedirectCfi.addIntoHist := backendRedirectCfi.pd.isBr && (r_ftb_entry.brIsSaved(r_ftqOffset) ||
868eeb5ff92SLingrui98        !r_ftb_entry.newBrCanNotInsert(r_ftqOffset))
86909c6f1ddSLingrui98  }.otherwise {
87009c6f1ddSLingrui98    backendRedirectCfi.shift := (backendRedirectCfi.pd.isBr && backendRedirectCfi.taken).asUInt
87109c6f1ddSLingrui98    backendRedirectCfi.addIntoHist := backendRedirectCfi.pd.isBr.asUInt
87209c6f1ddSLingrui98  }
87309c6f1ddSLingrui98
87409c6f1ddSLingrui98
87509c6f1ddSLingrui98  // ***************************************************************************
87609c6f1ddSLingrui98  // **************************** redirect from ifu ****************************
87709c6f1ddSLingrui98  // ***************************************************************************
87809c6f1ddSLingrui98  val fromIfuRedirect = WireInit(0.U.asTypeOf(Valid(new Redirect)))
87909c6f1ddSLingrui98  fromIfuRedirect.valid := pdWb.valid && pdWb.bits.misOffset.valid && !backendFlush
88009c6f1ddSLingrui98  fromIfuRedirect.bits.ftqIdx := pdWb.bits.ftqIdx
88109c6f1ddSLingrui98  fromIfuRedirect.bits.ftqOffset := pdWb.bits.misOffset.bits
88209c6f1ddSLingrui98  fromIfuRedirect.bits.level := RedirectLevel.flushAfter
88309c6f1ddSLingrui98
88409c6f1ddSLingrui98  val ifuRedirectCfiUpdate = fromIfuRedirect.bits.cfiUpdate
88509c6f1ddSLingrui98  ifuRedirectCfiUpdate.pc := pdWb.bits.pc(pdWb.bits.misOffset.bits)
88609c6f1ddSLingrui98  ifuRedirectCfiUpdate.pd := pdWb.bits.pd(pdWb.bits.misOffset.bits)
88709c6f1ddSLingrui98  ifuRedirectCfiUpdate.predTaken := cfiIndex_vec(pdWb.bits.ftqIdx.value).valid
88809c6f1ddSLingrui98  ifuRedirectCfiUpdate.target := pdWb.bits.target
88909c6f1ddSLingrui98  ifuRedirectCfiUpdate.taken := pdWb.bits.cfiOffset.valid
89009c6f1ddSLingrui98  ifuRedirectCfiUpdate.isMisPred := pdWb.bits.misOffset.valid
89109c6f1ddSLingrui98
89209c6f1ddSLingrui98  val ifuRedirectReg = RegNext(fromIfuRedirect, init=0.U.asTypeOf(Valid(new Redirect)))
89309c6f1ddSLingrui98  val ifuRedirectToBpu = WireInit(ifuRedirectReg)
89409c6f1ddSLingrui98  ifuFlush := fromIfuRedirect.valid || ifuRedirectToBpu.valid
89509c6f1ddSLingrui98
89609c6f1ddSLingrui98  ftq_redirect_sram.io.ren.head := fromIfuRedirect.valid
89709c6f1ddSLingrui98  ftq_redirect_sram.io.raddr.head := fromIfuRedirect.bits.ftqIdx.value
89809c6f1ddSLingrui98
89909c6f1ddSLingrui98  ftb_entry_mem.io.raddr.head := fromIfuRedirect.bits.ftqIdx.value
90009c6f1ddSLingrui98
90109c6f1ddSLingrui98  val toBpuCfi = ifuRedirectToBpu.bits.cfiUpdate
90209c6f1ddSLingrui98  toBpuCfi.fromFtqRedirectSram(ftq_redirect_sram.io.rdata.head)
90309c6f1ddSLingrui98  when (ifuRedirectReg.bits.cfiUpdate.pd.isRet) {
90409c6f1ddSLingrui98    toBpuCfi.target := toBpuCfi.rasEntry.retAddr
90509c6f1ddSLingrui98  }
90609c6f1ddSLingrui98
90709c6f1ddSLingrui98  // *********************************************************************
90809c6f1ddSLingrui98  // **************************** wb from exu ****************************
90909c6f1ddSLingrui98  // *********************************************************************
91009c6f1ddSLingrui98
911b56f947eSYinan Xu  backendRedirect := io.fromBackend.redirect
9122e1be6e1SSteve Gou
91309c6f1ddSLingrui98  def extractRedirectInfo(wb: Valid[Redirect]) = {
9146bf9b30dSLingrui98    val ftqPtr = wb.bits.ftqIdx
91509c6f1ddSLingrui98    val ftqOffset = wb.bits.ftqOffset
91609c6f1ddSLingrui98    val taken = wb.bits.cfiUpdate.taken
91709c6f1ddSLingrui98    val mispred = wb.bits.cfiUpdate.isMisPred
9186bf9b30dSLingrui98    (wb.valid, ftqPtr, ftqOffset, taken, mispred)
91909c6f1ddSLingrui98  }
92009c6f1ddSLingrui98
92109c6f1ddSLingrui98  // fix mispredict entry
92209c6f1ddSLingrui98  val lastIsMispredict = RegNext(
923df5b4b8eSYinan Xu    backendRedirect.valid && backendRedirect.bits.level === RedirectLevel.flushAfter, init = false.B
92409c6f1ddSLingrui98  )
92509c6f1ddSLingrui98
92609c6f1ddSLingrui98  def updateCfiInfo(redirect: Valid[Redirect], isBackend: Boolean = true) = {
9276bf9b30dSLingrui98    val (r_valid, r_ptr, r_offset, r_taken, r_mispred) = extractRedirectInfo(redirect)
9286bf9b30dSLingrui98    val r_idx = r_ptr.value
92909c6f1ddSLingrui98    val cfiIndex_bits_wen = r_valid && r_taken && r_offset < cfiIndex_vec(r_idx).bits
93009c6f1ddSLingrui98    val cfiIndex_valid_wen = r_valid && r_offset === cfiIndex_vec(r_idx).bits
93109c6f1ddSLingrui98    when (cfiIndex_bits_wen || cfiIndex_valid_wen) {
93209c6f1ddSLingrui98      cfiIndex_vec(r_idx).valid := cfiIndex_bits_wen || cfiIndex_valid_wen && r_taken
93309c6f1ddSLingrui98    }
93409c6f1ddSLingrui98    when (cfiIndex_bits_wen) {
93509c6f1ddSLingrui98      cfiIndex_vec(r_idx).bits := r_offset
93609c6f1ddSLingrui98    }
9376bf9b30dSLingrui98    newest_entry_target := redirect.bits.cfiUpdate.target
938873dc383SLingrui98    newest_entry_ptr := r_ptr
939b0ed7239SLingrui98    update_target(r_idx) := redirect.bits.cfiUpdate.target // TODO: remove this
94009c6f1ddSLingrui98    if (isBackend) {
94109c6f1ddSLingrui98      mispredict_vec(r_idx)(r_offset) := r_mispred
94209c6f1ddSLingrui98    }
94309c6f1ddSLingrui98  }
94409c6f1ddSLingrui98
94581e362d8SLingrui98  when(backendRedirectReg.valid) {
946df5b4b8eSYinan Xu    updateCfiInfo(backendRedirectReg)
94709c6f1ddSLingrui98  }.elsewhen (ifuRedirectToBpu.valid) {
94809c6f1ddSLingrui98    updateCfiInfo(ifuRedirectToBpu, isBackend=false)
94909c6f1ddSLingrui98  }
95009c6f1ddSLingrui98
95109c6f1ddSLingrui98  // ***********************************************************************************
95209c6f1ddSLingrui98  // **************************** flush ptr and state queue ****************************
95309c6f1ddSLingrui98  // ***********************************************************************************
95409c6f1ddSLingrui98
955df5b4b8eSYinan Xu  val redirectVec = VecInit(backendRedirect, fromIfuRedirect)
95609c6f1ddSLingrui98
95709c6f1ddSLingrui98  // when redirect, we should reset ptrs and status queues
95809c6f1ddSLingrui98  when(redirectVec.map(r => r.valid).reduce(_||_)){
9592f4a3aa4SLingrui98    val r = PriorityMux(redirectVec.map(r => (r.valid -> r.bits)))
96009c6f1ddSLingrui98    val notIfu = redirectVec.dropRight(1).map(r => r.valid).reduce(_||_)
9612f4a3aa4SLingrui98    val (idx, offset, flushItSelf) = (r.ftqIdx, r.ftqOffset, RedirectLevel.flushItself(r.level))
96209c6f1ddSLingrui98    val next = idx + 1.U
96309c6f1ddSLingrui98    bpuPtr := next
964dc270d3bSJenius    copied_bpu_ptr.map(_ := next)
965c5c5edaeSJenius    ifuPtr_write := next
966c5c5edaeSJenius    ifuWbPtr_write := next
967c5c5edaeSJenius    ifuPtrPlus1_write := idx + 2.U
9686bf9b30dSLingrui98    ifuPtrPlus2_write := idx + 3.U
96909c6f1ddSLingrui98    when (notIfu) {
97009c6f1ddSLingrui98      commitStateQueue(idx.value).zipWithIndex.foreach({ case (s, i) =>
97109c6f1ddSLingrui98        when(i.U > offset || i.U === offset && flushItSelf){
97209c6f1ddSLingrui98          s := c_invalid
97309c6f1ddSLingrui98        }
97409c6f1ddSLingrui98      })
97509c6f1ddSLingrui98    }
97609c6f1ddSLingrui98  }
97709c6f1ddSLingrui98
97809c6f1ddSLingrui98  // only the valid bit is actually needed
979df5b4b8eSYinan Xu  io.toIfu.redirect.bits    := backendRedirect.bits
98009c6f1ddSLingrui98  io.toIfu.redirect.valid   := stage2Flush
98109c6f1ddSLingrui98
98209c6f1ddSLingrui98  // commit
9839aca92b9SYinan Xu  for (c <- io.fromBackend.rob_commits) {
98409c6f1ddSLingrui98    when(c.valid) {
98509c6f1ddSLingrui98      commitStateQueue(c.bits.ftqIdx.value)(c.bits.ftqOffset) := c_commited
98688825c5cSYinan Xu      // TODO: remove this
98788825c5cSYinan Xu      // For instruction fusions, we also update the next instruction
988c3abb8b6SYinan Xu      when (c.bits.commitType === 4.U) {
98988825c5cSYinan Xu        commitStateQueue(c.bits.ftqIdx.value)(c.bits.ftqOffset + 1.U) := c_commited
990c3abb8b6SYinan Xu      }.elsewhen(c.bits.commitType === 5.U) {
99188825c5cSYinan Xu        commitStateQueue(c.bits.ftqIdx.value)(c.bits.ftqOffset + 2.U) := c_commited
992c3abb8b6SYinan Xu      }.elsewhen(c.bits.commitType === 6.U) {
99388825c5cSYinan Xu        val index = (c.bits.ftqIdx + 1.U).value
99488825c5cSYinan Xu        commitStateQueue(index)(0) := c_commited
995c3abb8b6SYinan Xu      }.elsewhen(c.bits.commitType === 7.U) {
99688825c5cSYinan Xu        val index = (c.bits.ftqIdx + 1.U).value
99788825c5cSYinan Xu        commitStateQueue(index)(1) := c_commited
99888825c5cSYinan Xu      }
99909c6f1ddSLingrui98    }
100009c6f1ddSLingrui98  }
100109c6f1ddSLingrui98
100209c6f1ddSLingrui98  // ****************************************************************
100309c6f1ddSLingrui98  // **************************** to bpu ****************************
100409c6f1ddSLingrui98  // ****************************************************************
100509c6f1ddSLingrui98
100609c6f1ddSLingrui98  io.toBpu.redirect <> Mux(fromBackendRedirect.valid, fromBackendRedirect, ifuRedirectToBpu)
100709c6f1ddSLingrui98
100802f21c16SLingrui98  val may_have_stall_from_bpu = Wire(Bool())
100902f21c16SLingrui98  val bpu_ftb_update_stall = RegInit(0.U(2.W)) // 2-cycle stall, so we need 3 states
101002f21c16SLingrui98  may_have_stall_from_bpu := bpu_ftb_update_stall =/= 0.U
10115371700eSzoujr  val canCommit = commPtr =/= ifuWbPtr && !may_have_stall_from_bpu &&
101209c6f1ddSLingrui98    Cat(commitStateQueue(commPtr.value).map(s => {
101309c6f1ddSLingrui98      s === c_invalid || s === c_commited
101409c6f1ddSLingrui98    })).andR()
101509c6f1ddSLingrui98
101609c6f1ddSLingrui98  // commit reads
1017c5c5edaeSJenius  val commit_pc_bundle = RegNext(ftq_pc_mem.io.commPtr_rdata)
101881101dc4SLingrui98  val commit_target =
101934cf890eSLingrui98    Mux(RegNext(commPtr === newest_entry_ptr),
102034cf890eSLingrui98      RegNext(newest_entry_target),
102181101dc4SLingrui98      RegNext(ftq_pc_mem.io.commPtrPlus1_rdata.startAddr))
102209c6f1ddSLingrui98  ftq_pd_mem.io.raddr.last := commPtr.value
102309c6f1ddSLingrui98  val commit_pd = ftq_pd_mem.io.rdata.last
102409c6f1ddSLingrui98  ftq_redirect_sram.io.ren.last := canCommit
102509c6f1ddSLingrui98  ftq_redirect_sram.io.raddr.last := commPtr.value
102609c6f1ddSLingrui98  val commit_spec_meta = ftq_redirect_sram.io.rdata.last
102709c6f1ddSLingrui98  ftq_meta_1r_sram.io.ren(0) := canCommit
102809c6f1ddSLingrui98  ftq_meta_1r_sram.io.raddr(0) := commPtr.value
102909c6f1ddSLingrui98  val commit_meta = ftq_meta_1r_sram.io.rdata(0)
103009c6f1ddSLingrui98  ftb_entry_mem.io.raddr.last := commPtr.value
103109c6f1ddSLingrui98  val commit_ftb_entry = ftb_entry_mem.io.rdata.last
103209c6f1ddSLingrui98
103309c6f1ddSLingrui98  // need one cycle to read mem and srams
103409c6f1ddSLingrui98  val do_commit_ptr = RegNext(commPtr)
10355371700eSzoujr  val do_commit = RegNext(canCommit, init=false.B)
10366bf9b30dSLingrui98  when (canCommit) {
10376bf9b30dSLingrui98    commPtr_write := commPtrPlus1
10386bf9b30dSLingrui98    commPtrPlus1_write := commPtrPlus1 + 1.U
10396bf9b30dSLingrui98  }
104009c6f1ddSLingrui98  val commit_state = RegNext(commitStateQueue(commPtr.value))
10415371700eSzoujr  val can_commit_cfi = WireInit(cfiIndex_vec(commPtr.value))
10425371700eSzoujr  when (commitStateQueue(commPtr.value)(can_commit_cfi.bits) =/= c_commited) {
10435371700eSzoujr    can_commit_cfi.valid := false.B
104409c6f1ddSLingrui98  }
10455371700eSzoujr  val commit_cfi = RegNext(can_commit_cfi)
104609c6f1ddSLingrui98
104709c6f1ddSLingrui98  val commit_mispredict = VecInit((RegNext(mispredict_vec(commPtr.value)) zip commit_state).map {
104809c6f1ddSLingrui98    case (mis, state) => mis && state === c_commited
104909c6f1ddSLingrui98  })
10505371700eSzoujr  val can_commit_hit = entry_hit_status(commPtr.value)
10515371700eSzoujr  val commit_hit = RegNext(can_commit_hit)
10525fa3df0dSLingrui98  val diff_commit_target = RegNext(update_target(commPtr.value)) // TODO: remove this
1053edc18578SLingrui98  val commit_stage = RegNext(pred_stage(commPtr.value))
105409c6f1ddSLingrui98  val commit_valid = commit_hit === h_hit || commit_cfi.valid // hit or taken
105509c6f1ddSLingrui98
10565371700eSzoujr  val to_bpu_hit = can_commit_hit === h_hit || can_commit_hit === h_false_hit
105702f21c16SLingrui98  switch (bpu_ftb_update_stall) {
105802f21c16SLingrui98    is (0.U) {
105902f21c16SLingrui98      when (can_commit_cfi.valid && !to_bpu_hit && canCommit) {
106002f21c16SLingrui98        bpu_ftb_update_stall := 2.U // 2-cycle stall
106102f21c16SLingrui98      }
106202f21c16SLingrui98    }
106302f21c16SLingrui98    is (2.U) {
106402f21c16SLingrui98      bpu_ftb_update_stall := 1.U
106502f21c16SLingrui98    }
106602f21c16SLingrui98    is (1.U) {
106702f21c16SLingrui98      bpu_ftb_update_stall := 0.U
106802f21c16SLingrui98    }
106902f21c16SLingrui98    is (3.U) {
107002f21c16SLingrui98      XSError(true.B, "bpu_ftb_update_stall should be 0, 1 or 2")
107102f21c16SLingrui98    }
107202f21c16SLingrui98  }
107309c6f1ddSLingrui98
1074b0ed7239SLingrui98  // TODO: remove this
1075b0ed7239SLingrui98  XSError(do_commit && diff_commit_target =/= commit_target, "\ncommit target should be the same as update target\n")
1076b0ed7239SLingrui98
107709c6f1ddSLingrui98  io.toBpu.update := DontCare
107809c6f1ddSLingrui98  io.toBpu.update.valid := commit_valid && do_commit
107909c6f1ddSLingrui98  val update = io.toBpu.update.bits
108009c6f1ddSLingrui98  update.false_hit   := commit_hit === h_false_hit
108109c6f1ddSLingrui98  update.pc          := commit_pc_bundle.startAddr
108209c6f1ddSLingrui98  update.meta        := commit_meta.meta
1083803124a6SLingrui98  update.cfi_idx     := commit_cfi
10848ffcd86aSLingrui98  update.full_target := commit_target
1085edc18578SLingrui98  update.from_stage  := commit_stage
1086*c2d1ec7dSLingrui98  update.spec_info   := commit_spec_meta
108709c6f1ddSLingrui98
108809c6f1ddSLingrui98  val commit_real_hit = commit_hit === h_hit
108909c6f1ddSLingrui98  val update_ftb_entry = update.ftb_entry
109009c6f1ddSLingrui98
109109c6f1ddSLingrui98  val ftbEntryGen = Module(new FTBEntryGen).io
109209c6f1ddSLingrui98  ftbEntryGen.start_addr     := commit_pc_bundle.startAddr
109309c6f1ddSLingrui98  ftbEntryGen.old_entry      := commit_ftb_entry
109409c6f1ddSLingrui98  ftbEntryGen.pd             := commit_pd
109509c6f1ddSLingrui98  ftbEntryGen.cfiIndex       := commit_cfi
109609c6f1ddSLingrui98  ftbEntryGen.target         := commit_target
109709c6f1ddSLingrui98  ftbEntryGen.hit            := commit_real_hit
109809c6f1ddSLingrui98  ftbEntryGen.mispredict_vec := commit_mispredict
109909c6f1ddSLingrui98
110009c6f1ddSLingrui98  update_ftb_entry         := ftbEntryGen.new_entry
110109c6f1ddSLingrui98  update.new_br_insert_pos := ftbEntryGen.new_br_insert_pos
110209c6f1ddSLingrui98  update.mispred_mask      := ftbEntryGen.mispred_mask
110309c6f1ddSLingrui98  update.old_entry         := ftbEntryGen.is_old_entry
1104edc18578SLingrui98  update.pred_hit          := commit_hit === h_hit || commit_hit === h_false_hit
1105803124a6SLingrui98  update.br_taken_mask     := ftbEntryGen.taken_mask
1106803124a6SLingrui98  update.jmp_taken         := ftbEntryGen.jmp_taken
1107b37e4b45SLingrui98
1108803124a6SLingrui98  // update.is_minimal := false.B
1109803124a6SLingrui98  // update.full_pred.fromFtbEntry(ftbEntryGen.new_entry, update.pc)
1110803124a6SLingrui98  // update.full_pred.jalr_target := commit_target
1111803124a6SLingrui98  // update.full_pred.hit := true.B
1112803124a6SLingrui98  // when (update.full_pred.is_jalr) {
1113803124a6SLingrui98  //   update.full_pred.targets.last := commit_target
1114803124a6SLingrui98  // }
111509c6f1ddSLingrui98
1116e30430c2SJay  // ****************************************************************
1117e30430c2SJay  // *********************** to prefetch ****************************
1118e30430c2SJay  // ****************************************************************
1119e30430c2SJay
11209c8f16f2SJenius  ftq_pc_mem.io.other_raddrs(0) := DontCare
1121e30430c2SJay  if(cacheParams.hasPrefetch){
1122e30430c2SJay    val prefetchPtr = RegInit(FtqPtr(false.B, 0.U))
1123378f00d9SJenius    val diff_prefetch_addr = WireInit(update_target(prefetchPtr.value)) //TODO: remove this
1124378f00d9SJenius
1125e30430c2SJay    prefetchPtr := prefetchPtr + io.toPrefetch.req.fire()
1126e30430c2SJay
1127378f00d9SJenius    ftq_pc_mem.io.other_raddrs(0) := prefetchPtr.value
1128378f00d9SJenius
1129e30430c2SJay    when (bpu_s2_resp.valid && bpu_s2_resp.hasRedirect && !isBefore(prefetchPtr, bpu_s2_resp.ftq_idx)) {
1130e30430c2SJay      prefetchPtr := bpu_s2_resp.ftq_idx
1131e30430c2SJay    }
1132e30430c2SJay
1133cb4f77ceSLingrui98    when (bpu_s3_resp.valid && bpu_s3_resp.hasRedirect && !isBefore(prefetchPtr, bpu_s3_resp.ftq_idx)) {
1134cb4f77ceSLingrui98      prefetchPtr := bpu_s3_resp.ftq_idx
1135a3c55791SJinYue      // XSError(true.B, "\ns3_redirect mechanism not implemented!\n")
1136cb4f77ceSLingrui98    }
1137de7689fcSJay
1138f63797a4SLingrui98
1139f63797a4SLingrui98    val prefetch_is_to_send = WireInit(entry_fetch_status(prefetchPtr.value) === f_to_send)
1140f56177cbSJenius    val prefetch_addr = Wire(UInt(VAddrBits.W))
1141f63797a4SLingrui98
1142f63797a4SLingrui98    when (last_cycle_bpu_in && bpu_in_bypass_ptr === prefetchPtr) {
1143f63797a4SLingrui98      prefetch_is_to_send := true.B
11446bf9b30dSLingrui98      prefetch_addr := last_cycle_bpu_target
1145378f00d9SJenius      diff_prefetch_addr := last_cycle_bpu_target // TODO: remove this
1146f56177cbSJenius    }.otherwise{
1147f56177cbSJenius      prefetch_addr := RegNext( ftq_pc_mem.io.other_rdatas(0).startAddr)
1148f63797a4SLingrui98    }
1149f63797a4SLingrui98    io.toPrefetch.req.valid := prefetchPtr =/= bpuPtr && prefetch_is_to_send
1150f63797a4SLingrui98    io.toPrefetch.req.bits.target := prefetch_addr
1151de7689fcSJay
1152de7689fcSJay    when(redirectVec.map(r => r.valid).reduce(_||_)){
1153de7689fcSJay      val r = PriorityMux(redirectVec.map(r => (r.valid -> r.bits)))
1154de7689fcSJay      val next = r.ftqIdx + 1.U
1155de7689fcSJay      prefetchPtr := next
1156de7689fcSJay    }
1157de7689fcSJay
1158378f00d9SJenius    // TODO: remove this
115910f8eea3SLingrui98    // XSError(io.toPrefetch.req.valid && diff_prefetch_addr =/= prefetch_addr,
116010f8eea3SLingrui98    //         f"\nprefetch_req_target wrong! prefetchPtr: ${prefetchPtr}, prefetch_addr: ${Hexadecimal(prefetch_addr)} diff_prefetch_addr: ${Hexadecimal(diff_prefetch_addr)}\n")
1161378f00d9SJenius
1162378f00d9SJenius
1163de7689fcSJay    XSError(isBefore(bpuPtr, prefetchPtr) && !isFull(bpuPtr, prefetchPtr), "\nprefetchPtr is before bpuPtr!\n")
1164e8747464SJenius    XSError(isBefore(prefetchPtr, ifuPtr) && !isFull(ifuPtr, prefetchPtr), "\nifuPtr is before prefetchPtr!\n")
1165de7689fcSJay  }
1166de7689fcSJay  else {
1167de7689fcSJay    io.toPrefetch.req <> DontCare
1168de7689fcSJay  }
1169de7689fcSJay
117009c6f1ddSLingrui98  // ******************************************************************************
117109c6f1ddSLingrui98  // **************************** commit perf counters ****************************
117209c6f1ddSLingrui98  // ******************************************************************************
117309c6f1ddSLingrui98
117409c6f1ddSLingrui98  val commit_inst_mask    = VecInit(commit_state.map(c => c === c_commited && do_commit)).asUInt
117509c6f1ddSLingrui98  val commit_mispred_mask = commit_mispredict.asUInt
117609c6f1ddSLingrui98  val commit_not_mispred_mask = ~commit_mispred_mask
117709c6f1ddSLingrui98
117809c6f1ddSLingrui98  val commit_br_mask = commit_pd.brMask.asUInt
117909c6f1ddSLingrui98  val commit_jmp_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.jmpInfo.valid.asTypeOf(UInt(1.W)))
118009c6f1ddSLingrui98  val commit_cfi_mask = (commit_br_mask | commit_jmp_mask)
118109c6f1ddSLingrui98
118209c6f1ddSLingrui98  val mbpInstrs = commit_inst_mask & commit_cfi_mask
118309c6f1ddSLingrui98
118409c6f1ddSLingrui98  val mbpRights = mbpInstrs & commit_not_mispred_mask
118509c6f1ddSLingrui98  val mbpWrongs = mbpInstrs & commit_mispred_mask
118609c6f1ddSLingrui98
118709c6f1ddSLingrui98  io.bpuInfo.bpRight := PopCount(mbpRights)
118809c6f1ddSLingrui98  io.bpuInfo.bpWrong := PopCount(mbpWrongs)
118909c6f1ddSLingrui98
119009c6f1ddSLingrui98  // Cfi Info
119109c6f1ddSLingrui98  for (i <- 0 until PredictWidth) {
119209c6f1ddSLingrui98    val pc = commit_pc_bundle.startAddr + (i * instBytes).U
119309c6f1ddSLingrui98    val v = commit_state(i) === c_commited
119409c6f1ddSLingrui98    val isBr = commit_pd.brMask(i)
119509c6f1ddSLingrui98    val isJmp = commit_pd.jmpInfo.valid && commit_pd.jmpOffset === i.U
119609c6f1ddSLingrui98    val isCfi = isBr || isJmp
119709c6f1ddSLingrui98    val isTaken = commit_cfi.valid && commit_cfi.bits === i.U
119809c6f1ddSLingrui98    val misPred = commit_mispredict(i)
1199c2ad24ebSLingrui98    // val ghist = commit_spec_meta.ghist.predHist
1200c2ad24ebSLingrui98    val histPtr = commit_spec_meta.histPtr
120109c6f1ddSLingrui98    val predCycle = commit_meta.meta(63, 0)
120209c6f1ddSLingrui98    val target = commit_target
120309c6f1ddSLingrui98
120409c6f1ddSLingrui98    val brIdx = OHToUInt(Reverse(Cat(update_ftb_entry.brValids.zip(update_ftb_entry.brOffset).map{case(v, offset) => v && offset === i.U})))
120509c6f1ddSLingrui98    val inFtbEntry = update_ftb_entry.brValids.zip(update_ftb_entry.brOffset).map{case(v, offset) => v && offset === i.U}.reduce(_||_)
120609c6f1ddSLingrui98    val addIntoHist = ((commit_hit === h_hit) && inFtbEntry) || ((!(commit_hit === h_hit) && i.U === commit_cfi.bits && isBr && commit_cfi.valid))
120709c6f1ddSLingrui98    XSDebug(v && do_commit && isCfi, p"cfi_update: isBr(${isBr}) pc(${Hexadecimal(pc)}) " +
1208c2ad24ebSLingrui98    p"taken(${isTaken}) mispred(${misPred}) cycle($predCycle) hist(${histPtr.value}) " +
120909c6f1ddSLingrui98    p"startAddr(${Hexadecimal(commit_pc_bundle.startAddr)}) AddIntoHist(${addIntoHist}) " +
121009c6f1ddSLingrui98    p"brInEntry(${inFtbEntry}) brIdx(${brIdx}) target(${Hexadecimal(target)})\n")
121109c6f1ddSLingrui98  }
121209c6f1ddSLingrui98
121309c6f1ddSLingrui98  val enq = io.fromBpu.resp
12142e1be6e1SSteve Gou  val perf_redirect = backendRedirect
121509c6f1ddSLingrui98
121609c6f1ddSLingrui98  XSPerfAccumulate("entry", validEntries)
121709c6f1ddSLingrui98  XSPerfAccumulate("bpu_to_ftq_stall", enq.valid && !enq.ready)
121809c6f1ddSLingrui98  XSPerfAccumulate("mispredictRedirect", perf_redirect.valid && RedirectLevel.flushAfter === perf_redirect.bits.level)
121909c6f1ddSLingrui98  XSPerfAccumulate("replayRedirect", perf_redirect.valid && RedirectLevel.flushItself(perf_redirect.bits.level))
122009c6f1ddSLingrui98  XSPerfAccumulate("predecodeRedirect", fromIfuRedirect.valid)
122109c6f1ddSLingrui98
122209c6f1ddSLingrui98  XSPerfAccumulate("to_ifu_bubble", io.toIfu.req.ready && !io.toIfu.req.valid)
122309c6f1ddSLingrui98
122409c6f1ddSLingrui98  XSPerfAccumulate("to_ifu_stall", io.toIfu.req.valid && !io.toIfu.req.ready)
122509c6f1ddSLingrui98  XSPerfAccumulate("from_bpu_real_bubble", !enq.valid && enq.ready && allowBpuIn)
122612cedb6fSLingrui98  XSPerfAccumulate("bpu_to_ifu_bubble", bpuPtr === ifuPtr)
122709c6f1ddSLingrui98
122809c6f1ddSLingrui98  val from_bpu = io.fromBpu.resp.bits
1229*c2d1ec7dSLingrui98  def in_entry_len_map_gen(resp: BpuToFtqBundle)(stage: String) = {
1230*c2d1ec7dSLingrui98    val entry_len = (resp.last_stage_ftb_entry.getFallThrough(resp.s3.pc) - resp.s3.pc) >> instOffsetBits
123109c6f1ddSLingrui98    val entry_len_recording_vec = (1 to PredictWidth+1).map(i => entry_len === i.U)
123209c6f1ddSLingrui98    val entry_len_map = (1 to PredictWidth+1).map(i =>
1233*c2d1ec7dSLingrui98      f"${stage}_ftb_entry_len_$i" -> (entry_len_recording_vec(i-1) && resp.s3.valid)
123409c6f1ddSLingrui98    ).foldLeft(Map[String, UInt]())(_+_)
123509c6f1ddSLingrui98    entry_len_map
123609c6f1ddSLingrui98  }
1237*c2d1ec7dSLingrui98  val s3_entry_len_map = in_entry_len_map_gen(from_bpu)("s3")
123809c6f1ddSLingrui98
123909c6f1ddSLingrui98  val to_ifu = io.toIfu.req.bits
124009c6f1ddSLingrui98
124109c6f1ddSLingrui98
124209c6f1ddSLingrui98
124309c6f1ddSLingrui98  val commit_num_inst_recording_vec = (1 to PredictWidth).map(i => PopCount(commit_inst_mask) === i.U)
124409c6f1ddSLingrui98  val commit_num_inst_map = (1 to PredictWidth).map(i =>
124509c6f1ddSLingrui98    f"commit_num_inst_$i" -> (commit_num_inst_recording_vec(i-1) && do_commit)
124609c6f1ddSLingrui98  ).foldLeft(Map[String, UInt]())(_+_)
124709c6f1ddSLingrui98
124809c6f1ddSLingrui98
124909c6f1ddSLingrui98
125009c6f1ddSLingrui98  val commit_jal_mask  = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasJal.asTypeOf(UInt(1.W)))
125109c6f1ddSLingrui98  val commit_jalr_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasJalr.asTypeOf(UInt(1.W)))
125209c6f1ddSLingrui98  val commit_call_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasCall.asTypeOf(UInt(1.W)))
125309c6f1ddSLingrui98  val commit_ret_mask  = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasRet.asTypeOf(UInt(1.W)))
125409c6f1ddSLingrui98
125509c6f1ddSLingrui98
125609c6f1ddSLingrui98  val mbpBRights = mbpRights & commit_br_mask
125709c6f1ddSLingrui98  val mbpJRights = mbpRights & commit_jal_mask
125809c6f1ddSLingrui98  val mbpIRights = mbpRights & commit_jalr_mask
125909c6f1ddSLingrui98  val mbpCRights = mbpRights & commit_call_mask
126009c6f1ddSLingrui98  val mbpRRights = mbpRights & commit_ret_mask
126109c6f1ddSLingrui98
126209c6f1ddSLingrui98  val mbpBWrongs = mbpWrongs & commit_br_mask
126309c6f1ddSLingrui98  val mbpJWrongs = mbpWrongs & commit_jal_mask
126409c6f1ddSLingrui98  val mbpIWrongs = mbpWrongs & commit_jalr_mask
126509c6f1ddSLingrui98  val mbpCWrongs = mbpWrongs & commit_call_mask
126609c6f1ddSLingrui98  val mbpRWrongs = mbpWrongs & commit_ret_mask
126709c6f1ddSLingrui98
12681d7e5011SLingrui98  val commit_pred_stage = RegNext(pred_stage(commPtr.value))
12691d7e5011SLingrui98
12701d7e5011SLingrui98  def pred_stage_map(src: UInt, name: String) = {
12711d7e5011SLingrui98    (0 until numBpStages).map(i =>
12721d7e5011SLingrui98      f"${name}_stage_${i+1}" -> PopCount(src.asBools.map(_ && commit_pred_stage === BP_STAGES(i)))
12731d7e5011SLingrui98    ).foldLeft(Map[String, UInt]())(_+_)
12741d7e5011SLingrui98  }
12751d7e5011SLingrui98
12761d7e5011SLingrui98  val mispred_stage_map      = pred_stage_map(mbpWrongs,  "mispredict")
12771d7e5011SLingrui98  val br_mispred_stage_map   = pred_stage_map(mbpBWrongs, "br_mispredict")
12781d7e5011SLingrui98  val jalr_mispred_stage_map = pred_stage_map(mbpIWrongs, "jalr_mispredict")
12791d7e5011SLingrui98  val correct_stage_map      = pred_stage_map(mbpRights,  "correct")
12801d7e5011SLingrui98  val br_correct_stage_map   = pred_stage_map(mbpBRights, "br_correct")
12811d7e5011SLingrui98  val jalr_correct_stage_map = pred_stage_map(mbpIRights, "jalr_correct")
12821d7e5011SLingrui98
128309c6f1ddSLingrui98  val update_valid = io.toBpu.update.valid
128409c6f1ddSLingrui98  def u(cond: Bool) = update_valid && cond
128509c6f1ddSLingrui98  val ftb_false_hit = u(update.false_hit)
128665fddcf0Szoujr  // assert(!ftb_false_hit)
128709c6f1ddSLingrui98  val ftb_hit = u(commit_hit === h_hit)
128809c6f1ddSLingrui98
128909c6f1ddSLingrui98  val ftb_new_entry = u(ftbEntryGen.is_init_entry)
1290b37e4b45SLingrui98  val ftb_new_entry_only_br = ftb_new_entry && !update_ftb_entry.jmpValid
1291b37e4b45SLingrui98  val ftb_new_entry_only_jmp = ftb_new_entry && !update_ftb_entry.brValids(0)
1292b37e4b45SLingrui98  val ftb_new_entry_has_br_and_jmp = ftb_new_entry && update_ftb_entry.brValids(0) && update_ftb_entry.jmpValid
129309c6f1ddSLingrui98
129409c6f1ddSLingrui98  val ftb_old_entry = u(ftbEntryGen.is_old_entry)
129509c6f1ddSLingrui98
129609c6f1ddSLingrui98  val ftb_modified_entry = u(ftbEntryGen.is_new_br || ftbEntryGen.is_jalr_target_modified || ftbEntryGen.is_always_taken_modified)
129709c6f1ddSLingrui98  val ftb_modified_entry_new_br = u(ftbEntryGen.is_new_br)
129809c6f1ddSLingrui98  val ftb_modified_entry_jalr_target_modified = u(ftbEntryGen.is_jalr_target_modified)
129909c6f1ddSLingrui98  val ftb_modified_entry_br_full = ftb_modified_entry && ftbEntryGen.is_br_full
130009c6f1ddSLingrui98  val ftb_modified_entry_always_taken = ftb_modified_entry && ftbEntryGen.is_always_taken_modified
130109c6f1ddSLingrui98
130209c6f1ddSLingrui98  val ftb_entry_len = (ftbEntryGen.new_entry.getFallThrough(update.pc) - update.pc) >> instOffsetBits
130309c6f1ddSLingrui98  val ftb_entry_len_recording_vec = (1 to PredictWidth+1).map(i => ftb_entry_len === i.U)
130409c6f1ddSLingrui98  val ftb_init_entry_len_map = (1 to PredictWidth+1).map(i =>
130509c6f1ddSLingrui98    f"ftb_init_entry_len_$i" -> (ftb_entry_len_recording_vec(i-1) && ftb_new_entry)
130609c6f1ddSLingrui98  ).foldLeft(Map[String, UInt]())(_+_)
130709c6f1ddSLingrui98  val ftb_modified_entry_len_map = (1 to PredictWidth+1).map(i =>
130809c6f1ddSLingrui98    f"ftb_modified_entry_len_$i" -> (ftb_entry_len_recording_vec(i-1) && ftb_modified_entry)
130909c6f1ddSLingrui98  ).foldLeft(Map[String, UInt]())(_+_)
131009c6f1ddSLingrui98
131109c6f1ddSLingrui98  val ftq_occupancy_map = (0 to FtqSize).map(i =>
131209c6f1ddSLingrui98    f"ftq_has_entry_$i" ->( validEntries === i.U)
131309c6f1ddSLingrui98  ).foldLeft(Map[String, UInt]())(_+_)
131409c6f1ddSLingrui98
131509c6f1ddSLingrui98  val perfCountsMap = Map(
131609c6f1ddSLingrui98    "BpInstr" -> PopCount(mbpInstrs),
131709c6f1ddSLingrui98    "BpBInstr" -> PopCount(mbpBRights | mbpBWrongs),
131809c6f1ddSLingrui98    "BpRight"  -> PopCount(mbpRights),
131909c6f1ddSLingrui98    "BpWrong"  -> PopCount(mbpWrongs),
132009c6f1ddSLingrui98    "BpBRight" -> PopCount(mbpBRights),
132109c6f1ddSLingrui98    "BpBWrong" -> PopCount(mbpBWrongs),
132209c6f1ddSLingrui98    "BpJRight" -> PopCount(mbpJRights),
132309c6f1ddSLingrui98    "BpJWrong" -> PopCount(mbpJWrongs),
132409c6f1ddSLingrui98    "BpIRight" -> PopCount(mbpIRights),
132509c6f1ddSLingrui98    "BpIWrong" -> PopCount(mbpIWrongs),
132609c6f1ddSLingrui98    "BpCRight" -> PopCount(mbpCRights),
132709c6f1ddSLingrui98    "BpCWrong" -> PopCount(mbpCWrongs),
132809c6f1ddSLingrui98    "BpRRight" -> PopCount(mbpRRights),
132909c6f1ddSLingrui98    "BpRWrong" -> PopCount(mbpRWrongs),
133009c6f1ddSLingrui98
133109c6f1ddSLingrui98    "ftb_false_hit"                -> PopCount(ftb_false_hit),
133209c6f1ddSLingrui98    "ftb_hit"                      -> PopCount(ftb_hit),
133309c6f1ddSLingrui98    "ftb_new_entry"                -> PopCount(ftb_new_entry),
133409c6f1ddSLingrui98    "ftb_new_entry_only_br"        -> PopCount(ftb_new_entry_only_br),
133509c6f1ddSLingrui98    "ftb_new_entry_only_jmp"       -> PopCount(ftb_new_entry_only_jmp),
133609c6f1ddSLingrui98    "ftb_new_entry_has_br_and_jmp" -> PopCount(ftb_new_entry_has_br_and_jmp),
133709c6f1ddSLingrui98    "ftb_old_entry"                -> PopCount(ftb_old_entry),
133809c6f1ddSLingrui98    "ftb_modified_entry"           -> PopCount(ftb_modified_entry),
133909c6f1ddSLingrui98    "ftb_modified_entry_new_br"    -> PopCount(ftb_modified_entry_new_br),
134009c6f1ddSLingrui98    "ftb_jalr_target_modified"     -> PopCount(ftb_modified_entry_jalr_target_modified),
134109c6f1ddSLingrui98    "ftb_modified_entry_br_full"   -> PopCount(ftb_modified_entry_br_full),
134209c6f1ddSLingrui98    "ftb_modified_entry_always_taken" -> PopCount(ftb_modified_entry_always_taken)
1343*c2d1ec7dSLingrui98  ) ++ ftb_init_entry_len_map ++ ftb_modified_entry_len_map ++
1344cb4f77ceSLingrui98  s3_entry_len_map ++ commit_num_inst_map ++ ftq_occupancy_map ++
13451d7e5011SLingrui98  mispred_stage_map ++ br_mispred_stage_map ++ jalr_mispred_stage_map ++
13461d7e5011SLingrui98  correct_stage_map ++ br_correct_stage_map ++ jalr_correct_stage_map
134709c6f1ddSLingrui98
134809c6f1ddSLingrui98  for((key, value) <- perfCountsMap) {
134909c6f1ddSLingrui98    XSPerfAccumulate(key, value)
135009c6f1ddSLingrui98  }
135109c6f1ddSLingrui98
135209c6f1ddSLingrui98  // --------------------------- Debug --------------------------------
135309c6f1ddSLingrui98  // XSDebug(enq_fire, p"enq! " + io.fromBpu.resp.bits.toPrintable)
135409c6f1ddSLingrui98  XSDebug(io.toIfu.req.fire, p"fire to ifu " + io.toIfu.req.bits.toPrintable)
135509c6f1ddSLingrui98  XSDebug(do_commit, p"deq! [ptr] $do_commit_ptr\n")
135609c6f1ddSLingrui98  XSDebug(true.B, p"[bpuPtr] $bpuPtr, [ifuPtr] $ifuPtr, [ifuWbPtr] $ifuWbPtr [commPtr] $commPtr\n")
135709c6f1ddSLingrui98  XSDebug(true.B, p"[in] v:${io.fromBpu.resp.valid} r:${io.fromBpu.resp.ready} " +
135809c6f1ddSLingrui98    p"[out] v:${io.toIfu.req.valid} r:${io.toIfu.req.ready}\n")
135909c6f1ddSLingrui98  XSDebug(do_commit, p"[deq info] cfiIndex: $commit_cfi, $commit_pc_bundle, target: ${Hexadecimal(commit_target)}\n")
136009c6f1ddSLingrui98
136109c6f1ddSLingrui98  //   def ubtbCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
136209c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
136309c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
136409c6f1ddSLingrui98  //       Mux(valid && pd.isBr,
136509c6f1ddSLingrui98  //         isWrong ^ Mux(ans.hit.asBool,
136609c6f1ddSLingrui98  //           Mux(ans.taken.asBool, taken && ans.target === commitEntry.target,
136709c6f1ddSLingrui98  //           !taken),
136809c6f1ddSLingrui98  //         !taken),
136909c6f1ddSLingrui98  //       false.B)
137009c6f1ddSLingrui98  //     }
137109c6f1ddSLingrui98  //   }
137209c6f1ddSLingrui98
137309c6f1ddSLingrui98  //   def btbCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
137409c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
137509c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
137609c6f1ddSLingrui98  //       Mux(valid && pd.isBr,
137709c6f1ddSLingrui98  //         isWrong ^ Mux(ans.hit.asBool,
137809c6f1ddSLingrui98  //           Mux(ans.taken.asBool, taken && ans.target === commitEntry.target,
137909c6f1ddSLingrui98  //           !taken),
138009c6f1ddSLingrui98  //         !taken),
138109c6f1ddSLingrui98  //       false.B)
138209c6f1ddSLingrui98  //     }
138309c6f1ddSLingrui98  //   }
138409c6f1ddSLingrui98
138509c6f1ddSLingrui98  //   def tageCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
138609c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
138709c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
138809c6f1ddSLingrui98  //       Mux(valid && pd.isBr,
138909c6f1ddSLingrui98  //         isWrong ^ (ans.taken.asBool === taken),
139009c6f1ddSLingrui98  //       false.B)
139109c6f1ddSLingrui98  //     }
139209c6f1ddSLingrui98  //   }
139309c6f1ddSLingrui98
139409c6f1ddSLingrui98  //   def loopCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
139509c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
139609c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
139709c6f1ddSLingrui98  //       Mux(valid && (pd.isBr) && ans.hit.asBool,
139809c6f1ddSLingrui98  //         isWrong ^ (!taken),
139909c6f1ddSLingrui98  //           false.B)
140009c6f1ddSLingrui98  //     }
140109c6f1ddSLingrui98  //   }
140209c6f1ddSLingrui98
140309c6f1ddSLingrui98  //   def rasCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
140409c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
140509c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
140609c6f1ddSLingrui98  //       Mux(valid && pd.isRet.asBool /*&& taken*/ && ans.hit.asBool,
140709c6f1ddSLingrui98  //         isWrong ^ (ans.target === commitEntry.target),
140809c6f1ddSLingrui98  //           false.B)
140909c6f1ddSLingrui98  //     }
141009c6f1ddSLingrui98  //   }
141109c6f1ddSLingrui98
141209c6f1ddSLingrui98  //   val ubtbRights = ubtbCheck(commitEntry, commitEntry.metas.map(_.ubtbAns), false.B)
141309c6f1ddSLingrui98  //   val ubtbWrongs = ubtbCheck(commitEntry, commitEntry.metas.map(_.ubtbAns), true.B)
141409c6f1ddSLingrui98  //   // btb and ubtb pred jal and jalr as well
141509c6f1ddSLingrui98  //   val btbRights = btbCheck(commitEntry, commitEntry.metas.map(_.btbAns), false.B)
141609c6f1ddSLingrui98  //   val btbWrongs = btbCheck(commitEntry, commitEntry.metas.map(_.btbAns), true.B)
141709c6f1ddSLingrui98  //   val tageRights = tageCheck(commitEntry, commitEntry.metas.map(_.tageAns), false.B)
141809c6f1ddSLingrui98  //   val tageWrongs = tageCheck(commitEntry, commitEntry.metas.map(_.tageAns), true.B)
141909c6f1ddSLingrui98
142009c6f1ddSLingrui98  //   val loopRights = loopCheck(commitEntry, commitEntry.metas.map(_.loopAns), false.B)
142109c6f1ddSLingrui98  //   val loopWrongs = loopCheck(commitEntry, commitEntry.metas.map(_.loopAns), true.B)
142209c6f1ddSLingrui98
142309c6f1ddSLingrui98  //   val rasRights = rasCheck(commitEntry, commitEntry.metas.map(_.rasAns), false.B)
142409c6f1ddSLingrui98  //   val rasWrongs = rasCheck(commitEntry, commitEntry.metas.map(_.rasAns), true.B)
14251ca0e4f3SYinan Xu
1426cd365d4cSrvcoresjw  val perfEvents = Seq(
1427cd365d4cSrvcoresjw    ("bpu_s2_redirect        ", bpu_s2_redirect                                                             ),
1428cb4f77ceSLingrui98    ("bpu_s3_redirect        ", bpu_s3_redirect                                                             ),
1429cd365d4cSrvcoresjw    ("bpu_to_ftq_stall       ", enq.valid && ~enq.ready                                                     ),
1430cd365d4cSrvcoresjw    ("mispredictRedirect     ", perf_redirect.valid && RedirectLevel.flushAfter === perf_redirect.bits.level),
1431cd365d4cSrvcoresjw    ("replayRedirect         ", perf_redirect.valid && RedirectLevel.flushItself(perf_redirect.bits.level)  ),
1432cd365d4cSrvcoresjw    ("predecodeRedirect      ", fromIfuRedirect.valid                                                       ),
1433cd365d4cSrvcoresjw    ("to_ifu_bubble          ", io.toIfu.req.ready && !io.toIfu.req.valid                                   ),
1434cd365d4cSrvcoresjw    ("from_bpu_real_bubble   ", !enq.valid && enq.ready && allowBpuIn                                       ),
1435cd365d4cSrvcoresjw    ("BpInstr                ", PopCount(mbpInstrs)                                                         ),
1436cd365d4cSrvcoresjw    ("BpBInstr               ", PopCount(mbpBRights | mbpBWrongs)                                           ),
1437cd365d4cSrvcoresjw    ("BpRight                ", PopCount(mbpRights)                                                         ),
1438cd365d4cSrvcoresjw    ("BpWrong                ", PopCount(mbpWrongs)                                                         ),
1439cd365d4cSrvcoresjw    ("BpBRight               ", PopCount(mbpBRights)                                                        ),
1440cd365d4cSrvcoresjw    ("BpBWrong               ", PopCount(mbpBWrongs)                                                        ),
1441cd365d4cSrvcoresjw    ("BpJRight               ", PopCount(mbpJRights)                                                        ),
1442cd365d4cSrvcoresjw    ("BpJWrong               ", PopCount(mbpJWrongs)                                                        ),
1443cd365d4cSrvcoresjw    ("BpIRight               ", PopCount(mbpIRights)                                                        ),
1444cd365d4cSrvcoresjw    ("BpIWrong               ", PopCount(mbpIWrongs)                                                        ),
1445cd365d4cSrvcoresjw    ("BpCRight               ", PopCount(mbpCRights)                                                        ),
1446cd365d4cSrvcoresjw    ("BpCWrong               ", PopCount(mbpCWrongs)                                                        ),
1447cd365d4cSrvcoresjw    ("BpRRight               ", PopCount(mbpRRights)                                                        ),
1448cd365d4cSrvcoresjw    ("BpRWrong               ", PopCount(mbpRWrongs)                                                        ),
1449cd365d4cSrvcoresjw    ("ftb_false_hit          ", PopCount(ftb_false_hit)                                                     ),
1450cd365d4cSrvcoresjw    ("ftb_hit                ", PopCount(ftb_hit)                                                           ),
1451cd365d4cSrvcoresjw  )
14521ca0e4f3SYinan Xu  generatePerfEvent()
145309c6f1ddSLingrui98}