xref: /XiangShan/src/main/scala/xiangshan/frontend/NewFtq.scala (revision f9c51548eadf004cb854b28a254a32dbaf5fc508)
109c6f1ddSLingrui98/***************************************************************************************
209c6f1ddSLingrui98* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
309c6f1ddSLingrui98* Copyright (c) 2020-2021 Peng Cheng Laboratory
409c6f1ddSLingrui98*
509c6f1ddSLingrui98* XiangShan is licensed under Mulan PSL v2.
609c6f1ddSLingrui98* You can use this software according to the terms and conditions of the Mulan PSL v2.
709c6f1ddSLingrui98* You may obtain a copy of Mulan PSL v2 at:
809c6f1ddSLingrui98*          http://license.coscl.org.cn/MulanPSL2
909c6f1ddSLingrui98*
1009c6f1ddSLingrui98* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
1109c6f1ddSLingrui98* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
1209c6f1ddSLingrui98* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
1309c6f1ddSLingrui98*
1409c6f1ddSLingrui98* See the Mulan PSL v2 for more details.
1509c6f1ddSLingrui98***************************************************************************************/
1609c6f1ddSLingrui98
1709c6f1ddSLingrui98package xiangshan.frontend
1809c6f1ddSLingrui98
198891a219SYinan Xuimport org.chipsalliance.cde.config.Parameters
2009c6f1ddSLingrui98import chisel3._
2109c6f1ddSLingrui98import chisel3.util._
221ca0e4f3SYinan Xuimport utils._
233c02ee8fSwakafaimport utility._
2409c6f1ddSLingrui98import xiangshan._
25e30430c2SJayimport xiangshan.frontend.icache._
261ca0e4f3SYinan Xuimport xiangshan.backend.CtrlToFtqIO
272e1be6e1SSteve Gouimport xiangshan.backend.decode.ImmUnion
283c02ee8fSwakafaimport utility.ChiselDB
2951532d8bSGuokai Chen
/** Flat debug record made only of plain fields; it carries no logic of its own.
  *
  * The declaration order is the same as before, so the packed layout is unchanged.
  */
class FtqDebugBundle extends Bundle {
  // both address-like fields are fixed at 39 bits
  val pc, target = UInt(39.W)
  // single-bit flags
  val isBr, isJmp, isCall, isRet, misPred, isTaken = Bool()
  // 2-bit stage tag
  val predStage = UInt(2.W)
}
4109c6f1ddSLingrui98
/** Circular-queue pointer whose number of entries is read from
  * `XSCoreParamsKey.FtqSize` in the implicit parameters.
  */
class FtqPtr(implicit p: Parameters)
  extends CircularQueuePtr[FtqPtr](params => params(XSCoreParamsKey).FtqSize)
4609c6f1ddSLingrui98
/** Helpers that build [[FtqPtr]] hardware values. */
object FtqPtr {

  /** Creates a wire of type `FtqPtr` and drives it.
    *
    * @param f value connected to the pointer's `flag`
    * @param v value connected to the pointer's `value`
    * @return the newly created wire
    */
  def apply(f: Bool, v: UInt)(implicit p: Parameters): FtqPtr = {
    val ptr = Wire(new FtqPtr)
    ptr.value := v
    ptr.flag  := f
    ptr
  }

  /** Returns a pointer with the same `value` as `ptr` and the inverted `flag`. */
  def inverse(ptr: FtqPtr)(implicit p: Parameters): FtqPtr =
    FtqPtr(!ptr.flag, ptr.value)
}
5809c6f1ddSLingrui98
/** Storage with `numRead` read ports and one write port, built from `numRead`
  * `SRAMTemplate` instances of `FtqSize` entries each.
  *
  * Every instance receives the same write request; read port `i` is served by
  * instance `i` only.
  *
  * @param gen     type of one stored entry
  * @param numRead number of read ports (one SRAM instance per port)
  */
class FtqNRSRAM[T <: Data](gen: T, numRead: Int)(implicit p: Parameters) extends XSModule {

  val io = IO(new Bundle {
    val raddr = Input(Vec(numRead, UInt(log2Up(FtqSize).W)))
    val ren   = Input(Vec(numRead, Bool()))
    val rdata = Output(Vec(numRead, gen))
    val waddr = Input(UInt(log2Up(FtqSize).W))
    val wen   = Input(Bool())
    val wdata = Input(gen)
  })

  (0 until numRead).foreach { port =>
    val sram = Module(new SRAMTemplate(gen, FtqSize))

    // the single write request is replicated to every copy
    sram.io.w.req.valid       := io.wen
    sram.io.w.req.bits.setIdx := io.waddr
    sram.io.w.req.bits.data   := VecInit(io.wdata)

    // this copy's private read port
    sram.io.r.req.valid       := io.ren(port)
    sram.io.r.req.bits.setIdx := io.raddr(port)
    io.rdata(port)            := sram.io.r.resp.data(0)
  }

}
8109c6f1ddSLingrui98
/** Address information stored for one FTQ entry.
  *
  * `startAddr` is the address the entry starts at and `nextLineAddr` is
  * `startAddr` plus a fixed byte distance (see `fromBranchPrediction`).
  * `isNextMask(i)` records whether adding `i` to the start slot index carries
  * out of `log2Ceil(PredictWidth)` bits; `getPc` uses it to decide which of the
  * two addresses supplies the upper PC bits.
  */
class Ftq_RF_Components(implicit p: Parameters) extends XSBundle with BPUUtils {
  val startAddr = UInt(VAddrBits.W)
  val nextLineAddr = UInt(VAddrBits.W)
  val isNextMask = Vec(PredictWidth, Bool())
  val fallThruError = Bool()

  /** Rebuilds the PC of slot `offset` within this entry.
    *
    * @param offset slot index relative to `startAddr`
    * @return upper bits (from `nextLineAddr` or `startAddr`), followed by the
    *         start slot bits plus `offset`, followed by `instOffsetBits` zeros
    */
  def getPc(offset: UInt) = {
    // highest bit of the slot-index field that `getOffset` extracts
    def carryBit = log2Ceil(PredictWidth) + instOffsetBits
    def getHigher(pc: UInt) = pc(VAddrBits-1, carryBit+1)
    def getOffset(pc: UInt) = pc(carryBit, instOffsetBits)
    // the upper bits come from nextLineAddr only when the slot is flagged in
    // isNextMask AND startAddr already has `carryBit` set
    val useNextLine = isNextMask(offset) && startAddr(carryBit)
    Cat(getHigher(Mux(useNextLine, nextLineAddr, startAddr)),
        getOffset(startAddr)+offset, 0.U(instOffsetBits.W))
  }

  /** Drives every field of this bundle from a branch-prediction response.
    *
    * Index 3 of the duplicated response fields is used throughout.
    *
    * @param resp prediction bundle to copy from
    * @return this bundle, to allow chaining
    */
  def fromBranchPrediction(resp: BranchPredictionBundle) = {
    val startPc = resp.pc(3)
    this.startAddr := startPc
    this.nextLineAddr := startPc + (FetchWidth * 4 * 2).U // may be broken on other configs
    // slot i is flagged when (start slot index + i) overflows log2Ceil(PredictWidth) bits
    this.isNextMask := VecInit((0 until PredictWidth).map(i =>
      (startPc(log2Ceil(PredictWidth), 1) +& i.U)(log2Ceil(PredictWidth)).asBool
    ))
    this.fallThruError := resp.fallThruError(3)
    this
  }

  override def toPrintable: Printable = {
    p"startAddr:${Hexadecimal(startAddr)}"
  }
}
10809c6f1ddSLingrui98
/** Predecode summary kept for one FTQ entry.
  *
  * `jmpInfo.bits` holds, in order, (0) isJalr, (1) isCall, (2) isRet of the first
  * valid jal/jalr in the block, as packed by `fromPdWb`.
  */
class Ftq_pd_Entry(implicit p: Parameters) extends XSBundle {
  val brMask = Vec(PredictWidth, Bool())
  val jmpInfo = ValidUndirectioned(Vec(3, Bool()))
  val jmpOffset = UInt(log2Ceil(PredictWidth).W)
  val jalTarget = UInt(VAddrBits.W)
  val rvcMask = Vec(PredictWidth, Bool())

  def hasJal  = jmpInfo.valid && !jmpInfo.bits(0)
  def hasJalr = jmpInfo.valid && jmpInfo.bits(0)
  def hasCall = jmpInfo.valid && jmpInfo.bits(1)
  def hasRet  = jmpInfo.valid && jmpInfo.bits(2)

  /** Drives every field of this entry from a predecode writeback.
    *
    * @param pdWb writeback bundle holding the per-slot predecode info and the jal target
    */
  def fromPdWb(pdWb: PredecodeWritebackBundle) = {
    val pds = pdWb.pd
    // per-slot "valid jal or jalr" flags, shared by the three selections below
    val jmpValids = pds.map(pd => (pd.isJal || pd.isJalr) && pd.valid)

    this.brMask := VecInit(pds.map(pd => pd.isBr && pd.valid))
    this.rvcMask := VecInit(pds.map(_.isRVC))
    this.jalTarget := pdWb.jalTarget

    this.jmpInfo.valid := VecInit(jmpValids).asUInt.orR
    this.jmpInfo.bits := ParallelPriorityMux(jmpValids,
                                             pds.map(pd => VecInit(pd.isJalr, pd.isCall, pd.isRet)))
    this.jmpOffset := ParallelPriorityEncoder(jmpValids)
  }

  /** Rebuilds the predecode info of slot `offset` from the stored summary.
    *
    * @param offset slot index; its width must be exactly `log2Ceil(PredictWidth)`
    * @return a `PreDecodeInfo` wire whose `valid` is tied high
    */
  def toPd(offset: UInt) = {
    require(offset.getWidth == log2Ceil(PredictWidth))
    val isBr = brMask(offset)
    // true when `offset` is the recorded jump slot and that record is valid
    val atJmp = offset === jmpOffset && jmpInfo.valid
    val isJalr = atJmp && jmpInfo.bits(0)

    val pd = Wire(new PreDecodeInfo)
    pd.valid := true.B
    pd.isRVC := rvcMask(offset)
    pd.brType := Cat(atJmp, isJalr || isBr)
    pd.isCall := atJmp && jmpInfo.bits(1)
    pd.isRet  := atJmp && jmpInfo.bits(2)
    pd
  }
}
14409c6f1ddSLingrui98
/** Pair of pointer values, each `log2Up(FtqSize)` bits wide. */
class PrefetchPtrDB(implicit p: Parameters) extends Bundle {
  val fromFtqPtr, fromIfuPtr = UInt(log2Up(p(XSCoreParamsKey).FtqSize).W)
}
14909c6f1ddSLingrui98
/** Entry type of the FTQ redirect SRAM: everything in `SpeculativeInfo`
  * plus one `sc_disagree` flag per branch slot (`numBr` of them).
  */
class Ftq_Redirect_SRAMEntry(implicit p: Parameters) extends SpeculativeInfo {
  val sc_disagree = Vec(numBr, Bool())
}
15309c6f1ddSLingrui98
/** Single-field entry holding `MaxMetaLength` bits of metadata. */
class Ftq_1R_SRAMEntry(implicit p: Parameters) extends XSBundle with HasBPUConst {
  val meta = UInt(MaxMetaLength.W)
}
15709c6f1ddSLingrui98
/** A target address together with an optional (valid-qualified) slot index. */
class Ftq_Pred_Info(implicit p: Parameters) extends XSBundle {
  // full-width virtual address
  val target   = UInt(VAddrBits.W)
  // slot index inside the block; only meaningful while `cfiIndex.valid` is set
  val cfiIndex = ValidUndirectioned(UInt(log2Ceil(PredictWidth).W))
}
16209c6f1ddSLingrui98
16309c6f1ddSLingrui98
/** Read port seen from the requester: it drives `ptr` and `offset` and receives
  * `data` of type `gen`.
  *
  * @param gen type of the data returned through the port
  */
class FtqRead[T <: Data](private val gen: T)(implicit p: Parameters) extends XSBundle {
  val ptr = Output(new FtqPtr)
  val offset = Output(UInt(log2Ceil(PredictWidth).W))
  val data = Input(gen)

  /** Connects the request fields and hands back the data field.
    *
    * @param ptr    value connected to this port's `ptr`
    * @param offset value connected to this port's `offset`
    * @return this port's `data`
    */
  def apply(ptr: FtqPtr, offset: UInt) = {
    this.offset := offset
    this.ptr := ptr
    data
  }
}
17409c6f1ddSLingrui98
17509c6f1ddSLingrui98
/** Signals going from the FTQ to the BPU: a redirect, an update, and the
  * current enqueue pointer.
  */
class FtqToBpuIO(implicit p: Parameters) extends XSBundle {
  // valid-qualified payloads
  val redirect = Valid(new BranchPredictionRedirect)
  val update   = Valid(new BranchPredictionUpdate)
  // plain output, no valid bit
  val enq_ptr  = Output(new FtqPtr)
}
18109c6f1ddSLingrui98
/** Signals going from the FTQ to the IFU: the fetch request, two redirect
  * channels, and the flush pointers of BPU stages 2 and 3.
  */
class FtqToIfuIO(implicit p: Parameters) extends XSBundle with HasCircularQueuePtrHelper {
  val req = Decoupled(new FetchRequestBundle)
  val redirect, topdown_redirect = Valid(new BranchPredictionRedirect)
  val flushFromBpu = new Bundle {
    // when ifu pipeline is not stalled,
    // a packet from bpu s3 can reach f1 at most
    val s2, s3 = Valid(new FtqPtr)

    /** True when `src` is valid and its pointer is NOT after `idx_to_flush`. */
    def shouldFlushBy(src: Valid[FtqPtr], idx_to_flush: FtqPtr) = {
      val srcIsAfter = isAfter(src.bits, idx_to_flush)
      src.valid && !srcIsAfter
    }
    def shouldFlushByStage2(idx: FtqPtr) = shouldFlushBy(s2, idx)
    def shouldFlushByStage3(idx: FtqPtr) = shouldFlushBy(s3, idx)
  }
}
19809c6f1ddSLingrui98
/** Request channel from the FTQ to the ICache. */
class FtqToICacheIO(implicit p: Parameters) extends XSBundle with HasCircularQueuePtrHelper {
  // NOTE: req.bits must be prepared in cycle T,
  // while req.valid is set true in cycle T + 1
  val req = Decoupled(new FtqToICacheRequestBundle)
}
204c5c5edaeSJenius
/** Small helpers shared by the blocks that deal with backend redirects. */
trait HasBackendRedirectInfo extends HasXSParameter {
  /** Jump-unit count plus ALU count plus one. */
  def numRedirectPcRead = 1 + exuParameters.JmpCnt + exuParameters.AluCnt

  /** Forwards to `flushItself()` of the redirect carried by `r`. */
  def isLoadReplay(r: Valid[Redirect]) = {
    val redirect = r.bits
    redirect.flushItself()
  }
}
20909c6f1ddSLingrui98
/** Signals going from the FTQ to the backend control block: a write port into
  * the backend's PC memory and the target/pointer of the newest entry.
  */
class FtqToCtrlIO(implicit p: Parameters) extends XSBundle with HasBackendRedirectInfo {
  // write to backend pc mem
  val pc_mem_wen   = Output(Bool())
  val pc_mem_waddr = Output(UInt(log2Ceil(FtqSize).W))
  val pc_mem_wdata = Output(new Ftq_RF_Components)

  // newest target
  val newest_entry_target = Output(UInt(VAddrBits.W))
  val newest_entry_ptr    = Output(new FtqPtr)
}
21909c6f1ddSLingrui98
22009c6f1ddSLingrui98
/** Combinational generator of the FTB entry to write back for one fetch block.
  *
  * When `io.hit` is low the output is a freshly initialised entry (`init_entry`)
  * built from the predecode info and the taken control-flow instruction.
  * When `io.hit` is high the output is derived from `io.old_entry`, choosing in
  * priority order: a copy with a new branch inserted, a copy with the jalr target
  * replaced, or a copy whose `always_taken` bits have been re-evaluated.
  *
  * Besides the entry itself the module reports the insert position of a new
  * branch, taken and mispredict masks computed on the NEW entry, and a set of
  * flags intended for performance counters.
  */
22109c6f1ddSLingrui98class FTBEntryGen(implicit p: Parameters) extends XSModule with HasBackendRedirectInfo with HasBPUParameter {
22209c6f1ddSLingrui98  val io = IO(new Bundle {
22309c6f1ddSLingrui98    val start_addr = Input(UInt(VAddrBits.W))
22409c6f1ddSLingrui98    val old_entry = Input(new FTBEntry)
22509c6f1ddSLingrui98    val pd = Input(new Ftq_pd_Entry)
22609c6f1ddSLingrui98    val cfiIndex = Flipped(Valid(UInt(log2Ceil(PredictWidth).W)))
22709c6f1ddSLingrui98    val target = Input(UInt(VAddrBits.W))
22809c6f1ddSLingrui98    val hit = Input(Bool())
22909c6f1ddSLingrui98    val mispredict_vec = Input(Vec(PredictWidth, Bool()))
23009c6f1ddSLingrui98
23109c6f1ddSLingrui98    val new_entry = Output(new FTBEntry)
23209c6f1ddSLingrui98    val new_br_insert_pos = Output(Vec(numBr, Bool()))
23309c6f1ddSLingrui98    val taken_mask = Output(Vec(numBr, Bool()))
234803124a6SLingrui98    val jmp_taken = Output(Bool())
23509c6f1ddSLingrui98    val mispred_mask = Output(Vec(numBr+1, Bool()))
23609c6f1ddSLingrui98
23709c6f1ddSLingrui98    // for perf counters
23809c6f1ddSLingrui98    val is_init_entry = Output(Bool())
23909c6f1ddSLingrui98    val is_old_entry = Output(Bool())
24009c6f1ddSLingrui98    val is_new_br = Output(Bool())
24109c6f1ddSLingrui98    val is_jalr_target_modified = Output(Bool())
24209c6f1ddSLingrui98    val is_always_taken_modified = Output(Bool())
24309c6f1ddSLingrui98    val is_br_full = Output(Bool())
24409c6f1ddSLingrui98  })
24509c6f1ddSLingrui98
24609c6f1ddSLingrui98  // no mispredictions detected at predecode
24709c6f1ddSLingrui98  val hit = io.hit
24809c6f1ddSLingrui98  val pd = io.pd
24909c6f1ddSLingrui98
  // all-zero default; the fields below override it (partly inside `when` blocks)
25009c6f1ddSLingrui98  val init_entry = WireInit(0.U.asTypeOf(new FTBEntry))
25109c6f1ddSLingrui98
25209c6f1ddSLingrui98
  // the slot selected by io.cfiIndex is flagged in pd.brMask and the index is valid
25309c6f1ddSLingrui98  val cfi_is_br = pd.brMask(io.cfiIndex.bits) && io.cfiIndex.valid
25409c6f1ddSLingrui98  val entry_has_jmp = pd.jmpInfo.valid
  // kind of the recorded jump (pd.jmpInfo.bits: 0 = jalr, 1 = call, 2 = ret),
  // each additionally gated by io.cfiIndex.valid
25509c6f1ddSLingrui98  val new_jmp_is_jal  = entry_has_jmp && !pd.jmpInfo.bits(0) && io.cfiIndex.valid
25609c6f1ddSLingrui98  val new_jmp_is_jalr = entry_has_jmp &&  pd.jmpInfo.bits(0) && io.cfiIndex.valid
25709c6f1ddSLingrui98  val new_jmp_is_call = entry_has_jmp &&  pd.jmpInfo.bits(1) && io.cfiIndex.valid
25809c6f1ddSLingrui98  val new_jmp_is_ret  = entry_has_jmp &&  pd.jmpInfo.bits(2) && io.cfiIndex.valid
  // the recorded jump sits in the last slot and is not flagged in rvcMask
25909c6f1ddSLingrui98  val last_jmp_rvi = entry_has_jmp && pd.jmpOffset === (PredictWidth-1).U && !pd.rvcMask.last
260a60a2901SLingrui98  // val last_br_rvi = cfi_is_br && io.cfiIndex.bits === (PredictWidth-1).U && !pd.rvcMask.last
26109c6f1ddSLingrui98
  // the slot selected by io.cfiIndex is the recorded jal / jalr itself
26209c6f1ddSLingrui98  val cfi_is_jal = io.cfiIndex.bits === pd.jmpOffset && new_jmp_is_jal
26309c6f1ddSLingrui98  val cfi_is_jalr = io.cfiIndex.bits === pd.jmpOffset && new_jmp_is_jalr
26409c6f1ddSLingrui98
  // getLower extracts pc bits [carryPos-1 : instOffsetBits]
265a60a2901SLingrui98  def carryPos = log2Ceil(PredictWidth)+instOffsetBits
26609c6f1ddSLingrui98  def getLower(pc: UInt) = pc(carryPos-1, instOffsetBits)
26709c6f1ddSLingrui98  // if not hit, establish a new entry
26809c6f1ddSLingrui98  init_entry.valid := true.B
26909c6f1ddSLingrui98  // tag is left for ftb to assign
270eeb5ff92SLingrui98
271eeb5ff92SLingrui98  // case br
272eeb5ff92SLingrui98  val init_br_slot = init_entry.getSlotForBr(0)
273eeb5ff92SLingrui98  when (cfi_is_br) {
274eeb5ff92SLingrui98    init_br_slot.valid := true.B
275eeb5ff92SLingrui98    init_br_slot.offset := io.cfiIndex.bits
276b37e4b45SLingrui98    init_br_slot.setLowerStatByTarget(io.start_addr, io.target, numBr == 1)
277eeb5ff92SLingrui98    init_entry.always_taken(0) := true.B // set to always taken on init
278eeb5ff92SLingrui98  }
279eeb5ff92SLingrui98
280eeb5ff92SLingrui98  // case jmp
281eeb5ff92SLingrui98  when (entry_has_jmp) {
282eeb5ff92SLingrui98    init_entry.tailSlot.offset := pd.jmpOffset
283eeb5ff92SLingrui98    init_entry.tailSlot.valid := new_jmp_is_jal || new_jmp_is_jalr
    // target: io.target when the selected slot is the jalr, otherwise the predecoded jal target
284eeb5ff92SLingrui98    init_entry.tailSlot.setLowerStatByTarget(io.start_addr, Mux(cfi_is_jalr, io.target, pd.jalTarget), isShare=false)
285eeb5ff92SLingrui98  }
286eeb5ff92SLingrui98
  // start slot bits + jump slot + 1 (slot flagged in rvcMask) or + 2 (not flagged), using width-expanding adds
28709c6f1ddSLingrui98  val jmpPft = getLower(io.start_addr) +& pd.jmpOffset +& Mux(pd.rvcMask(pd.jmpOffset), 1.U, 2.U)
  // use jmpPft when there is a jump that is not a last-slot non-RVC one;
  // otherwise keep the start slot bits and force carry high
288a60a2901SLingrui98  init_entry.pftAddr := Mux(entry_has_jmp && !last_jmp_rvi, jmpPft, getLower(io.start_addr))
289a60a2901SLingrui98  init_entry.carry   := Mux(entry_has_jmp && !last_jmp_rvi, jmpPft(carryPos-instOffsetBits), true.B)
29009c6f1ddSLingrui98  init_entry.isJalr := new_jmp_is_jalr
29109c6f1ddSLingrui98  init_entry.isCall := new_jmp_is_call
29209c6f1ddSLingrui98  init_entry.isRet  := new_jmp_is_ret
293f4ebc4b2SLingrui98  // that means fall thru points to the middle of an inst
  // NOTE(review): unlike last_jmp_rvi this is not gated by entry_has_jmp -- confirm that is intended
294ae409b75SSteve Gou  init_entry.last_may_be_rvi_call := pd.jmpOffset === (PredictWidth-1).U && !pd.rvcMask(pd.jmpOffset)
29509c6f1ddSLingrui98
29609c6f1ddSLingrui98  // if hit, check whether a new cfi(only br is possible) is detected
29709c6f1ddSLingrui98  val oe = io.old_entry
298eeb5ff92SLingrui98  val br_recorded_vec = oe.getBrRecordedVec(io.cfiIndex.bits)
29909c6f1ddSLingrui98  val br_recorded = br_recorded_vec.asUInt.orR
30009c6f1ddSLingrui98  val is_new_br = cfi_is_br && !br_recorded
30109c6f1ddSLingrui98  val new_br_offset = io.cfiIndex.bits
30209c6f1ddSLingrui98  // vec(i) means new br will be inserted BEFORE old br(i)
303eeb5ff92SLingrui98  val allBrSlotsVec = oe.allSlotsForBr
30409c6f1ddSLingrui98  val new_br_insert_onehot = VecInit((0 until numBr).map{
30509c6f1ddSLingrui98    i => i match {
      // position 0: slot 0 is empty, or the new branch lies before it
306eeb5ff92SLingrui98      case 0 =>
307eeb5ff92SLingrui98        !allBrSlotsVec(0).valid || new_br_offset < allBrSlotsVec(0).offset
      // position idx: the previous slot is valid and lies before the new branch,
      // and slot idx is empty or lies after it
308eeb5ff92SLingrui98      case idx =>
309eeb5ff92SLingrui98        allBrSlotsVec(idx-1).valid && new_br_offset > allBrSlotsVec(idx-1).offset &&
310eeb5ff92SLingrui98        (!allBrSlotsVec(idx).valid || new_br_offset < allBrSlotsVec(idx).offset)
31109c6f1ddSLingrui98    }
31209c6f1ddSLingrui98  })
31309c6f1ddSLingrui98
  // copy of the old entry with the new branch inserted; per slot i one of:
  //   - insert here: take the new branch and mark it always taken
  //   - new branch lies after old slot i: keep the slot, clear always_taken(i)
  //   - otherwise (i != 0): take over the content of old slot i-1, unless this is
  //     the last slot and the last entry of oe.brSlots is invalid
31409c6f1ddSLingrui98  val old_entry_modified = WireInit(io.old_entry)
31509c6f1ddSLingrui98  for (i <- 0 until numBr) {
316eeb5ff92SLingrui98    val slot = old_entry_modified.allSlotsForBr(i)
317eeb5ff92SLingrui98    when (new_br_insert_onehot(i)) {
318eeb5ff92SLingrui98      slot.valid := true.B
319eeb5ff92SLingrui98      slot.offset := new_br_offset
320b37e4b45SLingrui98      slot.setLowerStatByTarget(io.start_addr, io.target, i == numBr-1)
321eeb5ff92SLingrui98      old_entry_modified.always_taken(i) := true.B
322eeb5ff92SLingrui98    }.elsewhen (new_br_offset > oe.allSlotsForBr(i).offset) {
323eeb5ff92SLingrui98      old_entry_modified.always_taken(i) := false.B
324eeb5ff92SLingrui98      // all other fields remain unchanged
325eeb5ff92SLingrui98    }.otherwise {
326eeb5ff92SLingrui98      // case i == 0, remain unchanged
327eeb5ff92SLingrui98      if (i != 0) {
328b37e4b45SLingrui98        val noNeedToMoveFromFormerSlot = (i == numBr-1).B && !oe.brSlots.last.valid
329eeb5ff92SLingrui98        when (!noNeedToMoveFromFormerSlot) {
330eeb5ff92SLingrui98          slot.fromAnotherSlot(oe.allSlotsForBr(i-1))
          // NOTE(review): the slot content comes from index i-1 but always_taken from index i -- confirm
331eeb5ff92SLingrui98          old_entry_modified.always_taken(i) := oe.always_taken(i)
33209c6f1ddSLingrui98        }
333eeb5ff92SLingrui98      }
334eeb5ff92SLingrui98    }
335eeb5ff92SLingrui98  }
33609c6f1ddSLingrui98
337eeb5ff92SLingrui98  // two circumstances:
338eeb5ff92SLingrui98  // 1. oe: | br | j  |, new br should be in front of j, thus addr of j should be new pft
339eeb5ff92SLingrui98  // 2. oe: | br | br |, new br could be anywhere between, thus new pft is the addr of either
340eeb5ff92SLingrui98  //        the previous last br or the new br
341eeb5ff92SLingrui98  val may_have_to_replace = oe.noEmptySlotForNewBr
342eeb5ff92SLingrui98  val pft_need_to_change = is_new_br && may_have_to_replace
34309c6f1ddSLingrui98  // it should either be the given last br or the new br
34409c6f1ddSLingrui98  when (pft_need_to_change) {
    // no insert position found -> the new branch's own offset; otherwise the offset of the old last slot
345eeb5ff92SLingrui98    val new_pft_offset =
346710a8720SLingrui98      Mux(!new_br_insert_onehot.asUInt.orR,
347710a8720SLingrui98        new_br_offset, oe.allSlotsForBr.last.offset)
348eeb5ff92SLingrui98
349710a8720SLingrui98    // set jmp to invalid
35009c6f1ddSLingrui98    old_entry_modified.pftAddr := getLower(io.start_addr) + new_pft_offset
    // carry is the top bit of the width-expanding sum
35109c6f1ddSLingrui98    old_entry_modified.carry := (getLower(io.start_addr) +& new_pft_offset).head(1).asBool
352f4ebc4b2SLingrui98    old_entry_modified.last_may_be_rvi_call := false.B
35309c6f1ddSLingrui98    old_entry_modified.isCall := false.B
35409c6f1ddSLingrui98    old_entry_modified.isRet := false.B
355eeb5ff92SLingrui98    old_entry_modified.isJalr := false.B
35609c6f1ddSLingrui98  }
35709c6f1ddSLingrui98
  // copy of the old entry whose jump target is replaced when the selected slot is the
  // jalr, the tail slot is not shared, and the stored target differs from io.target
35809c6f1ddSLingrui98  val old_entry_jmp_target_modified = WireInit(oe)
359710a8720SLingrui98  val old_target = oe.tailSlot.getTarget(io.start_addr) // may be wrong because we store only 20 lowest bits
360b37e4b45SLingrui98  val old_tail_is_jmp = !oe.tailSlot.sharing
361eeb5ff92SLingrui98  val jalr_target_modified = cfi_is_jalr && (old_target =/= io.target) && old_tail_is_jmp // TODO: pass full jalr target
3623bcae573SLingrui98  when (jalr_target_modified) {
36309c6f1ddSLingrui98    old_entry_jmp_target_modified.setByJmpTarget(io.start_addr, io.target)
36409c6f1ddSLingrui98    old_entry_jmp_target_modified.always_taken := 0.U.asTypeOf(Vec(numBr, Bool()))
36509c6f1ddSLingrui98  }
36609c6f1ddSLingrui98
  // copy of the old entry in which always_taken(i) survives only if it was set, the
  // cfi index is valid, branch i is valid, and the cfi index equals branch i's offset
36709c6f1ddSLingrui98  val old_entry_always_taken = WireInit(oe)
36809c6f1ddSLingrui98  val always_taken_modified_vec = Wire(Vec(numBr, Bool())) // whether modified or not
36909c6f1ddSLingrui98  for (i <- 0 until numBr) {
37009c6f1ddSLingrui98    old_entry_always_taken.always_taken(i) :=
37109c6f1ddSLingrui98      oe.always_taken(i) && io.cfiIndex.valid && oe.brValids(i) && io.cfiIndex.bits === oe.brOffset(i)
372710a8720SLingrui98    always_taken_modified_vec(i) := oe.always_taken(i) && !old_entry_always_taken.always_taken(i)
37309c6f1ddSLingrui98  }
37409c6f1ddSLingrui98  val always_taken_modified = always_taken_modified_vec.reduce(_||_)
37509c6f1ddSLingrui98
37609c6f1ddSLingrui98
37709c6f1ddSLingrui98
  // priority on a hit: new branch > jalr target change > always_taken re-evaluation
37809c6f1ddSLingrui98  val derived_from_old_entry =
37909c6f1ddSLingrui98    Mux(is_new_br, old_entry_modified,
3803bcae573SLingrui98      Mux(jalr_target_modified, old_entry_jmp_target_modified, old_entry_always_taken))
38109c6f1ddSLingrui98
38209c6f1ddSLingrui98
38309c6f1ddSLingrui98  io.new_entry := Mux(!hit, init_entry, derived_from_old_entry)
38409c6f1ddSLingrui98
38509c6f1ddSLingrui98  io.new_br_insert_pos := new_br_insert_onehot
  // the masks below are evaluated on the NEW entry, not on io.old_entry
38609c6f1ddSLingrui98  io.taken_mask := VecInit((io.new_entry.brOffset zip io.new_entry.brValids).map{
38709c6f1ddSLingrui98    case (off, v) => io.cfiIndex.bits === off && io.cfiIndex.valid && v
38809c6f1ddSLingrui98  })
389803124a6SLingrui98  io.jmp_taken := io.new_entry.jmpValid && io.new_entry.tailSlot.offset === io.cfiIndex.bits
39009c6f1ddSLingrui98  for (i <- 0 until numBr) {
39109c6f1ddSLingrui98    io.mispred_mask(i) := io.new_entry.brValids(i) && io.mispredict_vec(io.new_entry.brOffset(i))
39209c6f1ddSLingrui98  }
  // last element covers the jump; it is indexed with the predecoded jump offset
39309c6f1ddSLingrui98  io.mispred_mask.last := io.new_entry.jmpValid && io.mispredict_vec(pd.jmpOffset)
39409c6f1ddSLingrui98
39509c6f1ddSLingrui98  // for perf counters
39609c6f1ddSLingrui98  io.is_init_entry := !hit
3973bcae573SLingrui98  io.is_old_entry := hit && !is_new_br && !jalr_target_modified && !always_taken_modified
39809c6f1ddSLingrui98  io.is_new_br := hit && is_new_br
3993bcae573SLingrui98  io.is_jalr_target_modified := hit && jalr_target_modified
40009c6f1ddSLingrui98  io.is_always_taken_modified := hit && always_taken_modified
401eeb5ff92SLingrui98  io.is_br_full := hit && is_new_br && may_have_to_replace
40209c6f1ddSLingrui98}
40309c6f1ddSLingrui98
/** Wraps one `SyncDataModuleTemplate` holding `FtqSize` entries of
  * `Ftq_RF_Components` with a single write port and `numOtherReads + 5` read ports.
  *
  * Read ports are laid out as: the `numOtherReads` caller-supplied addresses first,
  * then ifuPtr, ifuPtrPlus1, ifuPtrPlus2, commPtrPlus1, commPtr, in that order.
  *
  * @param numOtherReads number of extra read ports exposed through `other_raddrs` / `other_rdatas`
  */
class FtqPcMemWrapper(numOtherReads: Int)(implicit p: Parameters) extends XSModule with HasBackendRedirectInfo {
  val io = IO(new Bundle {
    val ifuPtr_w       = Input(new FtqPtr)
    val ifuPtrPlus1_w  = Input(new FtqPtr)
    val ifuPtrPlus2_w  = Input(new FtqPtr)
    val commPtr_w      = Input(new FtqPtr)
    val commPtrPlus1_w = Input(new FtqPtr)
    val ifuPtr_rdata       = Output(new Ftq_RF_Components)
    val ifuPtrPlus1_rdata  = Output(new Ftq_RF_Components)
    val ifuPtrPlus2_rdata  = Output(new Ftq_RF_Components)
    val commPtr_rdata      = Output(new Ftq_RF_Components)
    val commPtrPlus1_rdata = Output(new Ftq_RF_Components)

    val other_raddrs = Input(Vec(numOtherReads, UInt(log2Ceil(FtqSize).W)))
    val other_rdatas = Output(Vec(numOtherReads, new Ftq_RF_Components))

    val wen = Input(Bool())
    val waddr = Input(UInt(log2Ceil(FtqSize).W))
    val wdata = Input(new Ftq_RF_Components)
  })

  // pointer inputs paired with the output that receives their read data,
  // listed in the order they occupy the trailing read ports
  private def localReads = Seq(
    io.ifuPtr_w       -> io.ifuPtr_rdata,
    io.ifuPtrPlus1_w  -> io.ifuPtrPlus1_rdata,
    io.ifuPtrPlus2_w  -> io.ifuPtrPlus2_rdata,
    io.commPtrPlus1_w -> io.commPtrPlus1_rdata,
    io.commPtr_w      -> io.commPtr_rdata
  )

  val num_pc_read = numOtherReads + localReads.length
  val mem = Module(new SyncDataModuleTemplate(new Ftq_RF_Components, FtqSize,
    num_pc_read, 1, "FtqPC"))

  // single write port
  mem.io.wen(0)   := io.wen
  mem.io.waddr(0) := io.waddr
  mem.io.wdata(0) := io.wdata

  // read one cycle ahead for ftq local reads
  val raddr_vec = VecInit(io.other_raddrs ++ localReads.map(_._1.value))

  mem.io.raddr := raddr_vec

  // the leading ports belong to the caller, the trailing ones to the local pointers
  io.other_rdatas := mem.io.rdata.take(numOtherReads)
  localReads.map(_._2).zip(mem.io.rdata.drop(numOtherReads)).foreach {
    case (out, data) => out := data
  }
}
445c5c5edaeSJenius
44609c6f1ddSLingrui98class Ftq(implicit p: Parameters) extends XSModule with HasCircularQueuePtrHelper
447e30430c2SJay  with HasBackendRedirectInfo with BPUUtils with HasBPUConst with HasPerfEvents
448e30430c2SJay  with HasICacheParameters{
44909c6f1ddSLingrui98  val io = IO(new Bundle {
45009c6f1ddSLingrui98    val fromBpu = Flipped(new BpuToFtqIO)
45109c6f1ddSLingrui98    val fromIfu = Flipped(new IfuToFtqIO)
45209c6f1ddSLingrui98    val fromBackend = Flipped(new CtrlToFtqIO)
45309c6f1ddSLingrui98
45409c6f1ddSLingrui98    val toBpu = new FtqToBpuIO
45509c6f1ddSLingrui98    val toIfu = new FtqToIfuIO
456c5c5edaeSJenius    val toICache = new FtqToICacheIO
45709c6f1ddSLingrui98    val toBackend = new FtqToCtrlIO
45809c6f1ddSLingrui98
4597052722fSJay    val toPrefetch = new FtqPrefechBundle
4607052722fSJay
46109c6f1ddSLingrui98    val bpuInfo = new Bundle {
46209c6f1ddSLingrui98      val bpRight = Output(UInt(XLEN.W))
46309c6f1ddSLingrui98      val bpWrong = Output(UInt(XLEN.W))
46409c6f1ddSLingrui98    }
4651d1e6d4dSJenius
4661d1e6d4dSJenius    val mmioCommitRead = Flipped(new mmioCommitRead)
467d2b20d1aSTang Haojin
468d2b20d1aSTang Haojin    // for perf
469d2b20d1aSTang Haojin    val ControlBTBMissBubble = Output(Bool())
470d2b20d1aSTang Haojin    val TAGEMissBubble = Output(Bool())
471d2b20d1aSTang Haojin    val SCMissBubble = Output(Bool())
472d2b20d1aSTang Haojin    val ITTAGEMissBubble = Output(Bool())
473d2b20d1aSTang Haojin    val RASMissBubble = Output(Bool())
47409c6f1ddSLingrui98  })
47509c6f1ddSLingrui98  io.bpuInfo := DontCare
47609c6f1ddSLingrui98
477d2b20d1aSTang Haojin  val topdown_stage = RegInit(0.U.asTypeOf(new FrontendTopDownBundle))
478d2b20d1aSTang Haojin  dontTouch(topdown_stage)
479d2b20d1aSTang Haojin  // only driven by clock, not valid-ready
480d2b20d1aSTang Haojin  topdown_stage := io.fromBpu.resp.bits.topdown_info
481d2b20d1aSTang Haojin  io.toIfu.req.bits.topdown_info := topdown_stage
482d2b20d1aSTang Haojin
483d2b20d1aSTang Haojin  val ifuRedirected = RegInit(VecInit(Seq.fill(FtqSize)(false.B)))
484d2b20d1aSTang Haojin
485d2b20d1aSTang Haojin  val backendRedirect = Wire(Valid(new BranchPredictionRedirect))
4869342624fSGao-Zeyu  when(io.fromBackend.redirect.valid) {
4879342624fSGao-Zeyu    assert(RegNext(io.fromBackend.ftqIdxAhead.map(_.valid).reduce(_|_)))
4889342624fSGao-Zeyu    assert(io.fromBackend.ftqIdxSelOH.valid)
4899342624fSGao-Zeyu    assert(PopCount(io.fromBackend.ftqIdxSelOH.bits) === 1.U)
4909342624fSGao-Zeyu  }
49109c6f1ddSLingrui98
492df5b4b8eSYinan Xu  val stage2Flush = backendRedirect.valid
49309c6f1ddSLingrui98  val backendFlush = stage2Flush || RegNext(stage2Flush)
49409c6f1ddSLingrui98  val ifuFlush = Wire(Bool())
49509c6f1ddSLingrui98
49609c6f1ddSLingrui98  val flush = stage2Flush || RegNext(stage2Flush)
49709c6f1ddSLingrui98
49809c6f1ddSLingrui98  val allowBpuIn, allowToIfu = WireInit(false.B)
49909c6f1ddSLingrui98  val flushToIfu = !allowToIfu
5009342624fSGao-Zeyu  allowBpuIn := !ifuFlush && !backendRedirect.valid
5019342624fSGao-Zeyu  allowToIfu := !ifuFlush && !backendRedirect.valid
50209c6f1ddSLingrui98
503f56177cbSJenius  def copyNum = 5
504e30430c2SJay  val bpuPtr, ifuPtr, ifuWbPtr, commPtr = RegInit(FtqPtr(false.B, 0.U))
505c9bc5480SLingrui98  val ifuPtrPlus1 = RegInit(FtqPtr(false.B, 1.U))
5066bf9b30dSLingrui98  val ifuPtrPlus2 = RegInit(FtqPtr(false.B, 2.U))
5076bf9b30dSLingrui98  val commPtrPlus1 = RegInit(FtqPtr(false.B, 1.U))
508f56177cbSJenius  val copied_ifu_ptr = Seq.fill(copyNum)(RegInit(FtqPtr(false.B, 0.U)))
509dc270d3bSJenius  val copied_bpu_ptr = Seq.fill(copyNum)(RegInit(FtqPtr(false.B, 0.U)))
5106bf9b30dSLingrui98  require(FtqSize >= 4)
511c5c5edaeSJenius  val ifuPtr_write       = WireInit(ifuPtr)
512c5c5edaeSJenius  val ifuPtrPlus1_write  = WireInit(ifuPtrPlus1)
5136bf9b30dSLingrui98  val ifuPtrPlus2_write  = WireInit(ifuPtrPlus2)
514c5c5edaeSJenius  val ifuWbPtr_write     = WireInit(ifuWbPtr)
515c5c5edaeSJenius  val commPtr_write      = WireInit(commPtr)
5166bf9b30dSLingrui98  val commPtrPlus1_write = WireInit(commPtrPlus1)
517c5c5edaeSJenius  ifuPtr       := ifuPtr_write
518c5c5edaeSJenius  ifuPtrPlus1  := ifuPtrPlus1_write
5196bf9b30dSLingrui98  ifuPtrPlus2  := ifuPtrPlus2_write
520c5c5edaeSJenius  ifuWbPtr     := ifuWbPtr_write
521c5c5edaeSJenius  commPtr      := commPtr_write
522f83ef67eSLingrui98  commPtrPlus1 := commPtrPlus1_write
523f56177cbSJenius  copied_ifu_ptr.map{ptr =>
524f56177cbSJenius    ptr := ifuPtr_write
525f56177cbSJenius    dontTouch(ptr)
526f56177cbSJenius  }
52709c6f1ddSLingrui98  val validEntries = distanceBetween(bpuPtr, commPtr)
52843aca6c2SGuokai Chen  val canCommit = Wire(Bool())
52909c6f1ddSLingrui98
53009c6f1ddSLingrui98  // **********************************************************************
53109c6f1ddSLingrui98  // **************************** enq from bpu ****************************
53209c6f1ddSLingrui98  // **********************************************************************
  // A new entry is accepted while fewer than FtqSize entries are occupied, or when canCommit
  // is asserted.
53343aca6c2SGuokai Chen  val new_entry_ready = validEntries < FtqSize.U || canCommit
53409c6f1ddSLingrui98  io.fromBpu.resp.ready := new_entry_ready
53509c6f1ddSLingrui98
53609c6f1ddSLingrui98  val bpu_s2_resp = io.fromBpu.resp.bits.s2
537cb4f77ceSLingrui98  val bpu_s3_resp = io.fromBpu.resp.bits.s3
  // A stage redirects when element 3 of both its valid and hasRedirect vectors is set.
  // NOTE(review): element 3 presumably selects the copy dedicated to the FTQ — confirm.
538adc0b8dfSGuokai Chen  val bpu_s2_redirect = bpu_s2_resp.valid(3) && bpu_s2_resp.hasRedirect(3)
539adc0b8dfSGuokai Chen  val bpu_s3_redirect = bpu_s3_resp.valid(3) && bpu_s3_resp.hasRedirect(3)
54009c6f1ddSLingrui98
  // The BPU is told the current enqueue pointer.
54109c6f1ddSLingrui98  io.toBpu.enq_ptr := bpuPtr
  // enq_fire: a handshake on the response channel while allowBpuIn is set; it advances bpuPtr.
  // bpu_in_fire: additionally true on an s2/s3 redirect, which rewrites an existing entry.
542935edac4STang Haojin  val enq_fire = io.fromBpu.resp.fire && allowBpuIn // from bpu s1
543935edac4STang Haojin  val bpu_in_fire = (io.fromBpu.resp.fire || bpu_s2_redirect || bpu_s3_redirect) && allowBpuIn
54409c6f1ddSLingrui98
545b37e4b45SLingrui98  val bpu_in_resp = io.fromBpu.resp.bits.selectedResp
546adc0b8dfSGuokai Chen  val bpu_in_stage = io.fromBpu.resp.bits.selectedRespIdxForFtq
  // An S1 response is written at bpuPtr; any other stage is written at the ftq_idx carried by
  // the response itself.
54709c6f1ddSLingrui98  val bpu_in_resp_ptr = Mux(bpu_in_stage === BP_S1, bpuPtr, bpu_in_resp.ftq_idx)
54809c6f1ddSLingrui98  val bpu_in_resp_idx = bpu_in_resp_ptr.value
54909c6f1ddSLingrui98
550378f00d9SJenius  // read ports:      prefetchReq ++  ifuReq1 + ifuReq2 + ifuReq3 + commitUpdate2 + commitUpdate
  // PC memory: written whenever a BPU response (any stage) is taken, at the selected entry index.
551378f00d9SJenius  val ftq_pc_mem = Module(new FtqPcMemWrapper(1))
5526bf9b30dSLingrui98  // resp from uBTB
553c5c5edaeSJenius  ftq_pc_mem.io.wen := bpu_in_fire
554c5c5edaeSJenius  ftq_pc_mem.io.waddr := bpu_in_resp_idx
555c5c5edaeSJenius  ftq_pc_mem.io.wdata.fromBranchPrediction(bpu_in_resp)
55609c6f1ddSLingrui98
55709c6f1ddSLingrui98  //                                                            ifuRedirect + backendRedirect + commit
  // Redirect SRAM with 1 + BackendRedirectNum + 1 read ports; written with the speculative info
  // of the BPU's last stage, at the last stage's ftq_idx.
5589342624fSGao-Zeyu  val ftq_redirect_sram = Module(new FtqNRSRAM(new Ftq_Redirect_SRAMEntry, 1+BackendRedirectNum+1))
55909c6f1ddSLingrui98  // these info is intended to enq at the last stage of bpu
560adc0b8dfSGuokai Chen  ftq_redirect_sram.io.wen := io.fromBpu.resp.bits.lastStage.valid(3)
56109c6f1ddSLingrui98  ftq_redirect_sram.io.waddr := io.fromBpu.resp.bits.lastStage.ftq_idx.value
562c2d1ec7dSLingrui98  ftq_redirect_sram.io.wdata := io.fromBpu.resp.bits.last_stage_spec_info
  // Elaboration-time size report.
  // NOTE(review): the trailing "* 3" is a literal, while the SRAM above is built with
  // 1+BackendRedirectNum+1 read ports — confirm whether the message should track that count.
56349cbc998SLingrui98  println(f"ftq redirect SRAM: entry ${ftq_redirect_sram.io.wdata.getWidth} * ${FtqSize} * 3")
56449cbc998SLingrui98  println(f"ftq redirect SRAM: ahead fh ${ftq_redirect_sram.io.wdata.afhob.getWidth} * ${FtqSize} * 3")
56509c6f1ddSLingrui98
  // Predictor meta SRAM (single read port), written under the same condition and address.
56609c6f1ddSLingrui98  val ftq_meta_1r_sram = Module(new FtqNRSRAM(new Ftq_1R_SRAMEntry, 1))
56709c6f1ddSLingrui98  // these info is intended to enq at the last stage of bpu
568adc0b8dfSGuokai Chen  ftq_meta_1r_sram.io.wen := io.fromBpu.resp.bits.lastStage.valid(3)
56909c6f1ddSLingrui98  ftq_meta_1r_sram.io.waddr := io.fromBpu.resp.bits.lastStage.ftq_idx.value
570c2d1ec7dSLingrui98  ftq_meta_1r_sram.io.wdata.meta := io.fromBpu.resp.bits.last_stage_meta
57109c6f1ddSLingrui98  //                                                            ifuRedirect + backendRedirect + commit
  // FTB entry memory: 1 + BackendRedirectNum + 1 read ports and one write port, also written
  // from the BPU's last stage.
5729342624fSGao-Zeyu  val ftb_entry_mem = Module(new SyncDataModuleTemplate(new FTBEntry, FtqSize, 1+BackendRedirectNum+1, 1))
573adc0b8dfSGuokai Chen  ftb_entry_mem.io.wen(0) := io.fromBpu.resp.bits.lastStage.valid(3)
57409c6f1ddSLingrui98  ftb_entry_mem.io.waddr(0) := io.fromBpu.resp.bits.lastStage.ftq_idx.value
575c2d1ec7dSLingrui98  ftb_entry_mem.io.wdata(0) := io.fromBpu.resp.bits.last_stage_ftb_entry
57609c6f1ddSLingrui98
57709c6f1ddSLingrui98
57809c6f1ddSLingrui98  // multi-write
  // Per-entry state held in registers (one element per FTQ entry), plus the target and pointer
  // of the most recently written entry.
579b0ed7239SLingrui98  val update_target = Reg(Vec(FtqSize, UInt(VAddrBits.W))) // could be taken target or fallThrough //TODO: remove this
5806bf9b30dSLingrui98  val newest_entry_target = Reg(UInt(VAddrBits.W))
5816bf9b30dSLingrui98  val newest_entry_ptr = Reg(new FtqPtr)
58209c6f1ddSLingrui98  val cfiIndex_vec = Reg(Vec(FtqSize, ValidUndirectioned(UInt(log2Ceil(PredictWidth).W))))
58309c6f1ddSLingrui98  val mispredict_vec = Reg(Vec(FtqSize, Vec(PredictWidth, Bool())))
58409c6f1ddSLingrui98  val pred_stage = Reg(Vec(FtqSize, UInt(2.W)))
  // Only instantiated when not targeting the FPGA platform; 64-bit value per entry.
585209a4cafSSteve Gou  val pred_s1_cycle = if (!env.FPGAPlatform) Some(Reg(Vec(FtqSize, UInt(64.W)))) else None
58609c6f1ddSLingrui98
  // Commit state of every instruction slot (PredictWidth per entry); all slots reset to c_invalid.
587b5808fc2Ssfencevma  val c_invalid :: c_valid :: c_commited :: Nil = Enum(3)
58809c6f1ddSLingrui98  val commitStateQueue = RegInit(VecInit(Seq.fill(FtqSize) {
58909c6f1ddSLingrui98    VecInit(Seq.fill(PredictWidth)(c_invalid))
59009c6f1ddSLingrui98  }))
59109c6f1ddSLingrui98
  // Whether an entry still has to be sent to the IFU; entries reset to f_sent.
59209c6f1ddSLingrui98  val f_to_send :: f_sent :: Nil = Enum(2)
59309c6f1ddSLingrui98  val entry_fetch_status = RegInit(VecInit(Seq.fill(FtqSize)(f_sent)))
59409c6f1ddSLingrui98
  // FTB hit status of an entry; entries reset to h_not_hit.
59509c6f1ddSLingrui98  val h_not_hit :: h_false_hit :: h_hit :: Nil = Enum(3)
59609c6f1ddSLingrui98  val entry_hit_status = RegInit(VecInit(Seq.fill(FtqSize)(h_not_hit)))
59709c6f1ddSLingrui98
598f63797a4SLingrui98  // modify registers one cycle later to cut critical path
  // One-cycle-delayed copies of the BPU write event, its pointer, target, cfi index and stage.
599f63797a4SLingrui98  val last_cycle_bpu_in = RegNext(bpu_in_fire)
6006bf9b30dSLingrui98  val last_cycle_bpu_in_ptr = RegNext(bpu_in_resp_ptr)
6016bf9b30dSLingrui98  val last_cycle_bpu_in_idx = last_cycle_bpu_in_ptr.value
602adc0b8dfSGuokai Chen  val last_cycle_bpu_target = RegNext(bpu_in_resp.getTarget(3))
603adc0b8dfSGuokai Chen  val last_cycle_cfiIndex = RegNext(bpu_in_resp.cfiIndex(3))
604f63797a4SLingrui98  val last_cycle_bpu_in_stage = RegNext(bpu_in_stage)
605f56177cbSJenius
  // Number of extra duplicated registers dedicated to the commitStateQueue reset logic below.
6067be982afSLingrui98  def extra_copyNum_for_commitStateQueue = 2
  // copyNum + 2 duplicates of last_cycle_bpu_in, and 2 duplicates of the delayed pointer.
6077be982afSLingrui98  val copied_last_cycle_bpu_in = VecInit(Seq.fill(copyNum+extra_copyNum_for_commitStateQueue)(RegNext(bpu_in_fire)))
6087be982afSLingrui98  val copied_last_cycle_bpu_in_ptr_for_ftq = VecInit(Seq.fill(extra_copyNum_for_commitStateQueue)(RegNext(bpu_in_resp_ptr)))
609f56177cbSJenius
  // One cycle after a BPU write: mark the entry as to-be-sent and record its cfi index, the
  // predicting stage and its target; the entry also becomes the "newest" entry.
610f63797a4SLingrui98  when (last_cycle_bpu_in) {
611f63797a4SLingrui98    entry_fetch_status(last_cycle_bpu_in_idx) := f_to_send
612f63797a4SLingrui98    cfiIndex_vec(last_cycle_bpu_in_idx) := last_cycle_cfiIndex
613f63797a4SLingrui98    pred_stage(last_cycle_bpu_in_idx) := last_cycle_bpu_in_stage
6146bf9b30dSLingrui98
615b0ed7239SLingrui98    update_target(last_cycle_bpu_in_idx) := last_cycle_bpu_target // TODO: remove this
6166bf9b30dSLingrui98    newest_entry_target := last_cycle_bpu_target
6176bf9b30dSLingrui98    newest_entry_ptr := last_cycle_bpu_in_ptr
61809c6f1ddSLingrui98  }
61909c6f1ddSLingrui98
6207be982afSLingrui98  // reduce fanout by delay write for a cycle
  // Two cycles after the BPU write, all mispredict bits of that entry are cleared.
6217be982afSLingrui98  when (RegNext(last_cycle_bpu_in)) {
6227be982afSLingrui98    mispredict_vec(RegNext(last_cycle_bpu_in_idx)) := WireInit(VecInit(Seq.fill(PredictWidth)(false.B)))
6237be982afSLingrui98  }
6247be982afSLingrui98
625209a4cafSSteve Gou  // record s1 pred cycles
  // Written in the same cycle as an S1 write (not delayed); falls back to 0 when the prediction
  // carries no predCycle. Nothing is generated when pred_s1_cycle is None.
626209a4cafSSteve Gou  pred_s1_cycle.map(vec => {
627209a4cafSSteve Gou    when (bpu_in_fire && (bpu_in_stage === BP_S1)) {
628209a4cafSSteve Gou      vec(bpu_in_resp_ptr.value) := bpu_in_resp.full_pred(0).predCycle.getOrElse(0.U)
629209a4cafSSteve Gou    }
630209a4cafSSteve Gou  })
631209a4cafSSteve Gou
6327be982afSLingrui98  // reduce fanout using copied last_cycle_bpu_in and copied last_cycle_bpu_in_ptr
  // The last extra_copyNum_for_commitStateQueue copies each own a contiguous slice of the queue:
  // copy i resets entries i*perSetEntries until (i+1)*perSetEntries to c_invalid when the delayed
  // write pointer falls inside its slice. FtqSize must divide evenly among the copies.
6337be982afSLingrui98  val copied_last_cycle_bpu_in_for_ftq = copied_last_cycle_bpu_in.takeRight(extra_copyNum_for_commitStateQueue)
6347be982afSLingrui98  copied_last_cycle_bpu_in_for_ftq.zip(copied_last_cycle_bpu_in_ptr_for_ftq).zipWithIndex.map {
6357be982afSLingrui98    case ((in, ptr), i) =>
6367be982afSLingrui98      when (in) {
6377be982afSLingrui98        val perSetEntries = FtqSize / extra_copyNum_for_commitStateQueue // 32
6387be982afSLingrui98        require(FtqSize % extra_copyNum_for_commitStateQueue == 0)
6397be982afSLingrui98        for (j <- 0 until perSetEntries) {
6409361b0c5SLingrui98          when (ptr.value === (i*perSetEntries+j).U) {
6417be982afSLingrui98            commitStateQueue(i*perSetEntries+j) := VecInit(Seq.fill(PredictWidth)(c_invalid))
6427be982afSLingrui98          }
6437be982afSLingrui98        }
6447be982afSLingrui98      }
6459361b0c5SLingrui98  }
6467be982afSLingrui98
647873dc383SLingrui98  // num cycle is fixed
  // The backend sees the newest entry pointer/target through one more register stage.
648873dc383SLingrui98  io.toBackend.newest_entry_ptr := RegNext(newest_entry_ptr)
649873dc383SLingrui98  io.toBackend.newest_entry_target := RegNext(newest_entry_target)
650873dc383SLingrui98
651f63797a4SLingrui98
// Pointer movement on enqueue, on IFU request, and on BPU s2/s3 redirects. The statements rely
// on Chisel last-connect order: the s3 redirect block comes last, so its assignments take
// priority over the s2 block, which in turn overrides the default advance.
65209c6f1ddSLingrui98  bpuPtr := bpuPtr + enq_fire
653dc270d3bSJenius  copied_bpu_ptr.map(_ := bpuPtr + enq_fire)
  // A request accepted by the IFU (with allowToIfu set) shifts the three IFU pointers by one.
654c9bc5480SLingrui98  when (io.toIfu.req.fire && allowToIfu) {
655c5c5edaeSJenius    ifuPtr_write := ifuPtrPlus1
6566bf9b30dSLingrui98    ifuPtrPlus1_write := ifuPtrPlus2
6576bf9b30dSLingrui98    ifuPtrPlus2_write := ifuPtrPlus2 + 1.U
658c9bc5480SLingrui98  }
65909c6f1ddSLingrui98
66009c6f1ddSLingrui98  // only use ftb result to assign hit status
661adc0b8dfSGuokai Chen  when (bpu_s2_resp.valid(3)) {
662adc0b8dfSGuokai Chen    entry_hit_status(bpu_s2_resp.ftq_idx.value) := Mux(bpu_s2_resp.full_pred(3).hit, h_hit, h_not_hit)
66309c6f1ddSLingrui98  }
66409c6f1ddSLingrui98
66509c6f1ddSLingrui98
  // s2 redirect: tell the IFU which entry to flush from, and restart enqueue right after it.
6662f4a3aa4SLingrui98  io.toIfu.flushFromBpu.s2.valid := bpu_s2_redirect
66709c6f1ddSLingrui98  io.toIfu.flushFromBpu.s2.bits := bpu_s2_resp.ftq_idx
668adc0b8dfSGuokai Chen  when (bpu_s2_redirect) {
66909c6f1ddSLingrui98    bpuPtr := bpu_s2_resp.ftq_idx + 1.U
670dc270d3bSJenius    copied_bpu_ptr.map(_ := bpu_s2_resp.ftq_idx + 1.U)
67109c6f1ddSLingrui98    // only when ifuPtr runs ahead of bpu s2 resp should we recover it
67209c6f1ddSLingrui98    when (!isBefore(ifuPtr, bpu_s2_resp.ftq_idx)) {
673c5c5edaeSJenius      ifuPtr_write := bpu_s2_resp.ftq_idx
674c5c5edaeSJenius      ifuPtrPlus1_write := bpu_s2_resp.ftq_idx + 1.U
6756bf9b30dSLingrui98      ifuPtrPlus2_write := bpu_s2_resp.ftq_idx + 2.U
67609c6f1ddSLingrui98    }
67709c6f1ddSLingrui98  }
67809c6f1ddSLingrui98
  // s3 redirect: same handling as s2, using the s3 response's ftq_idx.
679cb4f77ceSLingrui98  io.toIfu.flushFromBpu.s3.valid := bpu_s3_redirect
680cb4f77ceSLingrui98  io.toIfu.flushFromBpu.s3.bits := bpu_s3_resp.ftq_idx
681adc0b8dfSGuokai Chen  when (bpu_s3_redirect) {
682cb4f77ceSLingrui98    bpuPtr := bpu_s3_resp.ftq_idx + 1.U
683dc270d3bSJenius    copied_bpu_ptr.map(_ := bpu_s3_resp.ftq_idx + 1.U)
684cb4f77ceSLingrui98    // only when ifuPtr runs ahead of bpu s3 resp should we recover it
685cb4f77ceSLingrui98    when (!isBefore(ifuPtr, bpu_s3_resp.ftq_idx)) {
686c5c5edaeSJenius      ifuPtr_write := bpu_s3_resp.ftq_idx
687c5c5edaeSJenius      ifuPtrPlus1_write := bpu_s3_resp.ftq_idx + 1.U
6886bf9b30dSLingrui98      ifuPtrPlus2_write := bpu_s3_resp.ftq_idx + 2.U
689cb4f77ceSLingrui98    }
690cb4f77ceSLingrui98  }
691cb4f77ceSLingrui98
  // Simulation-time ordering checks between the pointers; each is waived when isFull(...) holds
  // for the same pair.
69209c6f1ddSLingrui98  XSError(isBefore(bpuPtr, ifuPtr) && !isFull(bpuPtr, ifuPtr), "\nifuPtr is before bpuPtr!\n")
6932448f137SGuokai Chen  XSError(isBefore(ifuWbPtr, commPtr) && !isFull(ifuWbPtr, commPtr), "\ncommPtr is before ifuWbPtr!\n")
69409c6f1ddSLingrui98
  // Every duplicated bpuPtr register must stay equal to the primary one.
695dc270d3bSJenius  (0 until copyNum).map{i =>
696dc270d3bSJenius    XSError(copied_bpu_ptr(i) =/= bpuPtr, "\ncopiedBpuPtr is different from bpuPtr!\n")
697dc270d3bSJenius  }
698dc270d3bSJenius
69909c6f1ddSLingrui98  // ****************************************************************
70009c6f1ddSLingrui98  // **************************** to ifu ****************************
70109c6f1ddSLingrui98  // ****************************************************************
702f22cf846SJenius  // 0  for ifu, and 1-4 for ICache
  // Bypass registers: capture the PC-memory write data whenever a BPU write happens, so an
  // entry written last cycle can be served without waiting for the memory read.
703935edac4STang Haojin  val bpu_in_bypass_buf = RegEnable(ftq_pc_mem.io.wdata, bpu_in_fire)
704935edac4STang Haojin  val copied_bpu_in_bypass_buf = VecInit(Seq.fill(copyNum)(RegEnable(ftq_pc_mem.io.wdata, bpu_in_fire)))
705f56177cbSJenius  val bpu_in_bypass_buf_for_ifu = bpu_in_bypass_buf
70609c6f1ddSLingrui98  val bpu_in_bypass_ptr = RegNext(bpu_in_resp_ptr)
70709c6f1ddSLingrui98  val last_cycle_to_ifu_fire = RegNext(io.toIfu.req.fire)
70809c6f1ddSLingrui98
  // copyNum duplicates of the bypass pointer and of the "IFU request fired last cycle" flag.
709f56177cbSJenius  val copied_bpu_in_bypass_ptr = VecInit(Seq.fill(copyNum)(RegNext(bpu_in_resp_ptr)))
710f56177cbSJenius  val copied_last_cycle_to_ifu_fire = VecInit(Seq.fill(copyNum)(RegNext(io.toIfu.req.fire)))
71188bc4f90SLingrui98
71209c6f1ddSLingrui98  // read pc and target
  // The PC memory is addressed with the next-value (`*_write`) pointers.
7136bf9b30dSLingrui98  ftq_pc_mem.io.ifuPtr_w       := ifuPtr_write
7146bf9b30dSLingrui98  ftq_pc_mem.io.ifuPtrPlus1_w  := ifuPtrPlus1_write
7156bf9b30dSLingrui98  ftq_pc_mem.io.ifuPtrPlus2_w  := ifuPtrPlus2_write
7166bf9b30dSLingrui98  ftq_pc_mem.io.commPtr_w      := commPtr_write
7176bf9b30dSLingrui98  ftq_pc_mem.io.commPtrPlus1_w := commPtrPlus1_write
718c5c5edaeSJenius
71909c6f1ddSLingrui98
7205ff19bd8SLingrui98  io.toIfu.req.bits.ftqIdx := ifuPtr
721f63797a4SLingrui98
  // Values selected for the ICache copies and for the IFU request. entry_is_to_send,
  // entry_ftq_offset and diff_entry_next_addr default to the stored state of the entry at
  // ifuPtr and may be overridden by the bypass logic below.
722f56177cbSJenius  val toICachePcBundle = Wire(Vec(copyNum,new Ftq_RF_Components))
723dc270d3bSJenius  val toICacheEntryToSend = Wire(Vec(copyNum,Bool()))
724b37e4b45SLingrui98  val toIfuPcBundle = Wire(new Ftq_RF_Components)
725f63797a4SLingrui98  val entry_is_to_send = WireInit(entry_fetch_status(ifuPtr.value) === f_to_send)
726f63797a4SLingrui98  val entry_ftq_offset = WireInit(cfiIndex_vec(ifuPtr.value))
7276bf9b30dSLingrui98  val entry_next_addr  = Wire(UInt(VAddrBits.W))
728b004fa13SJenius
  // Registered copies of the PC-memory read data for ifuPtr and ifuPtr + 1.
729f56177cbSJenius  val pc_mem_ifu_ptr_rdata   = VecInit(Seq.fill(copyNum)(RegNext(ftq_pc_mem.io.ifuPtr_rdata)))
730f56177cbSJenius  val pc_mem_ifu_plus1_rdata = VecInit(Seq.fill(copyNum)(RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata)))
731b0ed7239SLingrui98  val diff_entry_next_addr = WireInit(update_target(ifuPtr.value)) //TODO: remove this
732f63797a4SLingrui98
  // Registered "to send" flags for the entries at ifuPtr + 1 and ifuPtr: either the stored
  // status was f_to_send, or the entry was written by the BPU in the preceding cycle.
733dc270d3bSJenius  val copied_ifu_plus1_to_send = VecInit(Seq.fill(copyNum)(RegNext(entry_fetch_status(ifuPtrPlus1.value) === f_to_send) || RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1))))
734dc270d3bSJenius  val copied_ifu_ptr_to_send   = VecInit(Seq.fill(copyNum)(RegNext(entry_fetch_status(ifuPtr.value) === f_to_send) || RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr)))
735dc270d3bSJenius
  // Per-copy selection for the ICache, in priority order:
  //   1. the entry at ifuPtr was written last cycle -> use the bypass register;
  //   2. an IFU request fired last cycle            -> use the registered ifuPtr + 1 read data;
  //   3. otherwise                                  -> use the registered ifuPtr read data.
736f56177cbSJenius  for(i <- 0 until copyNum){
737f56177cbSJenius    when(copied_last_cycle_bpu_in(i) && copied_bpu_in_bypass_ptr(i) === copied_ifu_ptr(i)){
738f56177cbSJenius      toICachePcBundle(i) := copied_bpu_in_bypass_buf(i)
739dc270d3bSJenius      toICacheEntryToSend(i)   := true.B
740f56177cbSJenius    }.elsewhen(copied_last_cycle_to_ifu_fire(i)){
741f56177cbSJenius      toICachePcBundle(i) := pc_mem_ifu_plus1_rdata(i)
742dc270d3bSJenius      toICacheEntryToSend(i)   := copied_ifu_plus1_to_send(i)
743f56177cbSJenius    }.otherwise{
744f56177cbSJenius      toICachePcBundle(i) := pc_mem_ifu_ptr_rdata(i)
745dc270d3bSJenius      toICacheEntryToSend(i)   := copied_ifu_ptr_to_send(i)
746f56177cbSJenius    }
747f56177cbSJenius  }
748f56177cbSJenius
749873dc383SLingrui98  // TODO: reconsider target address bypass logic
  // Selection of the IFU request contents, mirroring the three-way priority used for the
  // ICache copies: bypass register, then ifuPtr + 1 read data (after a fire), then ifuPtr read
  // data. In the last two cases the next start address comes from the bypass register when the
  // entry at ifuPtrPlus1 was written last cycle, else from newest_entry_target when ifuPtr is
  // the newest entry, else from the registered PC-memory read data of the following entry.
75009c6f1ddSLingrui98  when (last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr) {
75188bc4f90SLingrui98    toIfuPcBundle := bpu_in_bypass_buf_for_ifu
752f678dd91SSteve Gou    entry_is_to_send := true.B
7536bf9b30dSLingrui98    entry_next_addr := last_cycle_bpu_target
754f63797a4SLingrui98    entry_ftq_offset := last_cycle_cfiIndex
755b0ed7239SLingrui98    diff_entry_next_addr := last_cycle_bpu_target // TODO: remove this
75609c6f1ddSLingrui98  }.elsewhen (last_cycle_to_ifu_fire) {
757c5c5edaeSJenius    toIfuPcBundle := RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata)
758c5c5edaeSJenius    entry_is_to_send := RegNext(entry_fetch_status(ifuPtrPlus1.value) === f_to_send) ||
759c5c5edaeSJenius                        RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1)) // reduce potential bubbles
760ed434d67SLingrui98    entry_next_addr := Mux(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1),
76188bc4f90SLingrui98                          bpu_in_bypass_buf_for_ifu.startAddr,
762fef810c0SLingrui98                          Mux(ifuPtr === newest_entry_ptr,
7636bf9b30dSLingrui98                            newest_entry_target,
764f83ef67eSLingrui98                            RegNext(ftq_pc_mem.io.ifuPtrPlus2_rdata.startAddr))) // ifuPtr+2
765c5c5edaeSJenius  }.otherwise {
766c5c5edaeSJenius    toIfuPcBundle := RegNext(ftq_pc_mem.io.ifuPtr_rdata)
76728f2cf58SLingrui98    entry_is_to_send := RegNext(entry_fetch_status(ifuPtr.value) === f_to_send) ||
76828f2cf58SLingrui98                        RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr) // reduce potential bubbles
7696bf9b30dSLingrui98    entry_next_addr := Mux(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1),
77088bc4f90SLingrui98                          bpu_in_bypass_buf_for_ifu.startAddr,
771fef810c0SLingrui98                          Mux(ifuPtr === newest_entry_ptr,
7726bf9b30dSLingrui98                            newest_entry_target,
773f83ef67eSLingrui98                            RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata.startAddr))) // ifuPtr+1
77409c6f1ddSLingrui98  }
77509c6f1ddSLingrui98
  // A request is offered only for an entry that is marked to-send and while ifuPtr has not
  // caught up with bpuPtr.
776f678dd91SSteve Gou  io.toIfu.req.valid := entry_is_to_send && ifuPtr =/= bpuPtr
777f63797a4SLingrui98  io.toIfu.req.bits.nextStartAddr := entry_next_addr
778f63797a4SLingrui98  io.toIfu.req.bits.ftqOffset := entry_ftq_offset
779b37e4b45SLingrui98  io.toIfu.req.bits.fromFtqPcBundle(toIfuPcBundle)
780c5c5edaeSJenius
  // The ICache request uses the same valid; each readValid copy is computed from its own
  // duplicated pointers and to-send flag.
781c5c5edaeSJenius  io.toICache.req.valid := entry_is_to_send && ifuPtr =/= bpuPtr
782dc270d3bSJenius  io.toICache.req.bits.readValid.zipWithIndex.map{case(copy, i) => copy := toICacheEntryToSend(i) && copied_ifu_ptr(i) =/= copied_bpu_ptr(i)}
783b004fa13SJenius  io.toICache.req.bits.pcMemRead.zipWithIndex.map{case(copy,i) => copy.fromFtqPcBundle(toICachePcBundle(i))}
784b004fa13SJenius  // io.toICache.req.bits.bypassSelect := last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr
785b004fa13SJenius  // io.toICache.req.bits.bpuBypassWrite.zipWithIndex.map{case(bypassWrtie, i) =>
786b004fa13SJenius  //   bypassWrtie.startAddr := bpu_in_bypass_buf.tail(i).startAddr
787b004fa13SJenius  //   bypassWrtie.nextlineStart := bpu_in_bypass_buf.tail(i).nextLineAddr
788b004fa13SJenius  // }
789f22cf846SJenius
790b0ed7239SLingrui98  // TODO: remove this
  // Cross-check: the selected next address must equal the per-entry update_target value
  // (or its bypassed counterpart) whenever a request is valid.
791b0ed7239SLingrui98  XSError(io.toIfu.req.valid && diff_entry_next_addr =/= entry_next_addr,
7925a674179SLingrui98          p"\nifu_req_target wrong! ifuPtr: ${ifuPtr}, entry_next_addr: ${Hexadecimal(entry_next_addr)} diff_entry_next_addr: ${Hexadecimal(diff_entry_next_addr)}\n")
793b0ed7239SLingrui98
79409c6f1ddSLingrui98  // when fall through is smaller in value than start address, there must be a false hit
  // The entry is downgraded to h_false_hit only when the request actually fires and is not
  // being redirected by BPU s2/s3 for this same entry in the same cycle.
795b37e4b45SLingrui98  when (toIfuPcBundle.fallThruError && entry_hit_status(ifuPtr.value) === h_hit) {
79609c6f1ddSLingrui98    when (io.toIfu.req.fire &&
797cb4f77ceSLingrui98      !(bpu_s2_redirect && bpu_s2_resp.ftq_idx === ifuPtr) &&
798cb4f77ceSLingrui98      !(bpu_s3_redirect && bpu_s3_resp.ftq_idx === ifuPtr)
79909c6f1ddSLingrui98    ) {
80009c6f1ddSLingrui98      entry_hit_status(ifuPtr.value) := h_false_hit
801352db50aSLingrui98      // XSError(true.B, "FTB false hit by fallThroughError, startAddr: %x, fallTHru: %x\n", io.toIfu.req.bits.startAddr, io.toIfu.req.bits.nextStartAddr)
80209c6f1ddSLingrui98    }
803b37e4b45SLingrui98    XSDebug(true.B, "fallThruError! start:%x, fallThru:%x\n", io.toIfu.req.bits.startAddr, io.toIfu.req.bits.nextStartAddr)
80409c6f1ddSLingrui98  }
80509c6f1ddSLingrui98
  // Performance counter using the same condition as the h_false_hit update above.
806a60a2901SLingrui98  XSPerfAccumulate(f"fall_through_error_to_ifu", toIfuPcBundle.fallThruError && entry_hit_status(ifuPtr.value) === h_hit &&
807a60a2901SLingrui98    io.toIfu.req.fire && !(bpu_s2_redirect && bpu_s2_resp.ftq_idx === ifuPtr) && !(bpu_s3_redirect && bpu_s3_resp.ftq_idx === ifuPtr))
808a60a2901SLingrui98
  // The request being sent is considered flushed when either BPU stage's flush covers its index.
80909c6f1ddSLingrui98  val ifu_req_should_be_flushed =
810cb4f77ceSLingrui98    io.toIfu.flushFromBpu.shouldFlushByStage2(io.toIfu.req.bits.ftqIdx) ||
811cb4f77ceSLingrui98    io.toIfu.flushFromBpu.shouldFlushByStage3(io.toIfu.req.bits.ftqIdx)
81209c6f1ddSLingrui98
  // An entry is marked as sent only if its request fired and was not flushed in the same cycle.
81309c6f1ddSLingrui98    when (io.toIfu.req.fire && !ifu_req_should_be_flushed) {
81409c6f1ddSLingrui98      entry_fetch_status(ifuPtr.value) := f_sent
81509c6f1ddSLingrui98    }
81609c6f1ddSLingrui98
81709c6f1ddSLingrui98  // *********************************************************************
81809c6f1ddSLingrui98  // **************************** wb from ifu ****************************
81909c6f1ddSLingrui98  // *********************************************************************
  // Predecode writeback from the IFU: pdWb carries the predecode info of one FTQ entry.
82009c6f1ddSLingrui98  val pdWb = io.fromIfu.pdWb
82109c6f1ddSLingrui98  val pds = pdWb.bits.pd
82209c6f1ddSLingrui98  val ifu_wb_valid = pdWb.valid
82309c6f1ddSLingrui98  val ifu_wb_idx = pdWb.bits.ftqIdx.value
82409c6f1ddSLingrui98  // read ports:                                                         commit update
  // Predecode memory (one read port, one write port), written on every valid writeback.
82509c6f1ddSLingrui98  val ftq_pd_mem = Module(new SyncDataModuleTemplate(new Ftq_pd_Entry, FtqSize, 1, 1))
82609c6f1ddSLingrui98  ftq_pd_mem.io.wen(0) := ifu_wb_valid
82709c6f1ddSLingrui98  ftq_pd_mem.io.waddr(0) := pdWb.bits.ftqIdx.value
82809c6f1ddSLingrui98  ftq_pd_mem.io.wdata(0).fromPdWb(pdWb.bits)
82909c6f1ddSLingrui98
  // Writeback for an entry currently marked as an FTB hit, and whether predecode reported a
  // mispredicted offset for it. The *_reg values hold the last valid writeback's data for use
  // in the following cycle.
83009c6f1ddSLingrui98  val hit_pd_valid = entry_hit_status(ifu_wb_idx) === h_hit && ifu_wb_valid
83109c6f1ddSLingrui98  val hit_pd_mispred = hit_pd_valid && pdWb.bits.misOffset.valid
83209c6f1ddSLingrui98  val hit_pd_mispred_reg = RegNext(hit_pd_mispred, init=false.B)
833005e809bSJiuyang Liu  val pd_reg       = RegEnable(pds,             pdWb.valid)
834005e809bSJiuyang Liu  val start_pc_reg = RegEnable(pdWb.bits.pc(0), pdWb.valid)
835005e809bSJiuyang Liu  val wb_idx_reg   = RegEnable(ifu_wb_idx,      pdWb.valid)
83609c6f1ddSLingrui98
  // Mark every instruction slot that predecode reports as valid and inside the instruction
  // range as c_valid; other slots keep their state.
83709c6f1ddSLingrui98  when (ifu_wb_valid) {
83809c6f1ddSLingrui98    val comm_stq_wen = VecInit(pds.map(_.valid).zip(pdWb.bits.instrRange).map{
83909c6f1ddSLingrui98      case (v, inRange) => v && inRange
84009c6f1ddSLingrui98    })
84109c6f1ddSLingrui98    (commitStateQueue(ifu_wb_idx) zip comm_stq_wen).map{
84209c6f1ddSLingrui98      case (qe, v) => when (v) { qe := c_valid }
84309c6f1ddSLingrui98    }
84409c6f1ddSLingrui98  }
84509c6f1ddSLingrui98
  // Each valid writeback advances the IFU writeback pointer by one.
846c5c5edaeSJenius  when (ifu_wb_valid) {
847c5c5edaeSJenius    ifuWbPtr_write := ifuWbPtr + 1.U
848c5c5edaeSJenius  }
84909c6f1ddSLingrui98
  // A writeback must never refer to an entry beyond the one currently being requested.
850f21bbcb2SGuokai Chen  XSError(ifu_wb_valid && isAfter(pdWb.bits.ftqIdx, ifuPtr), "IFU returned a predecode before its req, check IFU")
851f21bbcb2SGuokai Chen
// False-hit check: one cycle after a predecode writeback for an entry marked h_hit, compare the
// FTB entry the BPU predicted with (read from ftb_entry_mem port 0) against the registered
// predecode result. Any disagreement downgrades the entry to h_false_hit.
// Note: read port 0 of ftb_entry_mem is also assigned in the "redirect from ifu" section with
// pdWb.bits.ftqIdx.value, i.e. the same index as ifu_wb_idx.
85209c6f1ddSLingrui98  ftb_entry_mem.io.raddr.head := ifu_wb_idx
85309c6f1ddSLingrui98  val has_false_hit = WireInit(false.B)
85409c6f1ddSLingrui98  when (RegNext(hit_pd_valid)) {
85509c6f1ddSLingrui98    // check for false hit
85609c6f1ddSLingrui98    val pred_ftb_entry = ftb_entry_mem.io.rdata.head
857eeb5ff92SLingrui98    val brSlots = pred_ftb_entry.brSlots
858eeb5ff92SLingrui98    val tailSlot = pred_ftb_entry.tailSlot
85909c6f1ddSLingrui98    // we check cfis that bpu predicted
86009c6f1ddSLingrui98
861eeb5ff92SLingrui98    // bpu predicted branches but denied by predecode
    // (covers every valid branch slot, plus the tail slot when it is shared as a branch slot)
862eeb5ff92SLingrui98    val br_false_hit =
863eeb5ff92SLingrui98      brSlots.map{
864eeb5ff92SLingrui98        s => s.valid && !(pd_reg(s.offset).valid && pd_reg(s.offset).isBr)
865eeb5ff92SLingrui98      }.reduce(_||_) ||
866b37e4b45SLingrui98      (tailSlot.valid && pred_ftb_entry.tailSlot.sharing &&
867eeb5ff92SLingrui98        !(pd_reg(tailSlot.offset).valid && pd_reg(tailSlot.offset).isBr))
868eeb5ff92SLingrui98
    // A predicted jump whose kind (jal / jalr / call / ret) is not confirmed by the predecode
    // info at the tail slot's offset.
869eeb5ff92SLingrui98    val jmpOffset = tailSlot.offset
87009c6f1ddSLingrui98    val jmp_pd = pd_reg(jmpOffset)
87109c6f1ddSLingrui98    val jal_false_hit = pred_ftb_entry.jmpValid &&
87209c6f1ddSLingrui98      ((pred_ftb_entry.isJal  && !(jmp_pd.valid && jmp_pd.isJal)) ||
87309c6f1ddSLingrui98       (pred_ftb_entry.isJalr && !(jmp_pd.valid && jmp_pd.isJalr)) ||
87409c6f1ddSLingrui98       (pred_ftb_entry.isCall && !(jmp_pd.valid && jmp_pd.isCall)) ||
87509c6f1ddSLingrui98       (pred_ftb_entry.isRet  && !(jmp_pd.valid && jmp_pd.isRet))
87609c6f1ddSLingrui98      )
87709c6f1ddSLingrui98
87809c6f1ddSLingrui98    has_false_hit := br_false_hit || jal_false_hit || hit_pd_mispred_reg
    // Report the start pc of the entry being checked. This check runs one cycle after the
    // writeback, so the registered pc (start_pc_reg) is used; the live pdWb.bits.pc(0) would
    // belong to whatever is on the writeback port in the current cycle.
    XSDebug(has_false_hit, "FTB false hit by br or jal or hit_pd, startAddr: %x\n", start_pc_reg)
88065fddcf0Szoujr
881352db50aSLingrui98    // assert(!has_false_hit)
88209c6f1ddSLingrui98  }
88309c6f1ddSLingrui98
  // wb_idx_reg is the index of the writeback that triggered the check above.
88409c6f1ddSLingrui98  when (has_false_hit) {
88509c6f1ddSLingrui98    entry_hit_status(wb_idx_reg) := h_false_hit
88609c6f1ddSLingrui98  }
88709c6f1ddSLingrui98
88809c6f1ddSLingrui98
88909c6f1ddSLingrui98  // **********************************************************************
890b56f947eSYinan Xu  // ***************************** to backend *****************************
89109c6f1ddSLingrui98  // **********************************************************************
892b56f947eSYinan Xu  // to backend pc mem / target
  // The backend's PC memory write is the BPU write event delayed by one more register stage:
  // enable, index and data (taken from the bypass register) are all passed through RegNext.
893b56f947eSYinan Xu  io.toBackend.pc_mem_wen   := RegNext(last_cycle_bpu_in)
894b56f947eSYinan Xu  io.toBackend.pc_mem_waddr := RegNext(last_cycle_bpu_in_idx)
89588bc4f90SLingrui98  io.toBackend.pc_mem_wdata := RegNext(bpu_in_bypass_buf_for_ifu)
89609c6f1ddSLingrui98
89709c6f1ddSLingrui98  // *******************************************************************************
89809c6f1ddSLingrui98  // **************************** redirect from backend ****************************
89909c6f1ddSLingrui98  // *******************************************************************************
90009c6f1ddSLingrui98
90109c6f1ddSLingrui98  // redirect read cfiInfo, couples to redirectGen s2
  // Read ports 1 .. BackendRedirectNum of the redirect SRAM and the FTB entry memory are
  // addressed by the backend's ftqIdxAhead vector (port 0 is used by the IFU-redirect path).
9029342624fSGao-Zeyu  val ftq_redirect_rdata = Wire(Vec(BackendRedirectNum, new Ftq_Redirect_SRAMEntry))
9039342624fSGao-Zeyu  val ftb_redirect_rdata = Wire(Vec(BackendRedirectNum, new FTBEntry))
9049342624fSGao-Zeyu  for (i <- 0 until BackendRedirectNum) {
9059342624fSGao-Zeyu    ftq_redirect_sram.io.ren(i + 1) := io.fromBackend.ftqIdxAhead(i).valid
9069342624fSGao-Zeyu    ftq_redirect_sram.io.raddr(i + 1) := io.fromBackend.ftqIdxAhead(i).bits.value
9079342624fSGao-Zeyu    ftb_entry_mem.io.raddr(i + 1)     := io.fromBackend.ftqIdxAhead(i).bits.value
90809c6f1ddSLingrui98
9099342624fSGao-Zeyu    ftq_redirect_rdata(i) := ftq_redirect_sram.io.rdata(i + 1)
9109342624fSGao-Zeyu    ftb_redirect_rdata(i) := ftb_entry_mem.io.rdata(i + 1)
9119342624fSGao-Zeyu  }
  // The one-hot ftqIdxSelOH picks which of the read results belongs to the actual redirect.
9129342624fSGao-Zeyu  val stage3CfiInfo = Mux1H(io.fromBackend.ftqIdxSelOH.bits, ftq_redirect_rdata)
  // Local copy of backendRedirect whose cfiUpdate fields are filled in from the stored info.
9139342624fSGao-Zeyu  val fromBackendRedirect = WireInit(backendRedirect)
91409c6f1ddSLingrui98  val backendRedirectCfi = fromBackendRedirect.bits.cfiUpdate
91509c6f1ddSLingrui98  backendRedirectCfi.fromFtqRedirectSram(stage3CfiInfo)
91609c6f1ddSLingrui98
917d2b20d1aSTang Haojin
9189342624fSGao-Zeyu  val r_ftb_entry = Mux1H(io.fromBackend.ftqIdxSelOH.bits, ftb_redirect_rdata)
91909c6f1ddSLingrui98  val r_ftqOffset = fromBackendRedirect.bits.ftqOffset
92009c6f1ddSLingrui98
  // br_hit: the redirecting offset is a branch saved in the FTB entry.
  // jr_hit: the FTB entry holds a jalr at exactly the redirecting offset.
921d2b20d1aSTang Haojin  backendRedirectCfi.br_hit := r_ftb_entry.brIsSaved(r_ftqOffset)
922d2b20d1aSTang Haojin  backendRedirectCfi.jr_hit := r_ftb_entry.isJalr && r_ftb_entry.tailSlot.offset === r_ftqOffset
9233711cf36S小造xu_zh  // FIXME: not portable
  // sc_disagree(0) is used when the offset matches brSlots(0), otherwise sc_disagree(1); the
  // literal indices hard-code a two-entry layout.
924d2b20d1aSTang Haojin  backendRedirectCfi.sc_hit := backendRedirectCfi.br_hit && Mux(r_ftb_entry.brSlots(0).offset === r_ftqOffset,
9253711cf36S小造xu_zh    stage3CfiInfo.sc_disagree(0), stage3CfiInfo.sc_disagree(1))
926d2b20d1aSTang Haojin
  // History shift amount and addIntoHist flag. For an FTB-hit entry they are derived from the
  // FTB entry's branch mask up to the offset, plus one when the redirecting instruction is a
  // branch that is not saved but could be inserted; otherwise they come from the redirecting
  // instruction alone.
92709c6f1ddSLingrui98  when (entry_hit_status(fromBackendRedirect.bits.ftqIdx.value) === h_hit) {
92809c6f1ddSLingrui98    backendRedirectCfi.shift := PopCount(r_ftb_entry.getBrMaskByOffset(r_ftqOffset)) +&
92909c6f1ddSLingrui98      (backendRedirectCfi.pd.isBr && !r_ftb_entry.brIsSaved(r_ftqOffset) &&
930eeb5ff92SLingrui98      !r_ftb_entry.newBrCanNotInsert(r_ftqOffset))
93109c6f1ddSLingrui98
93209c6f1ddSLingrui98    backendRedirectCfi.addIntoHist := backendRedirectCfi.pd.isBr && (r_ftb_entry.brIsSaved(r_ftqOffset) ||
933eeb5ff92SLingrui98        !r_ftb_entry.newBrCanNotInsert(r_ftqOffset))
93409c6f1ddSLingrui98  }.otherwise {
93509c6f1ddSLingrui98    backendRedirectCfi.shift := (backendRedirectCfi.pd.isBr && backendRedirectCfi.taken).asUInt
93609c6f1ddSLingrui98    backendRedirectCfi.addIntoHist := backendRedirectCfi.pd.isBr.asUInt
93709c6f1ddSLingrui98  }
93809c6f1ddSLingrui98
93909c6f1ddSLingrui98
94009c6f1ddSLingrui98  // ***************************************************************************
94109c6f1ddSLingrui98  // **************************** redirect from ifu ****************************
94209c6f1ddSLingrui98  // ***************************************************************************
  // An IFU redirect is raised by a predecode writeback that reports a mispredicted offset,
  // unless a backend flush is in progress. All fields default to zero and are then filled in.
943d2b20d1aSTang Haojin  val fromIfuRedirect = WireInit(0.U.asTypeOf(Valid(new BranchPredictionRedirect)))
94409c6f1ddSLingrui98  fromIfuRedirect.valid := pdWb.valid && pdWb.bits.misOffset.valid && !backendFlush
94509c6f1ddSLingrui98  fromIfuRedirect.bits.ftqIdx := pdWb.bits.ftqIdx
94609c6f1ddSLingrui98  fromIfuRedirect.bits.ftqOffset := pdWb.bits.misOffset.bits
94709c6f1ddSLingrui98  fromIfuRedirect.bits.level := RedirectLevel.flushAfter
948d2b20d1aSTang Haojin  fromIfuRedirect.bits.BTBMissBubble := true.B
949d2b20d1aSTang Haojin  fromIfuRedirect.bits.debugIsMemVio := false.B
950d2b20d1aSTang Haojin  fromIfuRedirect.bits.debugIsCtrl := false.B
95109c6f1ddSLingrui98
  // cfiUpdate fields taken from the writeback: pc / predecode info at the mispredicted offset,
  // the previously predicted taken bit (from cfiIndex_vec), and predecode's target and taken.
95209c6f1ddSLingrui98  val ifuRedirectCfiUpdate = fromIfuRedirect.bits.cfiUpdate
95309c6f1ddSLingrui98  ifuRedirectCfiUpdate.pc := pdWb.bits.pc(pdWb.bits.misOffset.bits)
95409c6f1ddSLingrui98  ifuRedirectCfiUpdate.pd := pdWb.bits.pd(pdWb.bits.misOffset.bits)
95509c6f1ddSLingrui98  ifuRedirectCfiUpdate.predTaken := cfiIndex_vec(pdWb.bits.ftqIdx.value).valid
95609c6f1ddSLingrui98  ifuRedirectCfiUpdate.target := pdWb.bits.target
95709c6f1ddSLingrui98  ifuRedirectCfiUpdate.taken := pdWb.bits.cfiOffset.valid
95809c6f1ddSLingrui98  ifuRedirectCfiUpdate.isMisPred := pdWb.bits.misOffset.valid
95909c6f1ddSLingrui98
  // The redirect is registered for one cycle before going to the BPU; ifuFlush is asserted in
  // both the detection cycle and the registered cycle.
960d2b20d1aSTang Haojin  val ifuRedirectReg = RegNext(fromIfuRedirect, init=0.U.asTypeOf(Valid(new BranchPredictionRedirect)))
96109c6f1ddSLingrui98  val ifuRedirectToBpu = WireInit(ifuRedirectReg)
96209c6f1ddSLingrui98  ifuFlush := fromIfuRedirect.valid || ifuRedirectToBpu.valid
96309c6f1ddSLingrui98
  // Read port 0 of the redirect SRAM and of the FTB entry memory is addressed in the detection
  // cycle; the redirect SRAM's read data is consumed below together with the registered redirect.
96409c6f1ddSLingrui98  ftq_redirect_sram.io.ren.head := fromIfuRedirect.valid
96509c6f1ddSLingrui98  ftq_redirect_sram.io.raddr.head := fromIfuRedirect.bits.ftqIdx.value
96609c6f1ddSLingrui98
96709c6f1ddSLingrui98  ftb_entry_mem.io.raddr.head := fromIfuRedirect.bits.ftqIdx.value
96809c6f1ddSLingrui98
96909c6f1ddSLingrui98  val toBpuCfi = ifuRedirectToBpu.bits.cfiUpdate
97009c6f1ddSLingrui98  toBpuCfi.fromFtqRedirectSram(ftq_redirect_sram.io.rdata.head)
  // For a valid return instruction the target sent to the BPU is replaced by topAddr.
971f1267a13SEaston Man  when (ifuRedirectReg.bits.cfiUpdate.pd.isRet && ifuRedirectReg.bits.cfiUpdate.pd.valid) {
972c89b4642SGuokai Chen    toBpuCfi.target := toBpuCfi.topAddr
97309c6f1ddSLingrui98  }
97409c6f1ddSLingrui98
  // Track which entries were redirected by the IFU.
  // NOTE(review): the clearing branch indexes with last_cycle_bpu_in_ptr (the entry last written
  // by the BPU) rather than the index of the writeback that just completed — confirm this is
  // intended.
975d2b20d1aSTang Haojin  when (ifuRedirectReg.valid) {
976d2b20d1aSTang Haojin    ifuRedirected(ifuRedirectReg.bits.ftqIdx.value) := true.B
977d2b20d1aSTang Haojin  } .elsewhen(RegNext(pdWb.valid)) {
978d2b20d1aSTang Haojin    // if pdWb and no redirect, set to false
979d2b20d1aSTang Haojin    ifuRedirected(last_cycle_bpu_in_ptr.value) := false.B
980d2b20d1aSTang Haojin  }
981d2b20d1aSTang Haojin
98209c6f1ddSLingrui98  // *********************************************************************
98309c6f1ddSLingrui98  // **************************** wb from exu ****************************
98409c6f1ddSLingrui98  // *********************************************************************
98509c6f1ddSLingrui98
  // backendRedirect mirrors the redirect coming from the backend, with BTBMissBubble forced
  // to false.
986d2b20d1aSTang Haojin  backendRedirect.valid := io.fromBackend.redirect.valid
987d2b20d1aSTang Haojin  backendRedirect.bits.connectRedirect(io.fromBackend.redirect.bits)
988d2b20d1aSTang Haojin  backendRedirect.bits.BTBMissBubble := false.B
989d2b20d1aSTang Haojin
9902e1be6e1SSteve Gou
/** Projects a redirect onto the fields needed to update the FTQ.
  *
  * @param wb redirect to unpack
  * @return tuple of (valid, FTQ pointer, offset inside the entry, taken, mispredicted)
  */
def extractRedirectInfo(wb: Valid[Redirect]) =
  (wb.valid, wb.bits.ftqIdx, wb.bits.ftqOffset, wb.bits.cfiUpdate.taken, wb.bits.cfiUpdate.isMisPred)
99809c6f1ddSLingrui98
99909c6f1ddSLingrui98  // fix mispredict entry
  // Registered flag (reset to false): the previous cycle had a valid backend redirect whose
  // level was flushAfter.
100009c6f1ddSLingrui98  val lastIsMispredict = RegNext(
1001df5b4b8eSYinan Xu    backendRedirect.valid && backendRedirect.bits.level === RedirectLevel.flushAfter, init = false.B
100209c6f1ddSLingrui98  )
100309c6f1ddSLingrui98
/** Applies a redirect to the per-entry CFI bookkeeping of the FTQ entry it names.
  *
  * Effects, all keyed by the redirect's ftqIdx:
  *  - cfiIndex_vec: the recorded offset moves to the redirect offset when the redirect is taken and lies
  *    before the recorded one; the valid bit follows `taken` when the offsets match, and is cleared by a
  *    not-taken redirect at any other offset.
  *  - newest_entry_target / newest_entry_ptr / update_target: overwritten with the redirect target / ptr.
  *  - mispredict_vec: written only for backend redirects.
  *
  * Note that the pointer/target writes are not gated by the redirect's valid bit inside this method;
  * the caller is expected to invoke it under a `when`.
  *
  * @param redirect  redirect to apply
  * @param isBackend elaboration-time switch; when true the mispredict bit of the slot is also recorded
  */
def updateCfiInfo(redirect: Valid[Redirect], isBackend: Boolean = true) = {
  val (fire, ptr, offset, taken, mispredicted) = extractRedirectInfo(redirect)
  val entryIdx = ptr.value
  // offset currently recorded for this entry (read side only)
  val recordedOffset = cfiIndex_vec(entryIdx).bits
  val movesEarlier = fire && taken && offset < recordedOffset
  val hitsRecorded = fire && offset === recordedOffset

  when (movesEarlier || hitsRecorded) {
    cfiIndex_vec(entryIdx).valid := movesEarlier || hitsRecorded && taken
  } .elsewhen (fire && !taken && offset =/= recordedOffset) {
    cfiIndex_vec(entryIdx).valid := false.B
  }
  when (movesEarlier) {
    cfiIndex_vec(entryIdx).bits := offset
  }

  val redirectTarget = redirect.bits.cfiUpdate.target
  newest_entry_target := redirectTarget
  newest_entry_ptr := ptr
  update_target(entryIdx) := redirectTarget // TODO: remove this
  if (isBackend) {
    mispredict_vec(entryIdx)(offset) := mispredicted
  }
}
102409c6f1ddSLingrui98
  // Apply at most one redirect per cycle to the CFI bookkeeping: a backend redirect takes priority; the IFU
  // redirect is applied only when no backend redirect is valid, and without the mispredict-bit write.
10259342624fSGao-Zeyu  when(backendRedirect.valid) {
10269342624fSGao-Zeyu    updateCfiInfo(backendRedirect)
102709c6f1ddSLingrui98  }.elsewhen (ifuRedirectToBpu.valid) {
102809c6f1ddSLingrui98    updateCfiInfo(ifuRedirectToBpu, isBackend=false)
102909c6f1ddSLingrui98  }
103009c6f1ddSLingrui98
  // Top-down bubble attribution on redirect. At most one TopDownCounters reason bit is raised, and it is
  // raised both in topdown_stage and in the topdown_info of the outgoing IFU request.
  //  - valid backend redirect: a control redirect selects the first asserted flag in the order
  //    ControlBTBMiss, TAGEMiss, SCMiss, ITTAGEMiss, RASMiss (none set => no reason raised here);
  //    otherwise a memory-violation redirect, otherwise "other".
  //  - no backend redirect but a valid registered IFU redirect: counted as BTBMissBubble.
  // NOTE(review): the outer conditions test backendRedirect while the inner ones test fromBackendRedirect;
  // how the two signals relate in time is defined outside this section -- confirm they are aligned.
10319342624fSGao-Zeyu  when (backendRedirect.valid) {
10329342624fSGao-Zeyu    when (backendRedirect.bits.ControlRedirectBubble) {
1033d2b20d1aSTang Haojin      when (fromBackendRedirect.bits.ControlBTBMissBubble) {
1034d2b20d1aSTang Haojin        topdown_stage.reasons(TopDownCounters.BTBMissBubble.id) := true.B
1035d2b20d1aSTang Haojin        io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.BTBMissBubble.id) := true.B
1036d2b20d1aSTang Haojin      } .elsewhen (fromBackendRedirect.bits.TAGEMissBubble) {
1037d2b20d1aSTang Haojin        topdown_stage.reasons(TopDownCounters.TAGEMissBubble.id) := true.B
1038d2b20d1aSTang Haojin        io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.TAGEMissBubble.id) := true.B
1039d2b20d1aSTang Haojin      } .elsewhen (fromBackendRedirect.bits.SCMissBubble) {
1040d2b20d1aSTang Haojin        topdown_stage.reasons(TopDownCounters.SCMissBubble.id) := true.B
1041d2b20d1aSTang Haojin        io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.SCMissBubble.id) := true.B
1042d2b20d1aSTang Haojin      } .elsewhen (fromBackendRedirect.bits.ITTAGEMissBubble) {
1043d2b20d1aSTang Haojin        topdown_stage.reasons(TopDownCounters.ITTAGEMissBubble.id) := true.B
1044d2b20d1aSTang Haojin        io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.ITTAGEMissBubble.id) := true.B
1045d2b20d1aSTang Haojin      } .elsewhen (fromBackendRedirect.bits.RASMissBubble) {
1046d2b20d1aSTang Haojin        topdown_stage.reasons(TopDownCounters.RASMissBubble.id) := true.B
1047d2b20d1aSTang Haojin        io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.RASMissBubble.id) := true.B
1048d2b20d1aSTang Haojin      }
1049d2b20d1aSTang Haojin
1050d2b20d1aSTang Haojin
10519342624fSGao-Zeyu    } .elsewhen (backendRedirect.bits.MemVioRedirectBubble) {
1052d2b20d1aSTang Haojin      topdown_stage.reasons(TopDownCounters.MemVioRedirectBubble.id) := true.B
1053d2b20d1aSTang Haojin      io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.MemVioRedirectBubble.id) := true.B
1054d2b20d1aSTang Haojin    } .otherwise {
1055d2b20d1aSTang Haojin      topdown_stage.reasons(TopDownCounters.OtherRedirectBubble.id) := true.B
1056d2b20d1aSTang Haojin      io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.OtherRedirectBubble.id) := true.B
1057d2b20d1aSTang Haojin    }
1058d2b20d1aSTang Haojin  } .elsewhen (ifuRedirectReg.valid) {
1059d2b20d1aSTang Haojin    topdown_stage.reasons(TopDownCounters.BTBMissBubble.id) := true.B
1060d2b20d1aSTang Haojin    io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.BTBMissBubble.id) := true.B
1061d2b20d1aSTang Haojin  }
1062d2b20d1aSTang Haojin
  // The individual miss flags of fromBackendRedirect are also exported unconditionally (not gated by valid).
1063d2b20d1aSTang Haojin  io.ControlBTBMissBubble := fromBackendRedirect.bits.ControlBTBMissBubble
1064d2b20d1aSTang Haojin  io.TAGEMissBubble := fromBackendRedirect.bits.TAGEMissBubble
1065d2b20d1aSTang Haojin  io.SCMissBubble := fromBackendRedirect.bits.SCMissBubble
1066d2b20d1aSTang Haojin  io.ITTAGEMissBubble := fromBackendRedirect.bits.ITTAGEMissBubble
1067d2b20d1aSTang Haojin  io.RASMissBubble := fromBackendRedirect.bits.RASMissBubble
1068d2b20d1aSTang Haojin
106909c6f1ddSLingrui98  // ***********************************************************************************
107009c6f1ddSLingrui98  // **************************** flush ptr and state queue ****************************
107109c6f1ddSLingrui98  // ***********************************************************************************
107209c6f1ddSLingrui98
// Redirect sources in priority order for the PriorityMux below: backend first, IFU redirect last.
val redirectVec = VecInit(backendRedirect, fromIfuRedirect)

// when redirect, we should reset ptrs and status queues
// Same cycle as the redirect: every predict/fetch pointer restarts right behind the redirected entry
// (idx + 1, and idx + 2 / idx + 3 for the look-ahead copies of ifuPtr).
when(redirectVec.map(r => r.valid).reduce(_||_)){
  val r = PriorityMux(redirectVec.map(r => (r.valid -> r.bits)))
  val idx = r.ftqIdx
  val next = idx + 1.U
  bpuPtr := next
  copied_bpu_ptr.foreach(_ := next)
  ifuPtr_write := next
  ifuWbPtr_write := next
  ifuPtrPlus1_write := idx + 2.U
  ifuPtrPlus2_write := idx + 3.U
}

// One cycle after the redirect: invalidate the flushed slots of the redirected entry, using registered
// copies of the redirect fields. This is done only when the redirect came from a source other than the
// last element of redirectVec (the IFU). Slots strictly behind the redirect offset are invalidated, and
// the slot at the offset as well when the redirect level asks to flush the instruction itself.
when(RegNext(redirectVec.map(r => r.valid).reduce(_||_))){
  val r = PriorityMux(redirectVec.map(r => (r.valid -> r.bits)))
  val notIfu = redirectVec.dropRight(1).map(r => r.valid).reduce(_||_)
  val (idx, offset, flushItSelf) = (r.ftqIdx, r.ftqOffset, RedirectLevel.flushItself(r.level))
  when (RegNext(notIfu)) {
    commitStateQueue(RegNext(idx.value)).zipWithIndex.foreach({ case (s, i) =>
      when(i.U > RegNext(offset) || i.U === RegNext(offset) && RegNext(flushItSelf)){
        s := c_invalid
      }
    })
  }
}
110109c6f1ddSLingrui98
11023f88c020SGuokai Chen
110309c6f1ddSLingrui98  // only the valid bit is actually needed
  // Redirect towards the IFU: the payload is the backend redirect, but valid is driven by stage2Flush
  // (defined outside this section). The top-down port receives fromBackendRedirect unchanged.
1104df5b4b8eSYinan Xu  io.toIfu.redirect.bits    := backendRedirect.bits
110509c6f1ddSLingrui98  io.toIfu.redirect.valid   := stage2Flush
1106d2b20d1aSTang Haojin  io.toIfu.topdown_redirect := fromBackendRedirect
110709c6f1ddSLingrui98
// commit
// Every valid ROB commit marks its own slot of the FTQ entry as committed. commitType 4..7 additionally
// mark one more slot: offset + 1, offset + 2, slot 0 of the next entry, or slot 1 of the next entry.
io.fromBackend.rob_commits.foreach { commit =>
  when(commit.valid) {
    val info = commit.bits
    val entryIdx = info.ftqIdx.value
    commitStateQueue(entryIdx)(info.ftqOffset) := c_commited
    // TODO: remove this
    // For instruction fusions, we also update the next instruction
    when (info.commitType === 4.U) {
      commitStateQueue(entryIdx)(info.ftqOffset + 1.U) := c_commited
    }.elsewhen(info.commitType === 5.U) {
      commitStateQueue(entryIdx)(info.ftqOffset + 2.U) := c_commited
    }.elsewhen(info.commitType === 6.U) {
      val nextEntryIdx = (info.ftqIdx + 1.U).value
      commitStateQueue(nextEntryIdx)(0) := c_commited
    }.elsewhen(info.commitType === 7.U) {
      val nextEntryIdx = (info.ftqIdx + 1.U).value
      commitStateQueue(nextEntryIdx)(1) := c_commited
    }
  }
}
112709c6f1ddSLingrui98
112809c6f1ddSLingrui98  // ****************************************************************
112909c6f1ddSLingrui98  // **************************** to bpu ****************************
113009c6f1ddSLingrui98  // ****************************************************************
113109c6f1ddSLingrui98
  // Redirect towards the BPU: fromBackendRedirect when it is valid, otherwise the IFU redirect.
113251981c77SbugGenerator  io.toBpu.redirect := Mux(fromBackendRedirect.valid, fromBackendRedirect, ifuRedirectToBpu)
  // Redirect latency statistics: GTimer() minus the s1 prediction cycle recorded for the redirected entry,
  // plus one. pred_s1_cycle is optional; when absent an all-zero vector of FtqSize entries stands in.
1133209a4cafSSteve Gou  val dummy_s1_pred_cycle_vec = VecInit(List.tabulate(FtqSize)(_=>0.U(64.W)))
1134209a4cafSSteve Gou  val redirect_latency = GTimer() - pred_s1_cycle.getOrElse(dummy_s1_pred_cycle_vec)(io.toBpu.redirect.bits.ftqIdx.value) + 1.U
1135209a4cafSSteve Gou  XSPerfHistogram("backend_redirect_latency", redirect_latency, fromBackendRedirect.valid, 0, 60, 1)
1136209a4cafSSteve Gou  XSPerfHistogram("ifu_redirect_latency", redirect_latency, !fromBackendRedirect.valid && ifuRedirectToBpu.valid, 0, 60, 1)
113709c6f1ddSLingrui98
  // Sanity check: a valid redirect must not name an entry that lies before the commit pointer.
1138f21bbcb2SGuokai Chen  XSError(io.toBpu.redirect.valid && isBefore(io.toBpu.redirect.bits.ftqIdx, commPtr), "Ftq received a redirect after its commit, check backend or replay")
1139f21bbcb2SGuokai Chen
  // Commit gating. The entry at commPtr may commit when commPtr has not caught up with ifuWbPtr, the
  // stall counter bpu_ftb_update_stall is zero, and every slot of the entry is c_invalid or c_commited.
114002f21c16SLingrui98  val may_have_stall_from_bpu = Wire(Bool())
114102f21c16SLingrui98  val bpu_ftb_update_stall = RegInit(0.U(2.W)) // 2-cycle stall, so we need 3 states
114202f21c16SLingrui98  may_have_stall_from_bpu := bpu_ftb_update_stall =/= 0.U
114343aca6c2SGuokai Chen  canCommit := commPtr =/= ifuWbPtr && !may_have_stall_from_bpu &&
114409c6f1ddSLingrui98    Cat(commitStateQueue(commPtr.value).map(s => {
1145b5808fc2Ssfencevma      s === c_invalid || s === c_commited
1146935edac4STang Haojin    })).andR
114709c6f1ddSLingrui98
  // MMIO commit query: asserted (one cycle later, via RegNext) when commPtr is before the queried entry,
  // ifuPtr is at or after it, and every slot of the queried entry is c_invalid or c_commited.
11481d1e6d4dSJenius  val mmioReadPtr = io.mmioCommitRead.mmioFtqPtr
11491d1e6d4dSJenius  val mmioLastCommit = isBefore(commPtr, mmioReadPtr) && (isAfter(ifuPtr,mmioReadPtr)  ||  mmioReadPtr ===   ifuPtr) &&
1150935edac4STang Haojin                       Cat(commitStateQueue(mmioReadPtr.value).map(s => { s === c_invalid || s === c_commited})).andR
11511d1e6d4dSJenius  io.mmioCommitRead.mmioLastCommit := RegNext(mmioLastCommit)
11521d1e6d4dSJenius
115309c6f1ddSLingrui98  // commit reads
  // All per-entry storages are read at commPtr. The two SRAMs are only enabled when canCommit is high.
  // commit_pc_bundle is the registered commPtr read data of ftq_pc_mem.
1154c5c5edaeSJenius  val commit_pc_bundle = RegNext(ftq_pc_mem.io.commPtr_rdata)
  // Target of the committing entry: if commPtr equalled newest_entry_ptr in the previous cycle, the
  // registered newest_entry_target; otherwise the registered start address read at commPtr + 1.
115581101dc4SLingrui98  val commit_target =
115634cf890eSLingrui98    Mux(RegNext(commPtr === newest_entry_ptr),
115734cf890eSLingrui98      RegNext(newest_entry_target),
115881101dc4SLingrui98      RegNext(ftq_pc_mem.io.commPtrPlus1_rdata.startAddr))
115909c6f1ddSLingrui98  ftq_pd_mem.io.raddr.last := commPtr.value
116009c6f1ddSLingrui98  val commit_pd = ftq_pd_mem.io.rdata.last
116109c6f1ddSLingrui98  ftq_redirect_sram.io.ren.last := canCommit
116209c6f1ddSLingrui98  ftq_redirect_sram.io.raddr.last := commPtr.value
116309c6f1ddSLingrui98  val commit_spec_meta = ftq_redirect_sram.io.rdata.last
116409c6f1ddSLingrui98  ftq_meta_1r_sram.io.ren(0) := canCommit
116509c6f1ddSLingrui98  ftq_meta_1r_sram.io.raddr(0) := commPtr.value
116609c6f1ddSLingrui98  val commit_meta = ftq_meta_1r_sram.io.rdata(0)
116709c6f1ddSLingrui98  ftb_entry_mem.io.raddr.last := commPtr.value
116809c6f1ddSLingrui98  val commit_ftb_entry = ftb_entry_mem.io.rdata.last
116909c6f1ddSLingrui98
117009c6f1ddSLingrui98  // need one cycle to read mem and srams
  // Naming in this section: can_commit_* values are sampled at commPtr in the current cycle; commit_* /
  // do_commit* values are their one-cycle-delayed copies, lined up with the read data above.
117109c6f1ddSLingrui98  val do_commit_ptr = RegNext(commPtr)
11725371700eSzoujr  val do_commit = RegNext(canCommit, init=false.B)
  // Advance both commit pointers by one entry whenever an entry commits.
11736bf9b30dSLingrui98  when (canCommit) {
11746bf9b30dSLingrui98    commPtr_write := commPtrPlus1
11756bf9b30dSLingrui98    commPtrPlus1_write := commPtrPlus1 + 1.U
11766bf9b30dSLingrui98  }
117709c6f1ddSLingrui98  val commit_state = RegNext(commitStateQueue(commPtr.value))
11785371700eSzoujr  val can_commit_cfi = WireInit(cfiIndex_vec(commPtr.value))
1179d4fcfc3eSGuokai Chen  val do_commit_cfi = WireInit(cfiIndex_vec(do_commit_ptr.value))
11803f88c020SGuokai Chen  //
11813f88c020SGuokai Chen  //when (commitStateQueue(commPtr.value)(can_commit_cfi.bits) =/= c_commited) {
11823f88c020SGuokai Chen  //  can_commit_cfi.valid := false.B
11833f88c020SGuokai Chen  //}
11845371700eSzoujr  val commit_cfi = RegNext(can_commit_cfi)
  // debug_cfi: the entry at do_commit_ptr has a valid recorded CFI whose slot is not c_commited.
1185d4fcfc3eSGuokai Chen  val debug_cfi = commitStateQueue(do_commit_ptr.value)(do_commit_cfi.bits) =/= c_commited && do_commit_cfi.valid
118609c6f1ddSLingrui98
  // Per-slot mispredict bits, kept only for slots that actually committed.
1187cc2d1573SEaston Man  val commit_mispredict  : Vec[Bool] = VecInit((RegNext(mispredict_vec(commPtr.value)) zip commit_state).map {
118809c6f1ddSLingrui98    case (mis, state) => mis && state === c_commited
118909c6f1ddSLingrui98  })
1190cc2d1573SEaston Man  val commit_instCommited: Vec[Bool] = VecInit(commit_state.map(_ === c_commited)) // [PredictWidth]
11915371700eSzoujr  val can_commit_hit                 = entry_hit_status(commPtr.value)
11925371700eSzoujr  val commit_hit                     = RegNext(can_commit_hit)
11935fa3df0dSLingrui98  val diff_commit_target             = RegNext(update_target(commPtr.value)) // TODO: remove this
1194edc18578SLingrui98  val commit_stage                   = RegNext(pred_stage(commPtr.value))
119509c6f1ddSLingrui98  val commit_valid                   = commit_hit === h_hit || commit_cfi.valid // hit or taken
119609c6f1ddSLingrui98
  // Stall counter that blocks further commits (see canCommit) after committing an entry that has a valid
  // recorded CFI but whose hit status is neither h_hit nor h_false_hit. Sequence: 0 -> 2 -> 1 -> 0.
  // The encoding 3 is never entered by this FSM and is reported through XSError.
11975371700eSzoujr  val to_bpu_hit = can_commit_hit === h_hit || can_commit_hit === h_false_hit
119802f21c16SLingrui98  switch (bpu_ftb_update_stall) {
119902f21c16SLingrui98    is (0.U) {
120002f21c16SLingrui98      when (can_commit_cfi.valid && !to_bpu_hit && canCommit) {
120102f21c16SLingrui98        bpu_ftb_update_stall := 2.U // 2-cycle stall
120202f21c16SLingrui98      }
120302f21c16SLingrui98    }
120402f21c16SLingrui98    is (2.U) {
120502f21c16SLingrui98      bpu_ftb_update_stall := 1.U
120602f21c16SLingrui98    }
120702f21c16SLingrui98    is (1.U) {
120802f21c16SLingrui98      bpu_ftb_update_stall := 0.U
120902f21c16SLingrui98    }
121002f21c16SLingrui98    is (3.U) {
121102f21c16SLingrui98      XSError(true.B, "bpu_ftb_update_stall should be 0, 1 or 2")
121202f21c16SLingrui98    }
121302f21c16SLingrui98  }
121409c6f1ddSLingrui98
1215b0ed7239SLingrui98  // TODO: remove this
  // Cross-check: on a commit, the target derived from the PC memory must equal the recorded update_target.
1216b0ed7239SLingrui98  XSError(do_commit && diff_commit_target =/= commit_target, "\ncommit target should be the same as update target\n")
1217b0ed7239SLingrui98
1218b2f6ed0aSSteve Gou  // update latency stats
  // Same formula as the redirect latency: GTimer() - recorded s1 prediction cycle of the entry + 1.
1219b2f6ed0aSSteve Gou  val update_latency = GTimer() - pred_s1_cycle.getOrElse(dummy_s1_pred_cycle_vec)(do_commit_ptr.value) + 1.U
1220b2f6ed0aSSteve Gou  XSPerfHistogram("bpu_update_latency", update_latency, io.toBpu.update.valid, 0, 64, 2)
1221b2f6ed0aSSteve Gou
  // BPU update port. Everything defaults to DontCare; the assignments that follow override the default
  // for the fields that are driven. An update is sent for a committing entry that hit or has a valid CFI.
122209c6f1ddSLingrui98  io.toBpu.update := DontCare
122309c6f1ddSLingrui98  io.toBpu.update.valid := commit_valid && do_commit
122409c6f1ddSLingrui98  val update = io.toBpu.update.bits
122509c6f1ddSLingrui98  update.false_hit   := commit_hit === h_false_hit
122609c6f1ddSLingrui98  update.pc          := commit_pc_bundle.startAddr
122709c6f1ddSLingrui98  update.meta        := commit_meta.meta
1228803124a6SLingrui98  update.cfi_idx     := commit_cfi
12298ffcd86aSLingrui98  update.full_target := commit_target
1230edc18578SLingrui98  update.from_stage  := commit_stage
1231c2d1ec7dSLingrui98  update.spec_info   := commit_spec_meta
  // Reported when an update is sent while the entry's recorded CFI slot is not c_commited (debug_cfi).
12323f88c020SGuokai Chen  XSError(commit_valid && do_commit && debug_cfi, "\ncommit cfi can be non c_commited\n")
123309c6f1ddSLingrui98
123409c6f1ddSLingrui98  val commit_real_hit = commit_hit === h_hit
123509c6f1ddSLingrui98  val update_ftb_entry = update.ftb_entry
123609c6f1ddSLingrui98
  // FTBEntryGen builds the FTB entry carried by the update. Its inputs are the commit-stage view of the
  // entry: start address, previously stored FTB entry, predecode info, recorded CFI, target, real-hit
  // flag and the per-slot mispredict bits.
123709c6f1ddSLingrui98  val ftbEntryGen = Module(new FTBEntryGen).io
123809c6f1ddSLingrui98  ftbEntryGen.start_addr     := commit_pc_bundle.startAddr
123909c6f1ddSLingrui98  ftbEntryGen.old_entry      := commit_ftb_entry
124009c6f1ddSLingrui98  ftbEntryGen.pd             := commit_pd
124109c6f1ddSLingrui98  ftbEntryGen.cfiIndex       := commit_cfi
124209c6f1ddSLingrui98  ftbEntryGen.target         := commit_target
124309c6f1ddSLingrui98  ftbEntryGen.hit            := commit_real_hit
124409c6f1ddSLingrui98  ftbEntryGen.mispredict_vec := commit_mispredict
124509c6f1ddSLingrui98
  // Generator outputs are forwarded into the update bundle.
124609c6f1ddSLingrui98  update_ftb_entry         := ftbEntryGen.new_entry
124709c6f1ddSLingrui98  update.new_br_insert_pos := ftbEntryGen.new_br_insert_pos
124809c6f1ddSLingrui98  update.mispred_mask      := ftbEntryGen.mispred_mask
124909c6f1ddSLingrui98  update.old_entry         := ftbEntryGen.is_old_entry
1250edc18578SLingrui98  update.pred_hit          := commit_hit === h_hit || commit_hit === h_false_hit
1251803124a6SLingrui98  update.br_taken_mask     := ftbEntryGen.taken_mask
  // A branch slot of the new entry counts as committed when it is valid and the instruction at its
  // offset committed.
1252cc2d1573SEaston Man  update.br_committed      := (ftbEntryGen.new_entry.brValids zip ftbEntryGen.new_entry.brOffset) map {
1253cc2d1573SEaston Man    case (valid, offset) => valid && commit_instCommited(offset)
1254cc2d1573SEaston Man  }
1255803124a6SLingrui98  update.jmp_taken         := ftbEntryGen.jmp_taken
1256b37e4b45SLingrui98
1257803124a6SLingrui98  // update.full_pred.fromFtbEntry(ftbEntryGen.new_entry, update.pc)
1258803124a6SLingrui98  // update.full_pred.jalr_target := commit_target
1259803124a6SLingrui98  // update.full_pred.hit := true.B
1260803124a6SLingrui98  // when (update.full_pred.is_jalr) {
1261803124a6SLingrui98  //   update.full_pred.targets.last := commit_target
1262803124a6SLingrui98  // }
126309c6f1ddSLingrui98
1264e30430c2SJay  // ****************************************************************
1265e30430c2SJay  // *********************** to prefetch ****************************
1266e30430c2SJay  // ****************************************************************
1267*f9c51548Sssszwic  /**
1268*f9c51548Sssszwic    ******************************************************************************
1269*f9c51548Sssszwic    * prefetchPtr control
1270*f9c51548Sssszwic    * - 1. prefetchPtr plus 1 when toPrefetch fire and keep distance from bpuPtr more than 2
1271*f9c51548Sssszwic    * - 2. limit range of prefetchPtr is in [ifuPtr + minRange, ifuPtr + maxRange]
1272*f9c51548Sssszwic    * - 3. flush prefetchPtr when receive redirect from ifu or backend
1273*f9c51548Sssszwic    ******************************************************************************
1274*f9c51548Sssszwic    */
  // nextPrefetchPtr defaults to the current prefetchPtr and is overridden by the three `when` groups
  // below. Because a later connection wins, the effective priority is:
  // redirect flush > range clamp > increment on fire.
1275e30430c2SJay  val prefetchPtr = RegInit(FtqPtr(false.B, 0.U))
1276*f9c51548Sssszwic  val nextPrefetchPtr = WireInit(prefetchPtr)
1277e30430c2SJay
1278*f9c51548Sssszwic  prefetchPtr := nextPrefetchPtr
1279*f9c51548Sssszwic
1280*f9c51548Sssszwic  // TODO: consider req which cross cacheline
1281*f9c51548Sssszwic  when(io.toPrefetch.req.fire) {
1282*f9c51548Sssszwic    when(prefetchPtr < bpuPtr - 2.U) {
1283*f9c51548Sssszwic      nextPrefetchPtr := prefetchPtr + 1.U
1284a677d2cbSguohongyu    }
1285a677d2cbSguohongyu  }
1286a677d2cbSguohongyu
  // Clamp into [ifuPtr + minRangeFromIFUptr, ifuPtr + maxRangeFromIFUptr].
1287*f9c51548Sssszwic  when(prefetchPtr < ifuPtr + minRangeFromIFUptr.U) {
1288*f9c51548Sssszwic    nextPrefetchPtr := ifuPtr + minRangeFromIFUptr.U
1289*f9c51548Sssszwic  }.elsewhen(prefetchPtr > ifuPtr + maxRangeFromIFUptr.U) {
1290*f9c51548Sssszwic    nextPrefetchPtr := ifuPtr + maxRangeFromIFUptr.U
1291e30430c2SJay  }
1292e30430c2SJay
  // On any redirect, restart at the redirected entry's index plus minRangeFromIFUptr.
1293de7689fcSJay  when(redirectVec.map(r => r.valid).reduce(_||_)){
1294de7689fcSJay    val r = PriorityMux(redirectVec.map(r => (r.valid -> r.bits)))
1295*f9c51548Sssszwic    val next = r.ftqIdx + minRangeFromIFUptr.U
1296*f9c51548Sssszwic    nextPrefetchPtr := next
1297de7689fcSJay  }
1298de7689fcSJay
1299*f9c51548Sssszwic  // data from ftq_pc_mem has 1 cycle delay
  // The request is valid when, in the previous cycle, the entry at nextPrefetchPtr was in f_to_send state.
  // ftq_pc_mem is read at nextPrefetchPtr, and the start address it returns is registered into the request.
1300*f9c51548Sssszwic  io.toPrefetch.req.valid := RegNext(entry_fetch_status(nextPrefetchPtr.value) === f_to_send)
1301*f9c51548Sssszwic  ftq_pc_mem.io.other_raddrs(0) := nextPrefetchPtr.value
1302*f9c51548Sssszwic  io.toPrefetch.req.bits.target := RegNext(ftq_pc_mem.io.other_rdatas(0).startAddr)
1303378f00d9SJenius
1304*f9c51548Sssszwic  // record position relationship between ifuPtr, pfPtr and bpuPtr
  // Logged on every fired prefetch request while the Constantin record isWritePrefetchPtrTable is non-zero:
  // fromFtqPtr = distance bpuPtr -> prefetchPtr, fromIfuPtr = distance prefetchPtr -> ifuPtr.
1305*f9c51548Sssszwic  val isWritePrefetchPtrTable = WireInit(Constantin.createRecord("isWritePrefetchPtrTable" + p(XSCoreParamsKey).HartId.toString))
1306*f9c51548Sssszwic  val prefetchPtrTable = ChiselDB.createTable("PrefetchPtrTable" + p(XSCoreParamsKey).HartId.toString, new PrefetchPtrDB)
1307*f9c51548Sssszwic  val prefetchPtrDumpData = Wire(new PrefetchPtrDB)
1308*f9c51548Sssszwic  prefetchPtrDumpData.fromFtqPtr  := distanceBetween(bpuPtr, prefetchPtr)
1309*f9c51548Sssszwic  prefetchPtrDumpData.fromIfuPtr  := distanceBetween(prefetchPtr, ifuPtr)
1310378f00d9SJenius
1311*f9c51548Sssszwic  prefetchPtrTable.log(
1312*f9c51548Sssszwic    data = prefetchPtrDumpData,
1313*f9c51548Sssszwic    en = isWritePrefetchPtrTable.orR && io.toPrefetch.req.fire,
1314*f9c51548Sssszwic    site = "FTQ" + p(XSCoreParamsKey).HartId.toString,
1315*f9c51548Sssszwic    clock = clock,
1316*f9c51548Sssszwic    reset = reset
1317*f9c51548Sssszwic  )
1318*f9c51548Sssszwic
1319de7689fcSJay
132009c6f1ddSLingrui98  // ******************************************************************************
132109c6f1ddSLingrui98  // **************************** commit perf counters ****************************
132209c6f1ddSLingrui98  // ******************************************************************************
132309c6f1ddSLingrui98
  // Per-slot bit masks over the committing entry (one bit per instruction slot):
  //   commit_inst_mask    - slot committed and the entry is committing this cycle (do_commit)
  //   commit_mispred_mask - slot committed and was mispredicted
  //   commit_cfi_mask     - slot holds a branch (brMask) or the entry's jump (one-hot jmpOffset, if valid)
132409c6f1ddSLingrui98  val commit_inst_mask    = VecInit(commit_state.map(c => c === c_commited && do_commit)).asUInt
132509c6f1ddSLingrui98  val commit_mispred_mask = commit_mispredict.asUInt
132609c6f1ddSLingrui98  val commit_not_mispred_mask = ~commit_mispred_mask
132709c6f1ddSLingrui98
132809c6f1ddSLingrui98  val commit_br_mask = commit_pd.brMask.asUInt
132909c6f1ddSLingrui98  val commit_jmp_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.jmpInfo.valid.asTypeOf(UInt(1.W)))
133009c6f1ddSLingrui98  val commit_cfi_mask = (commit_br_mask | commit_jmp_mask)
133109c6f1ddSLingrui98
  // Committed control-flow instructions, split into correctly predicted and mispredicted ones.
133209c6f1ddSLingrui98  val mbpInstrs = commit_inst_mask & commit_cfi_mask
133309c6f1ddSLingrui98
133409c6f1ddSLingrui98  val mbpRights = mbpInstrs & commit_not_mispred_mask
133509c6f1ddSLingrui98  val mbpWrongs = mbpInstrs & commit_mispred_mask
133609c6f1ddSLingrui98
133709c6f1ddSLingrui98  io.bpuInfo.bpRight := PopCount(mbpRights)
133809c6f1ddSLingrui98  io.bpuInfo.bpWrong := PopCount(mbpWrongs)
133909c6f1ddSLingrui98
  // Branch trace: for every slot of the committing entry that committed and holds a control-flow
  // instruction, emit an XSDebug line and, while the Constantin record isWriteFTQTable is non-zero, a
  // ChiselDB row of type FtqDebugBundle.
1340da3bf434SMaxpicca-Li  val isWriteFTQTable = WireInit(Constantin.createRecord("isWriteFTQTable" + p(XSCoreParamsKey).HartId.toString))
134151532d8bSGuokai Chen  val ftqBranchTraceDB = ChiselDB.createTable("FTQTable" + p(XSCoreParamsKey).HartId.toString, new FtqDebugBundle)
134209c6f1ddSLingrui98  // Cfi Info
134309c6f1ddSLingrui98  for (i <- 0 until PredictWidth) {
    // pc of slot i: entry start address plus i instruction widths
134409c6f1ddSLingrui98    val pc = commit_pc_bundle.startAddr + (i * instBytes).U
134509c6f1ddSLingrui98    val v = commit_state(i) === c_commited
134609c6f1ddSLingrui98    val isBr = commit_pd.brMask(i)
134709c6f1ddSLingrui98    val isJmp = commit_pd.jmpInfo.valid && commit_pd.jmpOffset === i.U
134809c6f1ddSLingrui98    val isCfi = isBr || isJmp
    // taken: this slot is the entry's recorded (valid) CFI
134909c6f1ddSLingrui98    val isTaken = commit_cfi.valid && commit_cfi.bits === i.U
135009c6f1ddSLingrui98    val misPred = commit_mispredict(i)
1351c2ad24ebSLingrui98    // val ghist = commit_spec_meta.ghist.predHist
1352c2ad24ebSLingrui98    val histPtr = commit_spec_meta.histPtr
    // low 64 bits of the meta word, printed as the prediction cycle
135309c6f1ddSLingrui98    val predCycle = commit_meta.meta(63, 0)
135409c6f1ddSLingrui98    val target = commit_target
135509c6f1ddSLingrui98
    // brIdx / inFtbEntry: which valid branch slot of the updated FTB entry (if any) sits at offset i
135609c6f1ddSLingrui98    val brIdx = OHToUInt(Reverse(Cat(update_ftb_entry.brValids.zip(update_ftb_entry.brOffset).map{case(v, offset) => v && offset === i.U})))
135709c6f1ddSLingrui98    val inFtbEntry = update_ftb_entry.brValids.zip(update_ftb_entry.brOffset).map{case(v, offset) => v && offset === i.U}.reduce(_||_)
135809c6f1ddSLingrui98    val addIntoHist = ((commit_hit === h_hit) && inFtbEntry) || ((!(commit_hit === h_hit) && i.U === commit_cfi.bits && isBr && commit_cfi.valid))
135909c6f1ddSLingrui98    XSDebug(v && do_commit && isCfi, p"cfi_update: isBr(${isBr}) pc(${Hexadecimal(pc)}) " +
1360c2ad24ebSLingrui98    p"taken(${isTaken}) mispred(${misPred}) cycle($predCycle) hist(${histPtr.value}) " +
136109c6f1ddSLingrui98    p"startAddr(${Hexadecimal(commit_pc_bundle.startAddr)}) AddIntoHist(${addIntoHist}) " +
136209c6f1ddSLingrui98    p"brInEntry(${inFtbEntry}) brIdx(${brIdx}) target(${Hexadecimal(target)})\n")
136351532d8bSGuokai Chen
136451532d8bSGuokai Chen    val logbundle = Wire(new FtqDebugBundle)
136551532d8bSGuokai Chen    logbundle.pc := pc
136651532d8bSGuokai Chen    logbundle.target := target
136751532d8bSGuokai Chen    logbundle.isBr := isBr
136851532d8bSGuokai Chen    logbundle.isJmp := isJmp
136951532d8bSGuokai Chen    logbundle.isCall := isJmp && commit_pd.hasCall
137051532d8bSGuokai Chen    logbundle.isRet := isJmp && commit_pd.hasRet
137151532d8bSGuokai Chen    logbundle.misPred := misPred
137251532d8bSGuokai Chen    logbundle.isTaken := isTaken
137351532d8bSGuokai Chen    logbundle.predStage := commit_stage
137451532d8bSGuokai Chen
137551532d8bSGuokai Chen    ftqBranchTraceDB.log(
137651532d8bSGuokai Chen      data = logbundle /* hardware of type T */,
1377da3bf434SMaxpicca-Li      en = isWriteFTQTable.orR && v && do_commit && isCfi,
137851532d8bSGuokai Chen      site = "FTQ" + p(XSCoreParamsKey).HartId.toString,
137951532d8bSGuokai Chen      clock = clock,
138051532d8bSGuokai Chen      reset = reset
138151532d8bSGuokai Chen    )
138209c6f1ddSLingrui98  }
138309c6f1ddSLingrui98
  // Occupancy, stall/bubble and redirect counters. enq is the BPU response port; perf_redirect is the
  // backend redirect.
138409c6f1ddSLingrui98  val enq = io.fromBpu.resp
13852e1be6e1SSteve Gou  val perf_redirect = backendRedirect
138609c6f1ddSLingrui98
138709c6f1ddSLingrui98  XSPerfAccumulate("entry", validEntries)
138809c6f1ddSLingrui98  XSPerfAccumulate("bpu_to_ftq_stall", enq.valid && !enq.ready)
  // Backend redirects split by level: flushAfter is counted as a mispredict, flushItself(...) as a replay.
138909c6f1ddSLingrui98  XSPerfAccumulate("mispredictRedirect", perf_redirect.valid && RedirectLevel.flushAfter === perf_redirect.bits.level)
139009c6f1ddSLingrui98  XSPerfAccumulate("replayRedirect", perf_redirect.valid && RedirectLevel.flushItself(perf_redirect.bits.level))
139109c6f1ddSLingrui98  XSPerfAccumulate("predecodeRedirect", fromIfuRedirect.valid)
139209c6f1ddSLingrui98
139309c6f1ddSLingrui98  XSPerfAccumulate("to_ifu_bubble", io.toIfu.req.ready && !io.toIfu.req.valid)
139409c6f1ddSLingrui98
139509c6f1ddSLingrui98  XSPerfAccumulate("to_ifu_stall", io.toIfu.req.valid && !io.toIfu.req.ready)
139609c6f1ddSLingrui98  XSPerfAccumulate("from_bpu_real_bubble", !enq.valid && enq.ready && allowBpuIn)
  // bpuPtr === ifuPtr: no predicted entry is waiting to be fetched.
139712cedb6fSLingrui98  XSPerfAccumulate("bpu_to_ifu_bubble", bpuPtr === ifuPtr)
1398b2f6ed0aSSteve Gou  XSPerfAccumulate("bpu_to_ifu_bubble_when_ftq_full", (bpuPtr === ifuPtr) && isFull(bpuPtr, commPtr) && io.toIfu.req.ready)
139909c6f1ddSLingrui98
14009342624fSGao-Zeyu  XSPerfAccumulate("redirectAhead_ValidNum", io.fromBackend.ftqIdxAhead.map(_.valid).reduce(_|_))
14019342624fSGao-Zeyu  XSPerfAccumulate("fromBackendRedirect_ValidNum", io.fromBackend.redirect.valid)
14029342624fSGao-Zeyu  XSPerfAccumulate("toBpuRedirect_ValidNum", io.toBpu.redirect.valid)
14039342624fSGao-Zeyu
140409c6f1ddSLingrui98  val from_bpu = io.fromBpu.resp.bits
140509c6f1ddSLingrui98  val to_ifu = io.toIfu.req.bits
140609c6f1ddSLingrui98
140709c6f1ddSLingrui98
  // Histogram of the number of instructions committed per committing entry.
1408209a4cafSSteve Gou  XSPerfHistogram("commit_num_inst", PopCount(commit_inst_mask), do_commit, 0, PredictWidth+1, 1)
140909c6f1ddSLingrui98
141009c6f1ddSLingrui98
141109c6f1ddSLingrui98
141209c6f1ddSLingrui98
  // One-hot mask of the entry's jump slot, kept only when the predecode info flags the jump as
  // jal / jalr / call / ret respectively (all-zero otherwise).
141309c6f1ddSLingrui98  val commit_jal_mask  = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasJal.asTypeOf(UInt(1.W)))
141409c6f1ddSLingrui98  val commit_jalr_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasJalr.asTypeOf(UInt(1.W)))
141509c6f1ddSLingrui98  val commit_call_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasCall.asTypeOf(UInt(1.W)))
141609c6f1ddSLingrui98  val commit_ret_mask  = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasRet.asTypeOf(UInt(1.W)))
141709c6f1ddSLingrui98
141809c6f1ddSLingrui98
  // Correct / wrong predictions split by instruction kind:
  // B = conditional branch, J = jal, I = jalr, C = call, R = ret.
141909c6f1ddSLingrui98  val mbpBRights = mbpRights & commit_br_mask
142009c6f1ddSLingrui98  val mbpJRights = mbpRights & commit_jal_mask
142109c6f1ddSLingrui98  val mbpIRights = mbpRights & commit_jalr_mask
142209c6f1ddSLingrui98  val mbpCRights = mbpRights & commit_call_mask
142309c6f1ddSLingrui98  val mbpRRights = mbpRights & commit_ret_mask
142409c6f1ddSLingrui98
142509c6f1ddSLingrui98  val mbpBWrongs = mbpWrongs & commit_br_mask
142609c6f1ddSLingrui98  val mbpJWrongs = mbpWrongs & commit_jal_mask
142709c6f1ddSLingrui98  val mbpIWrongs = mbpWrongs & commit_jalr_mask
142809c6f1ddSLingrui98  val mbpCWrongs = mbpWrongs & commit_call_mask
142909c6f1ddSLingrui98  val mbpRWrongs = mbpWrongs & commit_ret_mask
143009c6f1ddSLingrui98
  // Prediction stage recorded for the committing entry, delayed by one cycle (same expression as commit_stage).
14311d7e5011SLingrui98  val commit_pred_stage = RegNext(pred_stage(commPtr.value))
14321d7e5011SLingrui98
/** Splits a per-slot bit mask by the prediction stage recorded for the committing entry.
  *
  * @param src  bit mask, one bit per instruction slot
  * @param name prefix of the generated counter names
  * @return map with one entry per stage k = 1..numBpStages, keyed "<name>_stage_<k>"; the value is the
  *         number of set bits of `src` when commit_pred_stage equals BP_STAGES(k - 1), and zero otherwise
  */
def pred_stage_map(src: UInt, name: String) = {
  val countersPerStage = for (stage <- 0 until numBpStages) yield {
    val predictedByStage = commit_pred_stage === BP_STAGES(stage)
    f"${name}_stage_${stage+1}" -> PopCount(src.asBools.map(_ && predictedByStage))
  }
  countersPerStage.toMap
}
14381d7e5011SLingrui98
  // Per-stage breakdown of wrong and correct predictions: overall, conditional branches only, jalr only.
14391d7e5011SLingrui98  val mispred_stage_map      = pred_stage_map(mbpWrongs,  "mispredict")
14401d7e5011SLingrui98  val br_mispred_stage_map   = pred_stage_map(mbpBWrongs, "br_mispredict")
14411d7e5011SLingrui98  val jalr_mispred_stage_map = pred_stage_map(mbpIWrongs, "jalr_mispredict")
14421d7e5011SLingrui98  val correct_stage_map      = pred_stage_map(mbpRights,  "correct")
14431d7e5011SLingrui98  val br_correct_stage_map   = pred_stage_map(mbpBRights, "br_correct")
14441d7e5011SLingrui98  val jalr_correct_stage_map = pred_stage_map(mbpIRights, "jalr_correct")
14451d7e5011SLingrui98
  // FTB update statistics. u(cond) qualifies a condition with "a BPU update is being sent this cycle".
144609c6f1ddSLingrui98  val update_valid = io.toBpu.update.valid
144709c6f1ddSLingrui98  def u(cond: Bool) = update_valid && cond
144809c6f1ddSLingrui98  val ftb_false_hit = u(update.false_hit)
144965fddcf0Szoujr  // assert(!ftb_false_hit)
145009c6f1ddSLingrui98  val ftb_hit = u(commit_hit === h_hit)
145109c6f1ddSLingrui98
  // Newly initialised entries, classified by whether the generated entry has a jump and/or a first branch.
145209c6f1ddSLingrui98  val ftb_new_entry = u(ftbEntryGen.is_init_entry)
1453b37e4b45SLingrui98  val ftb_new_entry_only_br = ftb_new_entry && !update_ftb_entry.jmpValid
1454b37e4b45SLingrui98  val ftb_new_entry_only_jmp = ftb_new_entry && !update_ftb_entry.brValids(0)
1455b37e4b45SLingrui98  val ftb_new_entry_has_br_and_jmp = ftb_new_entry && update_ftb_entry.brValids(0) && update_ftb_entry.jmpValid
145609c6f1ddSLingrui98
145709c6f1ddSLingrui98  val ftb_old_entry = u(ftbEntryGen.is_old_entry)
145809c6f1ddSLingrui98
  // Modified entries: a new branch was added, the jalr target changed, or the always-taken bits changed.
145909c6f1ddSLingrui98  val ftb_modified_entry = u(ftbEntryGen.is_new_br || ftbEntryGen.is_jalr_target_modified || ftbEntryGen.is_always_taken_modified)
146009c6f1ddSLingrui98  val ftb_modified_entry_new_br = u(ftbEntryGen.is_new_br)
1461d2b20d1aSTang Haojin  val ftb_modified_entry_ifu_redirected = u(ifuRedirected(do_commit_ptr.value))
146209c6f1ddSLingrui98  val ftb_modified_entry_jalr_target_modified = u(ftbEntryGen.is_jalr_target_modified)
146309c6f1ddSLingrui98  val ftb_modified_entry_br_full = ftb_modified_entry && ftbEntryGen.is_br_full
146409c6f1ddSLingrui98  val ftb_modified_entry_always_taken = ftb_modified_entry && ftbEntryGen.is_always_taken_modified
146509c6f1ddSLingrui98
// Length of an FTB entry relative to `pc`: the entry's fall-through address
// (entry.getFallThrough(pc)) minus pc, shifted right by instOffsetBits.
// NOTE(review): the shift presumably converts a byte distance into instruction
// slots -- confirm against the definition of instOffsetBits.
1466209a4cafSSteve Gou  def getFtbEntryLen(pc: UInt, entry: FTBEntry) = (entry.getFallThrough(pc) - pc) >> instOffsetBits
// Length of the entry generated by ftbEntryGen for the current update, fed to two
// histograms that differ only in name and in the flag passed as third argument
// (ftb_new_entry vs. ftb_modified_entry).
// NOTE(review): the third argument is presumably the sample enable and the trailing
// (0, PredictWidth+1, 1) the bucket start/stop/step -- confirm against XSPerfHistogram.
1467209a4cafSSteve Gou  val gen_ftb_entry_len = getFtbEntryLen(update.pc, ftbEntryGen.new_entry)
1468209a4cafSSteve Gou  XSPerfHistogram("ftb_init_entry_len", gen_ftb_entry_len, ftb_new_entry, 0, PredictWidth+1, 1)
1469209a4cafSSteve Gou  XSPerfHistogram("ftb_modified_entry_len", gen_ftb_entry_len, ftb_modified_entry, 0, PredictWidth+1, 1)
// Same length computation for the BPU's last-stage FTB entry, using from_bpu.s3.pc(0)
// and passing from_bpu.s3.valid(0) as the third histogram argument.
1470209a4cafSSteve Gou  val s3_ftb_entry_len = getFtbEntryLen(from_bpu.s3.pc(0), from_bpu.last_stage_ftb_entry)
1471209a4cafSSteve Gou  XSPerfHistogram("s3_ftb_entry_len", s3_ftb_entry_len, from_bpu.s3.valid(0), 0, PredictWidth+1, 1)
147209c6f1ddSLingrui98
// Histogram of validEntries with a constant-true third argument, over 0 .. FtqSize.
1473209a4cafSSteve Gou  XSPerfHistogram("ftq_has_entry", validEntries, true.B, 0, FtqSize+1, 1)
147409c6f1ddSLingrui98
// Counter-name -> per-cycle increment table. The first group counts set bits in the
// mbp* vectors; the second group wraps the single-bit ftb_* flags in PopCount so all
// values share the same form. The per-stage maps built earlier are appended with ++.
// NOTE(review): the letter after "Bp" selects a category; B and I correspond to the
// "br" / "jalr" labels used for the stage maps, while J, C and R presumably mean
// jal, call and ret -- confirm against the mbp* definitions.
147509c6f1ddSLingrui98  val perfCountsMap = Map(
147609c6f1ddSLingrui98    "BpInstr" -> PopCount(mbpInstrs),
// BpBInstr counts positions set in either mbpBRights or mbpBWrongs.
147709c6f1ddSLingrui98    "BpBInstr" -> PopCount(mbpBRights | mbpBWrongs),
147809c6f1ddSLingrui98    "BpRight"  -> PopCount(mbpRights),
147909c6f1ddSLingrui98    "BpWrong"  -> PopCount(mbpWrongs),
148009c6f1ddSLingrui98    "BpBRight" -> PopCount(mbpBRights),
148109c6f1ddSLingrui98    "BpBWrong" -> PopCount(mbpBWrongs),
148209c6f1ddSLingrui98    "BpJRight" -> PopCount(mbpJRights),
148309c6f1ddSLingrui98    "BpJWrong" -> PopCount(mbpJWrongs),
148409c6f1ddSLingrui98    "BpIRight" -> PopCount(mbpIRights),
148509c6f1ddSLingrui98    "BpIWrong" -> PopCount(mbpIWrongs),
148609c6f1ddSLingrui98    "BpCRight" -> PopCount(mbpCRights),
148709c6f1ddSLingrui98    "BpCWrong" -> PopCount(mbpCWrongs),
148809c6f1ddSLingrui98    "BpRRight" -> PopCount(mbpRRights),
148909c6f1ddSLingrui98    "BpRWrong" -> PopCount(mbpRWrongs),
149009c6f1ddSLingrui98
// FTB update events. Note the key "ftb_jalr_target_modified" does not carry the
// "modified_entry" infix that the flag name has.
149109c6f1ddSLingrui98    "ftb_false_hit"                -> PopCount(ftb_false_hit),
149209c6f1ddSLingrui98    "ftb_hit"                      -> PopCount(ftb_hit),
149309c6f1ddSLingrui98    "ftb_new_entry"                -> PopCount(ftb_new_entry),
149409c6f1ddSLingrui98    "ftb_new_entry_only_br"        -> PopCount(ftb_new_entry_only_br),
149509c6f1ddSLingrui98    "ftb_new_entry_only_jmp"       -> PopCount(ftb_new_entry_only_jmp),
149609c6f1ddSLingrui98    "ftb_new_entry_has_br_and_jmp" -> PopCount(ftb_new_entry_has_br_and_jmp),
149709c6f1ddSLingrui98    "ftb_old_entry"                -> PopCount(ftb_old_entry),
149809c6f1ddSLingrui98    "ftb_modified_entry"           -> PopCount(ftb_modified_entry),
149909c6f1ddSLingrui98    "ftb_modified_entry_new_br"    -> PopCount(ftb_modified_entry_new_br),
150009c6f1ddSLingrui98    "ftb_jalr_target_modified"     -> PopCount(ftb_modified_entry_jalr_target_modified),
150109c6f1ddSLingrui98    "ftb_modified_entry_br_full"   -> PopCount(ftb_modified_entry_br_full),
150209c6f1ddSLingrui98    "ftb_modified_entry_always_taken" -> PopCount(ftb_modified_entry_always_taken)
1503209a4cafSSteve Gou  ) ++ mispred_stage_map ++ br_mispred_stage_map ++ jalr_mispred_stage_map ++
15041d7e5011SLingrui98       correct_stage_map ++ br_correct_stage_map ++ jalr_correct_stage_map
150509c6f1ddSLingrui98
// Register every (name, value) pair of the merged table with XSPerfAccumulate.
150609c6f1ddSLingrui98  for((key, value) <- perfCountsMap) {
150709c6f1ddSLingrui98    XSPerfAccumulate(key, value)
150809c6f1ddSLingrui98  }
150909c6f1ddSLingrui98
151009c6f1ddSLingrui98  // --------------------------- Debug --------------------------------
151109c6f1ddSLingrui98  // XSDebug(enq_fire, p"enq! " + io.fromBpu.resp.bits.toPrintable)
// Debug traces. The first argument of each XSDebug call is presumably the print
// condition (confirm against XSDebug); the second is the Printable message.
// Request handed to the IFU, conditioned on io.toIfu.req.fire.
151209c6f1ddSLingrui98  XSDebug(io.toIfu.req.fire, p"fire to ifu " + io.toIfu.req.bits.toPrintable)
// Commit pointer of the entry being dequeued, conditioned on do_commit.
151309c6f1ddSLingrui98  XSDebug(do_commit, p"deq! [ptr] $do_commit_ptr\n")
// The four queue pointers, with a constant-true condition.
151409c6f1ddSLingrui98  XSDebug(true.B, p"[bpuPtr] $bpuPtr, [ifuPtr] $ifuPtr, [ifuWbPtr] $ifuWbPtr [commPtr] $commPtr\n")
// valid/ready of the BPU response input and of the IFU request output.
151509c6f1ddSLingrui98  XSDebug(true.B, p"[in] v:${io.fromBpu.resp.valid} r:${io.fromBpu.resp.ready} " +
151609c6f1ddSLingrui98    p"[out] v:${io.toIfu.req.valid} r:${io.toIfu.req.ready}\n")
// CFI index, PC bundle and target (printed in hexadecimal) of the committing entry.
151709c6f1ddSLingrui98  XSDebug(do_commit, p"[deq info] cfiIndex: $commit_cfi, $commit_pc_bundle, target: ${Hexadecimal(commit_target)}\n")
151809c6f1ddSLingrui98
151909c6f1ddSLingrui98  //   def ubtbCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
152009c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
152109c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
152209c6f1ddSLingrui98  //       Mux(valid && pd.isBr,
152309c6f1ddSLingrui98  //         isWrong ^ Mux(ans.hit.asBool,
152409c6f1ddSLingrui98  //           Mux(ans.taken.asBool, taken && ans.target === commitEntry.target,
152509c6f1ddSLingrui98  //           !taken),
152609c6f1ddSLingrui98  //         !taken),
152709c6f1ddSLingrui98  //       false.B)
152809c6f1ddSLingrui98  //     }
152909c6f1ddSLingrui98  //   }
153009c6f1ddSLingrui98
153109c6f1ddSLingrui98  //   def btbCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
153209c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
153309c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
153409c6f1ddSLingrui98  //       Mux(valid && pd.isBr,
153509c6f1ddSLingrui98  //         isWrong ^ Mux(ans.hit.asBool,
153609c6f1ddSLingrui98  //           Mux(ans.taken.asBool, taken && ans.target === commitEntry.target,
153709c6f1ddSLingrui98  //           !taken),
153809c6f1ddSLingrui98  //         !taken),
153909c6f1ddSLingrui98  //       false.B)
154009c6f1ddSLingrui98  //     }
154109c6f1ddSLingrui98  //   }
154209c6f1ddSLingrui98
154309c6f1ddSLingrui98  //   def tageCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
154409c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
154509c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
154609c6f1ddSLingrui98  //       Mux(valid && pd.isBr,
154709c6f1ddSLingrui98  //         isWrong ^ (ans.taken.asBool === taken),
154809c6f1ddSLingrui98  //       false.B)
154909c6f1ddSLingrui98  //     }
155009c6f1ddSLingrui98  //   }
155109c6f1ddSLingrui98
155209c6f1ddSLingrui98  //   def loopCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
155309c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
155409c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
155509c6f1ddSLingrui98  //       Mux(valid && (pd.isBr) && ans.hit.asBool,
155609c6f1ddSLingrui98  //         isWrong ^ (!taken),
155709c6f1ddSLingrui98  //           false.B)
155809c6f1ddSLingrui98  //     }
155909c6f1ddSLingrui98  //   }
156009c6f1ddSLingrui98
156109c6f1ddSLingrui98  //   def rasCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = {
156209c6f1ddSLingrui98  //     commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map {
156309c6f1ddSLingrui98  //       case (((valid, pd), ans), taken) =>
156409c6f1ddSLingrui98  //       Mux(valid && pd.isRet.asBool /*&& taken*/ && ans.hit.asBool,
156509c6f1ddSLingrui98  //         isWrong ^ (ans.target === commitEntry.target),
156609c6f1ddSLingrui98  //           false.B)
156709c6f1ddSLingrui98  //     }
156809c6f1ddSLingrui98  //   }
156909c6f1ddSLingrui98
157009c6f1ddSLingrui98  //   val ubtbRights = ubtbCheck(commitEntry, commitEntry.metas.map(_.ubtbAns), false.B)
157109c6f1ddSLingrui98  //   val ubtbWrongs = ubtbCheck(commitEntry, commitEntry.metas.map(_.ubtbAns), true.B)
157209c6f1ddSLingrui98  //   // btb and ubtb pred jal and jalr as well
157309c6f1ddSLingrui98  //   val btbRights = btbCheck(commitEntry, commitEntry.metas.map(_.btbAns), false.B)
157409c6f1ddSLingrui98  //   val btbWrongs = btbCheck(commitEntry, commitEntry.metas.map(_.btbAns), true.B)
157509c6f1ddSLingrui98  //   val tageRights = tageCheck(commitEntry, commitEntry.metas.map(_.tageAns), false.B)
157609c6f1ddSLingrui98  //   val tageWrongs = tageCheck(commitEntry, commitEntry.metas.map(_.tageAns), true.B)
157709c6f1ddSLingrui98
157809c6f1ddSLingrui98  //   val loopRights = loopCheck(commitEntry, commitEntry.metas.map(_.loopAns), false.B)
157909c6f1ddSLingrui98  //   val loopWrongs = loopCheck(commitEntry, commitEntry.metas.map(_.loopAns), true.B)
158009c6f1ddSLingrui98
158109c6f1ddSLingrui98  //   val rasRights = rasCheck(commitEntry, commitEntry.metas.map(_.rasAns), false.B)
158209c6f1ddSLingrui98  //   val rasWrongs = rasCheck(commitEntry, commitEntry.metas.map(_.rasAns), true.B)
15831ca0e4f3SYinan Xu
// (name, signal) pairs handed to generatePerfEvent() below. The event names are
// padded with trailing spaces to a fixed width; the padding is part of the string.
// The first eight entries are single-bit conditions, the rest are PopCount values.
// The Bp* and ftb_* entries repeat values that are also registered through
// perfCountsMap (there under unpadded names).
// NOTE(review): perfEvents is presumably the member required by a perf-event trait
// mixed into this module -- confirm against the class header, which is out of view.
1584cd365d4cSrvcoresjw  val perfEvents = Seq(
1585cd365d4cSrvcoresjw    ("bpu_s2_redirect        ", bpu_s2_redirect                                                             ),
1586cb4f77ceSLingrui98    ("bpu_s3_redirect        ", bpu_s3_redirect                                                             ),
// BPU has a valid response but the enqueue port is not ready.
1587cd365d4cSrvcoresjw    ("bpu_to_ftq_stall       ", enq.valid && ~enq.ready                                                     ),
// perf_redirect split by redirect level: level equal to flushAfter vs. flushItself(level).
1588cd365d4cSrvcoresjw    ("mispredictRedirect     ", perf_redirect.valid && RedirectLevel.flushAfter === perf_redirect.bits.level),
1589cd365d4cSrvcoresjw    ("replayRedirect         ", perf_redirect.valid && RedirectLevel.flushItself(perf_redirect.bits.level)  ),
1590cd365d4cSrvcoresjw    ("predecodeRedirect      ", fromIfuRedirect.valid                                                       ),
// IFU is ready for a request but none is valid.
1591cd365d4cSrvcoresjw    ("to_ifu_bubble          ", io.toIfu.req.ready && !io.toIfu.req.valid                                   ),
// Enqueue port is ready and allowBpuIn is set, but the BPU offers no valid response.
1592cd365d4cSrvcoresjw    ("from_bpu_real_bubble   ", !enq.valid && enq.ready && allowBpuIn                                       ),
1593cd365d4cSrvcoresjw    ("BpInstr                ", PopCount(mbpInstrs)                                                         ),
1594cd365d4cSrvcoresjw    ("BpBInstr               ", PopCount(mbpBRights | mbpBWrongs)                                           ),
1595cd365d4cSrvcoresjw    ("BpRight                ", PopCount(mbpRights)                                                         ),
1596cd365d4cSrvcoresjw    ("BpWrong                ", PopCount(mbpWrongs)                                                         ),
1597cd365d4cSrvcoresjw    ("BpBRight               ", PopCount(mbpBRights)                                                        ),
1598cd365d4cSrvcoresjw    ("BpBWrong               ", PopCount(mbpBWrongs)                                                        ),
1599cd365d4cSrvcoresjw    ("BpJRight               ", PopCount(mbpJRights)                                                        ),
1600cd365d4cSrvcoresjw    ("BpJWrong               ", PopCount(mbpJWrongs)                                                        ),
1601cd365d4cSrvcoresjw    ("BpIRight               ", PopCount(mbpIRights)                                                        ),
1602cd365d4cSrvcoresjw    ("BpIWrong               ", PopCount(mbpIWrongs)                                                        ),
1603cd365d4cSrvcoresjw    ("BpCRight               ", PopCount(mbpCRights)                                                        ),
1604cd365d4cSrvcoresjw    ("BpCWrong               ", PopCount(mbpCWrongs)                                                        ),
1605cd365d4cSrvcoresjw    ("BpRRight               ", PopCount(mbpRRights)                                                        ),
1606cd365d4cSrvcoresjw    ("BpRWrong               ", PopCount(mbpRWrongs)                                                        ),
1607cd365d4cSrvcoresjw    ("ftb_false_hit          ", PopCount(ftb_false_hit)                                                     ),
1608cd365d4cSrvcoresjw    ("ftb_hit                ", PopCount(ftb_hit)                                                           ),
1609cd365d4cSrvcoresjw  )
// Called after perfEvents is defined; keep this ordering.
16101ca0e4f3SYinan Xu  generatePerfEvent()
161109c6f1ddSLingrui98}